1/*
2 *
3 * This file is provided under a dual BSD/GPLv2 license. When using or
4 * redistributing this file, you may do so under either license.
5 *
6 * GPL LICENSE SUMMARY
7 *
8 * Copyright(c) 2015 Intel Corporation.
9 *
10 * This program is free software; you can redistribute it and/or modify
11 * it under the terms of version 2 of the GNU General Public License as
12 * published by the Free Software Foundation.
13 *
14 * This program is distributed in the hope that it will be useful, but
15 * WITHOUT ANY WARRANTY; without even the implied warranty of
16 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
17 * General Public License for more details.
18 *
19 * BSD LICENSE
20 *
21 * Copyright(c) 2015 Intel Corporation.
22 *
23 * Redistribution and use in source and binary forms, with or without
24 * modification, are permitted provided that the following conditions
25 * are met:
26 *
27 * - Redistributions of source code must retain the above copyright
28 * notice, this list of conditions and the following disclaimer.
29 * - Redistributions in binary form must reproduce the above copyright
30 * notice, this list of conditions and the following disclaimer in
31 * the documentation and/or other materials provided with the
32 * distribution.
33 * - Neither the name of Intel Corporation nor the names of its
34 * contributors may be used to endorse or promote products derived
35 * from this software without specific prior written permission.
36 *
37 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
38 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
39 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
40 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
41 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
42 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
43 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
44 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
45 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
46 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
47 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
48 *
49 */
50
51/*
52 * This file contains all of the code that is specific to the HFI chip
53 */
54
55#include <linux/pci.h>
56#include <linux/delay.h>
57#include <linux/interrupt.h>
58#include <linux/module.h>
59
60#include "hfi.h"
61#include "trace.h"
62#include "mad.h"
63#include "pio.h"
64#include "sdma.h"
65#include "eprom.h"
66
67#define NUM_IB_PORTS 1
68
69uint kdeth_qp;
70module_param_named(kdeth_qp, kdeth_qp, uint, S_IRUGO);
71MODULE_PARM_DESC(kdeth_qp, "Set the KDETH queue pair prefix");
72
73uint num_vls = HFI1_MAX_VLS_SUPPORTED;
74module_param(num_vls, uint, S_IRUGO);
75MODULE_PARM_DESC(num_vls, "Set number of Virtual Lanes to use (1-8)");
76
77/*
78 * Default time to aggregate two 10K packets from the idle state
79 * (timer not running). The timer starts at the end of the first packet,
80 * so only the time for one 10K packet and header plus a bit extra is needed.
 81 * 10 * 1024 + 64 header bytes = 10304 bytes
 82 * 10304 bytes / 12.5 GB/s = 824.32 ns
83 */
84uint rcv_intr_timeout = (824 + 16); /* 16 is for coalescing interrupt */
85module_param(rcv_intr_timeout, uint, S_IRUGO);
86MODULE_PARM_DESC(rcv_intr_timeout, "Receive interrupt mitigation timeout in ns");
87
88uint rcv_intr_count = 16; /* same as qib */
89module_param(rcv_intr_count, uint, S_IRUGO);
90MODULE_PARM_DESC(rcv_intr_count, "Receive interrupt mitigation count");
91
92ushort link_crc_mask = SUPPORTED_CRCS;
93module_param(link_crc_mask, ushort, S_IRUGO);
94MODULE_PARM_DESC(link_crc_mask, "CRCs to use on the link");
95
96uint loopback;
97module_param_named(loopback, loopback, uint, S_IRUGO);
 98MODULE_PARM_DESC(loopback, "Put into loopback mode (1 = serdes, 3 = external cable)");
99
100/* Other driver tunables */
101uint rcv_intr_dynamic = 1; /* enable dynamic mode for rcv int mitigation */
102static ushort crc_14b_sideband = 1;
103static uint use_flr = 1;
104uint quick_linkup; /* skip LNI */
105
106struct flag_table {
107 u64 flag; /* the flag */
108 char *str; /* description string */
109 u16 extra; /* extra information */
110 u16 unused0;
111 u32 unused1;
112};
113
114/* str must be a string constant */
115#define FLAG_ENTRY(str, extra, flag) {flag, str, extra}
116#define FLAG_ENTRY0(str, flag) {flag, str, 0}
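/*
 * Example expansion, for reference: with the struct flag_table layout
 * above, FLAG_ENTRY0("CceCsrParityErr", smask) yields the initializer
 * { smask, "CceCsrParityErr", 0 }, while the three-argument FLAG_ENTRY()
 * carries its "extra" word (typically an OR of the SEC_* consequence
 * bits defined below) in the third member.
 */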
117
118/* Send Error Consequences */
119#define SEC_WRITE_DROPPED 0x1
120#define SEC_PACKET_DROPPED 0x2
121#define SEC_SC_HALTED 0x4 /* per-context only */
122#define SEC_SPC_FREEZE 0x8 /* per-HFI only */
123
124#define MIN_KERNEL_KCTXTS 2
125#define FIRST_KERNEL_KCTXT 1
126#define NUM_MAP_REGS 32
127
128/* Bit offset into the GUID which carries HFI id information */
129#define GUID_HFI_INDEX_SHIFT 39
130
131/* extract the emulation revision */
132#define emulator_rev(dd) ((dd)->irev >> 8)
133/* parallel and serial emulation versions are 3 and 4 respectively */
134#define is_emulator_p(dd) ((((dd)->irev) & 0xf) == 3)
135#define is_emulator_s(dd) ((((dd)->irev) & 0xf) == 4)
136
137/* RSM fields */
138
139/* packet type */
140#define IB_PACKET_TYPE 2ull
141#define QW_SHIFT 6ull
142/* QPN[7..1] */
143#define QPN_WIDTH 7ull
144
145/* LRH.BTH: QW 0, OFFSET 48 - for match */
146#define LRH_BTH_QW 0ull
147#define LRH_BTH_BIT_OFFSET 48ull
148#define LRH_BTH_OFFSET(off) ((LRH_BTH_QW << QW_SHIFT) | (off))
149#define LRH_BTH_MATCH_OFFSET LRH_BTH_OFFSET(LRH_BTH_BIT_OFFSET)
150#define LRH_BTH_SELECT
151#define LRH_BTH_MASK 3ull
152#define LRH_BTH_VALUE 2ull
153
154/* LRH.SC[3..0] QW 0, OFFSET 56 - for match */
155#define LRH_SC_QW 0ull
156#define LRH_SC_BIT_OFFSET 56ull
157#define LRH_SC_OFFSET(off) ((LRH_SC_QW << QW_SHIFT) | (off))
158#define LRH_SC_MATCH_OFFSET LRH_SC_OFFSET(LRH_SC_BIT_OFFSET)
159#define LRH_SC_MASK 128ull
160#define LRH_SC_VALUE 0ull
161
162/* SC[n..0] QW 0, OFFSET 60 - for select */
163#define LRH_SC_SELECT_OFFSET ((LRH_SC_QW << QW_SHIFT) | (60ull))
164
165/* QPN[m+n:1] QW 1, OFFSET 1 */
166#define QPN_SELECT_OFFSET ((1ull << QW_SHIFT) | (1ull))
167
168/* defines to build power on SC2VL table */
169#define SC2VL_VAL( \
170 num, \
171 sc0, sc0val, \
172 sc1, sc1val, \
173 sc2, sc2val, \
174 sc3, sc3val, \
175 sc4, sc4val, \
176 sc5, sc5val, \
177 sc6, sc6val, \
178 sc7, sc7val) \
179( \
180 ((u64)(sc0val) << SEND_SC2VLT##num##_SC##sc0##_SHIFT) | \
181 ((u64)(sc1val) << SEND_SC2VLT##num##_SC##sc1##_SHIFT) | \
182 ((u64)(sc2val) << SEND_SC2VLT##num##_SC##sc2##_SHIFT) | \
183 ((u64)(sc3val) << SEND_SC2VLT##num##_SC##sc3##_SHIFT) | \
184 ((u64)(sc4val) << SEND_SC2VLT##num##_SC##sc4##_SHIFT) | \
185 ((u64)(sc5val) << SEND_SC2VLT##num##_SC##sc5##_SHIFT) | \
186 ((u64)(sc6val) << SEND_SC2VLT##num##_SC##sc6##_SHIFT) | \
187 ((u64)(sc7val) << SEND_SC2VLT##num##_SC##sc7##_SHIFT) \
188)
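/*
 * Usage sketch (illustrative): SC2VL_VAL(0, 0, 0, 1, 1, 2, 2, 3, 3,
 * 4, 4, 5, 5, 6, 6, 7, 7) ORs each scNval into the field selected by
 * the corresponding SEND_SC2VLT0_SC<n>_SHIFT constant, producing one
 * 64-bit value for the SEND_SC2VLT0 CSR that maps SC0-SC7 to VL0-VL7
 * one-to-one. The power-on SC2VL tables are built from invocations of
 * exactly this shape.
 */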
189
190#define DC_SC_VL_VAL( \
191 range, \
192 e0, e0val, \
193 e1, e1val, \
194 e2, e2val, \
195 e3, e3val, \
196 e4, e4val, \
197 e5, e5val, \
198 e6, e6val, \
199 e7, e7val, \
200 e8, e8val, \
201 e9, e9val, \
202 e10, e10val, \
203 e11, e11val, \
204 e12, e12val, \
205 e13, e13val, \
206 e14, e14val, \
207 e15, e15val) \
208( \
209 ((u64)(e0val) << DCC_CFG_SC_VL_TABLE_##range##_ENTRY##e0##_SHIFT) | \
210 ((u64)(e1val) << DCC_CFG_SC_VL_TABLE_##range##_ENTRY##e1##_SHIFT) | \
211 ((u64)(e2val) << DCC_CFG_SC_VL_TABLE_##range##_ENTRY##e2##_SHIFT) | \
212 ((u64)(e3val) << DCC_CFG_SC_VL_TABLE_##range##_ENTRY##e3##_SHIFT) | \
213 ((u64)(e4val) << DCC_CFG_SC_VL_TABLE_##range##_ENTRY##e4##_SHIFT) | \
214 ((u64)(e5val) << DCC_CFG_SC_VL_TABLE_##range##_ENTRY##e5##_SHIFT) | \
215 ((u64)(e6val) << DCC_CFG_SC_VL_TABLE_##range##_ENTRY##e6##_SHIFT) | \
216 ((u64)(e7val) << DCC_CFG_SC_VL_TABLE_##range##_ENTRY##e7##_SHIFT) | \
217 ((u64)(e8val) << DCC_CFG_SC_VL_TABLE_##range##_ENTRY##e8##_SHIFT) | \
218 ((u64)(e9val) << DCC_CFG_SC_VL_TABLE_##range##_ENTRY##e9##_SHIFT) | \
219 ((u64)(e10val) << DCC_CFG_SC_VL_TABLE_##range##_ENTRY##e10##_SHIFT) | \
220 ((u64)(e11val) << DCC_CFG_SC_VL_TABLE_##range##_ENTRY##e11##_SHIFT) | \
221 ((u64)(e12val) << DCC_CFG_SC_VL_TABLE_##range##_ENTRY##e12##_SHIFT) | \
222 ((u64)(e13val) << DCC_CFG_SC_VL_TABLE_##range##_ENTRY##e13##_SHIFT) | \
223 ((u64)(e14val) << DCC_CFG_SC_VL_TABLE_##range##_ENTRY##e14##_SHIFT) | \
224 ((u64)(e15val) << DCC_CFG_SC_VL_TABLE_##range##_ENTRY##e15##_SHIFT) \
225)
226
227/* all CceStatus sub-block freeze bits */
228#define ALL_FROZE (CCE_STATUS_SDMA_FROZE_SMASK \
229 | CCE_STATUS_RXE_FROZE_SMASK \
230 | CCE_STATUS_TXE_FROZE_SMASK \
231 | CCE_STATUS_TXE_PIO_FROZE_SMASK)
232/* all CceStatus sub-block TXE pause bits */
233#define ALL_TXE_PAUSE (CCE_STATUS_TXE_PIO_PAUSED_SMASK \
234 | CCE_STATUS_TXE_PAUSED_SMASK \
235 | CCE_STATUS_SDMA_PAUSED_SMASK)
236/* all CceStatus sub-block RXE pause bits */
237#define ALL_RXE_PAUSE CCE_STATUS_RXE_PAUSED_SMASK
238
239/*
240 * CCE Error flags.
241 */
242static struct flag_table cce_err_status_flags[] = {
243/* 0*/ FLAG_ENTRY0("CceCsrParityErr",
244 CCE_ERR_STATUS_CCE_CSR_PARITY_ERR_SMASK),
245/* 1*/ FLAG_ENTRY0("CceCsrReadBadAddrErr",
246 CCE_ERR_STATUS_CCE_CSR_READ_BAD_ADDR_ERR_SMASK),
247/* 2*/ FLAG_ENTRY0("CceCsrWriteBadAddrErr",
248 CCE_ERR_STATUS_CCE_CSR_WRITE_BAD_ADDR_ERR_SMASK),
249/* 3*/ FLAG_ENTRY0("CceTrgtAsyncFifoParityErr",
250 CCE_ERR_STATUS_CCE_TRGT_ASYNC_FIFO_PARITY_ERR_SMASK),
251/* 4*/ FLAG_ENTRY0("CceTrgtAccessErr",
252 CCE_ERR_STATUS_CCE_TRGT_ACCESS_ERR_SMASK),
253/* 5*/ FLAG_ENTRY0("CceRspdDataParityErr",
254 CCE_ERR_STATUS_CCE_RSPD_DATA_PARITY_ERR_SMASK),
255/* 6*/ FLAG_ENTRY0("CceCli0AsyncFifoParityErr",
256 CCE_ERR_STATUS_CCE_CLI0_ASYNC_FIFO_PARITY_ERR_SMASK),
257/* 7*/ FLAG_ENTRY0("CceCsrCfgBusParityErr",
258 CCE_ERR_STATUS_CCE_CSR_CFG_BUS_PARITY_ERR_SMASK),
259/* 8*/ FLAG_ENTRY0("CceCli2AsyncFifoParityErr",
260 CCE_ERR_STATUS_CCE_CLI2_ASYNC_FIFO_PARITY_ERR_SMASK),
261/* 9*/ FLAG_ENTRY0("CceCli1AsyncFifoPioCrdtParityErr",
262 CCE_ERR_STATUS_CCE_CLI1_ASYNC_FIFO_PIO_CRDT_PARITY_ERR_SMASK),
263/*10*/ FLAG_ENTRY0("CceCli1AsyncFifoPioCrdtParityErr",
264 CCE_ERR_STATUS_CCE_CLI1_ASYNC_FIFO_SDMA_HD_PARITY_ERR_SMASK),
265/*11*/ FLAG_ENTRY0("CceCli1AsyncFifoRxdmaParityError",
266 CCE_ERR_STATUS_CCE_CLI1_ASYNC_FIFO_RXDMA_PARITY_ERROR_SMASK),
267/*12*/ FLAG_ENTRY0("CceCli1AsyncFifoDbgParityError",
268 CCE_ERR_STATUS_CCE_CLI1_ASYNC_FIFO_DBG_PARITY_ERROR_SMASK),
269/*13*/ FLAG_ENTRY0("PcicRetryMemCorErr",
270 CCE_ERR_STATUS_PCIC_RETRY_MEM_COR_ERR_SMASK),
271/*14*/ FLAG_ENTRY0("PcicRetryMemCorErr",
272 CCE_ERR_STATUS_PCIC_RETRY_SOT_MEM_COR_ERR_SMASK),
273/*15*/ FLAG_ENTRY0("PcicPostHdQCorErr",
274 CCE_ERR_STATUS_PCIC_POST_HD_QCOR_ERR_SMASK),
275/*16*/ FLAG_ENTRY0("PcicPostHdQCorErr",
276 CCE_ERR_STATUS_PCIC_POST_DAT_QCOR_ERR_SMASK),
277/*17*/ FLAG_ENTRY0("PcicPostHdQCorErr",
278 CCE_ERR_STATUS_PCIC_CPL_HD_QCOR_ERR_SMASK),
279/*18*/ FLAG_ENTRY0("PcicCplDatQCorErr",
280 CCE_ERR_STATUS_PCIC_CPL_DAT_QCOR_ERR_SMASK),
281/*19*/ FLAG_ENTRY0("PcicNPostHQParityErr",
282 CCE_ERR_STATUS_PCIC_NPOST_HQ_PARITY_ERR_SMASK),
283/*20*/ FLAG_ENTRY0("PcicNPostDatQParityErr",
284 CCE_ERR_STATUS_PCIC_NPOST_DAT_QPARITY_ERR_SMASK),
285/*21*/ FLAG_ENTRY0("PcicRetryMemUncErr",
286 CCE_ERR_STATUS_PCIC_RETRY_MEM_UNC_ERR_SMASK),
287/*22*/ FLAG_ENTRY0("PcicRetrySotMemUncErr",
288 CCE_ERR_STATUS_PCIC_RETRY_SOT_MEM_UNC_ERR_SMASK),
289/*23*/ FLAG_ENTRY0("PcicPostHdQUncErr",
290 CCE_ERR_STATUS_PCIC_POST_HD_QUNC_ERR_SMASK),
291/*24*/ FLAG_ENTRY0("PcicPostDatQUncErr",
292 CCE_ERR_STATUS_PCIC_POST_DAT_QUNC_ERR_SMASK),
293/*25*/ FLAG_ENTRY0("PcicCplHdQUncErr",
294 CCE_ERR_STATUS_PCIC_CPL_HD_QUNC_ERR_SMASK),
295/*26*/ FLAG_ENTRY0("PcicCplDatQUncErr",
296 CCE_ERR_STATUS_PCIC_CPL_DAT_QUNC_ERR_SMASK),
297/*27*/ FLAG_ENTRY0("PcicTransmitFrontParityErr",
298 CCE_ERR_STATUS_PCIC_TRANSMIT_FRONT_PARITY_ERR_SMASK),
299/*28*/ FLAG_ENTRY0("PcicTransmitBackParityErr",
300 CCE_ERR_STATUS_PCIC_TRANSMIT_BACK_PARITY_ERR_SMASK),
301/*29*/ FLAG_ENTRY0("PcicReceiveParityErr",
302 CCE_ERR_STATUS_PCIC_RECEIVE_PARITY_ERR_SMASK),
303/*30*/ FLAG_ENTRY0("CceTrgtCplTimeoutErr",
304 CCE_ERR_STATUS_CCE_TRGT_CPL_TIMEOUT_ERR_SMASK),
305/*31*/ FLAG_ENTRY0("LATriggered",
306 CCE_ERR_STATUS_LA_TRIGGERED_SMASK),
307/*32*/ FLAG_ENTRY0("CceSegReadBadAddrErr",
308 CCE_ERR_STATUS_CCE_SEG_READ_BAD_ADDR_ERR_SMASK),
309/*33*/ FLAG_ENTRY0("CceSegWriteBadAddrErr",
310 CCE_ERR_STATUS_CCE_SEG_WRITE_BAD_ADDR_ERR_SMASK),
311/*34*/ FLAG_ENTRY0("CceRcplAsyncFifoParityErr",
312 CCE_ERR_STATUS_CCE_RCPL_ASYNC_FIFO_PARITY_ERR_SMASK),
313/*35*/ FLAG_ENTRY0("CceRxdmaConvFifoParityErr",
314 CCE_ERR_STATUS_CCE_RXDMA_CONV_FIFO_PARITY_ERR_SMASK),
315/*36*/ FLAG_ENTRY0("CceMsixTableCorErr",
316 CCE_ERR_STATUS_CCE_MSIX_TABLE_COR_ERR_SMASK),
317/*37*/ FLAG_ENTRY0("CceMsixTableUncErr",
318 CCE_ERR_STATUS_CCE_MSIX_TABLE_UNC_ERR_SMASK),
319/*38*/ FLAG_ENTRY0("CceIntMapCorErr",
320 CCE_ERR_STATUS_CCE_INT_MAP_COR_ERR_SMASK),
321/*39*/ FLAG_ENTRY0("CceIntMapUncErr",
322 CCE_ERR_STATUS_CCE_INT_MAP_UNC_ERR_SMASK),
323/*40*/ FLAG_ENTRY0("CceMsixCsrParityErr",
324 CCE_ERR_STATUS_CCE_MSIX_CSR_PARITY_ERR_SMASK),
325/*41-63 reserved*/
326};
327
328/*
329 * Misc Error flags
330 */
331#define MES(text) MISC_ERR_STATUS_MISC_##text##_ERR_SMASK
332static struct flag_table misc_err_status_flags[] = {
333/* 0*/ FLAG_ENTRY0("CSR_PARITY", MES(CSR_PARITY)),
334/* 1*/ FLAG_ENTRY0("CSR_READ_BAD_ADDR", MES(CSR_READ_BAD_ADDR)),
335/* 2*/ FLAG_ENTRY0("CSR_WRITE_BAD_ADDR", MES(CSR_WRITE_BAD_ADDR)),
336/* 3*/ FLAG_ENTRY0("SBUS_WRITE_FAILED", MES(SBUS_WRITE_FAILED)),
337/* 4*/ FLAG_ENTRY0("KEY_MISMATCH", MES(KEY_MISMATCH)),
338/* 5*/ FLAG_ENTRY0("FW_AUTH_FAILED", MES(FW_AUTH_FAILED)),
339/* 6*/ FLAG_ENTRY0("EFUSE_CSR_PARITY", MES(EFUSE_CSR_PARITY)),
340/* 7*/ FLAG_ENTRY0("EFUSE_READ_BAD_ADDR", MES(EFUSE_READ_BAD_ADDR)),
341/* 8*/ FLAG_ENTRY0("EFUSE_WRITE", MES(EFUSE_WRITE)),
342/* 9*/ FLAG_ENTRY0("EFUSE_DONE_PARITY", MES(EFUSE_DONE_PARITY)),
343/*10*/ FLAG_ENTRY0("INVALID_EEP_CMD", MES(INVALID_EEP_CMD)),
344/*11*/ FLAG_ENTRY0("MBIST_FAIL", MES(MBIST_FAIL)),
345/*12*/ FLAG_ENTRY0("PLL_LOCK_FAIL", MES(PLL_LOCK_FAIL))
346};
347
348/*
349 * TXE PIO Error flags and consequences
350 */
351static struct flag_table pio_err_status_flags[] = {
352/* 0*/ FLAG_ENTRY("PioWriteBadCtxt",
353 SEC_WRITE_DROPPED,
354 SEND_PIO_ERR_STATUS_PIO_WRITE_BAD_CTXT_ERR_SMASK),
355/* 1*/ FLAG_ENTRY("PioWriteAddrParity",
356 SEC_SPC_FREEZE,
357 SEND_PIO_ERR_STATUS_PIO_WRITE_ADDR_PARITY_ERR_SMASK),
358/* 2*/ FLAG_ENTRY("PioCsrParity",
359 SEC_SPC_FREEZE,
360 SEND_PIO_ERR_STATUS_PIO_CSR_PARITY_ERR_SMASK),
361/* 3*/ FLAG_ENTRY("PioSbMemFifo0",
362 SEC_SPC_FREEZE,
363 SEND_PIO_ERR_STATUS_PIO_SB_MEM_FIFO0_ERR_SMASK),
364/* 4*/ FLAG_ENTRY("PioSbMemFifo1",
365 SEC_SPC_FREEZE,
366 SEND_PIO_ERR_STATUS_PIO_SB_MEM_FIFO1_ERR_SMASK),
367/* 5*/ FLAG_ENTRY("PioPccFifoParity",
368 SEC_SPC_FREEZE,
369 SEND_PIO_ERR_STATUS_PIO_PCC_FIFO_PARITY_ERR_SMASK),
370/* 6*/ FLAG_ENTRY("PioPecFifoParity",
371 SEC_SPC_FREEZE,
372 SEND_PIO_ERR_STATUS_PIO_PEC_FIFO_PARITY_ERR_SMASK),
373/* 7*/ FLAG_ENTRY("PioSbrdctlCrrelParity",
374 SEC_SPC_FREEZE,
375 SEND_PIO_ERR_STATUS_PIO_SBRDCTL_CRREL_PARITY_ERR_SMASK),
376/* 8*/ FLAG_ENTRY("PioSbrdctrlCrrelFifoParity",
377 SEC_SPC_FREEZE,
378 SEND_PIO_ERR_STATUS_PIO_SBRDCTRL_CRREL_FIFO_PARITY_ERR_SMASK),
379/* 9*/ FLAG_ENTRY("PioPktEvictFifoParityErr",
380 SEC_SPC_FREEZE,
381 SEND_PIO_ERR_STATUS_PIO_PKT_EVICT_FIFO_PARITY_ERR_SMASK),
382/*10*/ FLAG_ENTRY("PioSmPktResetParity",
383 SEC_SPC_FREEZE,
384 SEND_PIO_ERR_STATUS_PIO_SM_PKT_RESET_PARITY_ERR_SMASK),
385/*11*/ FLAG_ENTRY("PioVlLenMemBank0Unc",
386 SEC_SPC_FREEZE,
387 SEND_PIO_ERR_STATUS_PIO_VL_LEN_MEM_BANK0_UNC_ERR_SMASK),
388/*12*/ FLAG_ENTRY("PioVlLenMemBank1Unc",
389 SEC_SPC_FREEZE,
390 SEND_PIO_ERR_STATUS_PIO_VL_LEN_MEM_BANK1_UNC_ERR_SMASK),
391/*13*/ FLAG_ENTRY("PioVlLenMemBank0Cor",
392 0,
393 SEND_PIO_ERR_STATUS_PIO_VL_LEN_MEM_BANK0_COR_ERR_SMASK),
394/*14*/ FLAG_ENTRY("PioVlLenMemBank1Cor",
395 0,
396 SEND_PIO_ERR_STATUS_PIO_VL_LEN_MEM_BANK1_COR_ERR_SMASK),
397/*15*/ FLAG_ENTRY("PioCreditRetFifoParity",
398 SEC_SPC_FREEZE,
399 SEND_PIO_ERR_STATUS_PIO_CREDIT_RET_FIFO_PARITY_ERR_SMASK),
400/*16*/ FLAG_ENTRY("PioPpmcPblFifo",
401 SEC_SPC_FREEZE,
402 SEND_PIO_ERR_STATUS_PIO_PPMC_PBL_FIFO_ERR_SMASK),
403/*17*/ FLAG_ENTRY("PioInitSmIn",
404 0,
405 SEND_PIO_ERR_STATUS_PIO_INIT_SM_IN_ERR_SMASK),
406/*18*/ FLAG_ENTRY("PioPktEvictSmOrArbSm",
407 SEC_SPC_FREEZE,
408 SEND_PIO_ERR_STATUS_PIO_PKT_EVICT_SM_OR_ARB_SM_ERR_SMASK),
409/*19*/ FLAG_ENTRY("PioHostAddrMemUnc",
410 SEC_SPC_FREEZE,
411 SEND_PIO_ERR_STATUS_PIO_HOST_ADDR_MEM_UNC_ERR_SMASK),
412/*20*/ FLAG_ENTRY("PioHostAddrMemCor",
413 0,
414 SEND_PIO_ERR_STATUS_PIO_HOST_ADDR_MEM_COR_ERR_SMASK),
415/*21*/ FLAG_ENTRY("PioWriteDataParity",
416 SEC_SPC_FREEZE,
417 SEND_PIO_ERR_STATUS_PIO_WRITE_DATA_PARITY_ERR_SMASK),
418/*22*/ FLAG_ENTRY("PioStateMachine",
419 SEC_SPC_FREEZE,
420 SEND_PIO_ERR_STATUS_PIO_STATE_MACHINE_ERR_SMASK),
421/*23*/ FLAG_ENTRY("PioWriteQwValidParity",
422 SEC_WRITE_DROPPED|SEC_SPC_FREEZE,
423 SEND_PIO_ERR_STATUS_PIO_WRITE_QW_VALID_PARITY_ERR_SMASK),
424/*24*/ FLAG_ENTRY("PioBlockQwCountParity",
425 SEC_WRITE_DROPPED|SEC_SPC_FREEZE,
426 SEND_PIO_ERR_STATUS_PIO_BLOCK_QW_COUNT_PARITY_ERR_SMASK),
427/*25*/ FLAG_ENTRY("PioVlfVlLenParity",
428 SEC_SPC_FREEZE,
429 SEND_PIO_ERR_STATUS_PIO_VLF_VL_LEN_PARITY_ERR_SMASK),
430/*26*/ FLAG_ENTRY("PioVlfSopParity",
431 SEC_SPC_FREEZE,
432 SEND_PIO_ERR_STATUS_PIO_VLF_SOP_PARITY_ERR_SMASK),
433/*27*/ FLAG_ENTRY("PioVlFifoParity",
434 SEC_SPC_FREEZE,
435 SEND_PIO_ERR_STATUS_PIO_VL_FIFO_PARITY_ERR_SMASK),
436/*28*/ FLAG_ENTRY("PioPpmcBqcMemParity",
437 SEC_SPC_FREEZE,
438 SEND_PIO_ERR_STATUS_PIO_PPMC_BQC_MEM_PARITY_ERR_SMASK),
439/*29*/ FLAG_ENTRY("PioPpmcSopLen",
440 SEC_SPC_FREEZE,
441 SEND_PIO_ERR_STATUS_PIO_PPMC_SOP_LEN_ERR_SMASK),
442/*30-31 reserved*/
443/*32*/ FLAG_ENTRY("PioCurrentFreeCntParity",
444 SEC_SPC_FREEZE,
445 SEND_PIO_ERR_STATUS_PIO_CURRENT_FREE_CNT_PARITY_ERR_SMASK),
446/*33*/ FLAG_ENTRY("PioLastReturnedCntParity",
447 SEC_SPC_FREEZE,
448 SEND_PIO_ERR_STATUS_PIO_LAST_RETURNED_CNT_PARITY_ERR_SMASK),
449/*34*/ FLAG_ENTRY("PioPccSopHeadParity",
450 SEC_SPC_FREEZE,
451 SEND_PIO_ERR_STATUS_PIO_PCC_SOP_HEAD_PARITY_ERR_SMASK),
452/*35*/ FLAG_ENTRY("PioPecSopHeadParityErr",
453 SEC_SPC_FREEZE,
454 SEND_PIO_ERR_STATUS_PIO_PEC_SOP_HEAD_PARITY_ERR_SMASK),
455/*36-63 reserved*/
456};
457
458/* TXE PIO errors that cause an SPC freeze */
459#define ALL_PIO_FREEZE_ERR \
460 (SEND_PIO_ERR_STATUS_PIO_WRITE_ADDR_PARITY_ERR_SMASK \
461 | SEND_PIO_ERR_STATUS_PIO_CSR_PARITY_ERR_SMASK \
462 | SEND_PIO_ERR_STATUS_PIO_SB_MEM_FIFO0_ERR_SMASK \
463 | SEND_PIO_ERR_STATUS_PIO_SB_MEM_FIFO1_ERR_SMASK \
464 | SEND_PIO_ERR_STATUS_PIO_PCC_FIFO_PARITY_ERR_SMASK \
465 | SEND_PIO_ERR_STATUS_PIO_PEC_FIFO_PARITY_ERR_SMASK \
466 | SEND_PIO_ERR_STATUS_PIO_SBRDCTL_CRREL_PARITY_ERR_SMASK \
467 | SEND_PIO_ERR_STATUS_PIO_SBRDCTRL_CRREL_FIFO_PARITY_ERR_SMASK \
468 | SEND_PIO_ERR_STATUS_PIO_PKT_EVICT_FIFO_PARITY_ERR_SMASK \
469 | SEND_PIO_ERR_STATUS_PIO_SM_PKT_RESET_PARITY_ERR_SMASK \
470 | SEND_PIO_ERR_STATUS_PIO_VL_LEN_MEM_BANK0_UNC_ERR_SMASK \
471 | SEND_PIO_ERR_STATUS_PIO_VL_LEN_MEM_BANK1_UNC_ERR_SMASK \
472 | SEND_PIO_ERR_STATUS_PIO_CREDIT_RET_FIFO_PARITY_ERR_SMASK \
473 | SEND_PIO_ERR_STATUS_PIO_PPMC_PBL_FIFO_ERR_SMASK \
474 | SEND_PIO_ERR_STATUS_PIO_PKT_EVICT_SM_OR_ARB_SM_ERR_SMASK \
475 | SEND_PIO_ERR_STATUS_PIO_HOST_ADDR_MEM_UNC_ERR_SMASK \
476 | SEND_PIO_ERR_STATUS_PIO_WRITE_DATA_PARITY_ERR_SMASK \
477 | SEND_PIO_ERR_STATUS_PIO_STATE_MACHINE_ERR_SMASK \
478 | SEND_PIO_ERR_STATUS_PIO_WRITE_QW_VALID_PARITY_ERR_SMASK \
479 | SEND_PIO_ERR_STATUS_PIO_BLOCK_QW_COUNT_PARITY_ERR_SMASK \
480 | SEND_PIO_ERR_STATUS_PIO_VLF_VL_LEN_PARITY_ERR_SMASK \
481 | SEND_PIO_ERR_STATUS_PIO_VLF_SOP_PARITY_ERR_SMASK \
482 | SEND_PIO_ERR_STATUS_PIO_VL_FIFO_PARITY_ERR_SMASK \
483 | SEND_PIO_ERR_STATUS_PIO_PPMC_BQC_MEM_PARITY_ERR_SMASK \
484 | SEND_PIO_ERR_STATUS_PIO_PPMC_SOP_LEN_ERR_SMASK \
485 | SEND_PIO_ERR_STATUS_PIO_CURRENT_FREE_CNT_PARITY_ERR_SMASK \
486 | SEND_PIO_ERR_STATUS_PIO_LAST_RETURNED_CNT_PARITY_ERR_SMASK \
487 | SEND_PIO_ERR_STATUS_PIO_PCC_SOP_HEAD_PARITY_ERR_SMASK \
488 | SEND_PIO_ERR_STATUS_PIO_PEC_SOP_HEAD_PARITY_ERR_SMASK)
489
490/*
491 * TXE SDMA Error flags
492 */
493static struct flag_table sdma_err_status_flags[] = {
494/* 0*/ FLAG_ENTRY0("SDmaRpyTagErr",
495 SEND_DMA_ERR_STATUS_SDMA_RPY_TAG_ERR_SMASK),
496/* 1*/ FLAG_ENTRY0("SDmaCsrParityErr",
497 SEND_DMA_ERR_STATUS_SDMA_CSR_PARITY_ERR_SMASK),
498/* 2*/ FLAG_ENTRY0("SDmaPcieReqTrackingUncErr",
499 SEND_DMA_ERR_STATUS_SDMA_PCIE_REQ_TRACKING_UNC_ERR_SMASK),
500/* 3*/ FLAG_ENTRY0("SDmaPcieReqTrackingCorErr",
501 SEND_DMA_ERR_STATUS_SDMA_PCIE_REQ_TRACKING_COR_ERR_SMASK),
502/*04-63 reserved*/
503};
504
505/* TXE SDMA errors that cause an SPC freeze */
506#define ALL_SDMA_FREEZE_ERR \
507 (SEND_DMA_ERR_STATUS_SDMA_RPY_TAG_ERR_SMASK \
508 | SEND_DMA_ERR_STATUS_SDMA_CSR_PARITY_ERR_SMASK \
509 | SEND_DMA_ERR_STATUS_SDMA_PCIE_REQ_TRACKING_UNC_ERR_SMASK)
510
511/*
512 * TXE Egress Error flags
513 */
514#define SEES(text) SEND_EGRESS_ERR_STATUS_##text##_ERR_SMASK
515static struct flag_table egress_err_status_flags[] = {
516/* 0*/ FLAG_ENTRY0("TxPktIntegrityMemCorErr", SEES(TX_PKT_INTEGRITY_MEM_COR)),
517/* 1*/ FLAG_ENTRY0("TxPktIntegrityMemUncErr", SEES(TX_PKT_INTEGRITY_MEM_UNC)),
518/* 2 reserved */
519/* 3*/ FLAG_ENTRY0("TxEgressFifoUnderrunOrParityErr",
520 SEES(TX_EGRESS_FIFO_UNDERRUN_OR_PARITY)),
521/* 4*/ FLAG_ENTRY0("TxLinkdownErr", SEES(TX_LINKDOWN)),
522/* 5*/ FLAG_ENTRY0("TxIncorrectLinkStateErr", SEES(TX_INCORRECT_LINK_STATE)),
523/* 6 reserved */
524/* 7*/ FLAG_ENTRY0("TxPioLaunchIntfParityErr",
525 SEES(TX_PIO_LAUNCH_INTF_PARITY)),
526/* 8*/ FLAG_ENTRY0("TxSdmaLaunchIntfParityErr",
527 SEES(TX_SDMA_LAUNCH_INTF_PARITY)),
528/* 9-10 reserved */
529/*11*/ FLAG_ENTRY0("TxSbrdCtlStateMachineParityErr",
530 SEES(TX_SBRD_CTL_STATE_MACHINE_PARITY)),
531/*12*/ FLAG_ENTRY0("TxIllegalVLErr", SEES(TX_ILLEGAL_VL)),
532/*13*/ FLAG_ENTRY0("TxLaunchCsrParityErr", SEES(TX_LAUNCH_CSR_PARITY)),
533/*14*/ FLAG_ENTRY0("TxSbrdCtlCsrParityErr", SEES(TX_SBRD_CTL_CSR_PARITY)),
534/*15*/ FLAG_ENTRY0("TxConfigParityErr", SEES(TX_CONFIG_PARITY)),
535/*16*/ FLAG_ENTRY0("TxSdma0DisallowedPacketErr",
536 SEES(TX_SDMA0_DISALLOWED_PACKET)),
537/*17*/ FLAG_ENTRY0("TxSdma1DisallowedPacketErr",
538 SEES(TX_SDMA1_DISALLOWED_PACKET)),
539/*18*/ FLAG_ENTRY0("TxSdma2DisallowedPacketErr",
540 SEES(TX_SDMA2_DISALLOWED_PACKET)),
541/*19*/ FLAG_ENTRY0("TxSdma3DisallowedPacketErr",
542 SEES(TX_SDMA3_DISALLOWED_PACKET)),
543/*20*/ FLAG_ENTRY0("TxSdma4DisallowedPacketErr",
544 SEES(TX_SDMA4_DISALLOWED_PACKET)),
545/*21*/ FLAG_ENTRY0("TxSdma5DisallowedPacketErr",
546 SEES(TX_SDMA5_DISALLOWED_PACKET)),
547/*22*/ FLAG_ENTRY0("TxSdma6DisallowedPacketErr",
548 SEES(TX_SDMA6_DISALLOWED_PACKET)),
549/*23*/ FLAG_ENTRY0("TxSdma7DisallowedPacketErr",
550 SEES(TX_SDMA7_DISALLOWED_PACKET)),
551/*24*/ FLAG_ENTRY0("TxSdma8DisallowedPacketErr",
552 SEES(TX_SDMA8_DISALLOWED_PACKET)),
553/*25*/ FLAG_ENTRY0("TxSdma9DisallowedPacketErr",
554 SEES(TX_SDMA9_DISALLOWED_PACKET)),
555/*26*/ FLAG_ENTRY0("TxSdma10DisallowedPacketErr",
556 SEES(TX_SDMA10_DISALLOWED_PACKET)),
557/*27*/ FLAG_ENTRY0("TxSdma11DisallowedPacketErr",
558 SEES(TX_SDMA11_DISALLOWED_PACKET)),
559/*28*/ FLAG_ENTRY0("TxSdma12DisallowedPacketErr",
560 SEES(TX_SDMA12_DISALLOWED_PACKET)),
561/*29*/ FLAG_ENTRY0("TxSdma13DisallowedPacketErr",
562 SEES(TX_SDMA13_DISALLOWED_PACKET)),
563/*30*/ FLAG_ENTRY0("TxSdma14DisallowedPacketErr",
564 SEES(TX_SDMA14_DISALLOWED_PACKET)),
565/*31*/ FLAG_ENTRY0("TxSdma15DisallowedPacketErr",
566 SEES(TX_SDMA15_DISALLOWED_PACKET)),
567/*32*/ FLAG_ENTRY0("TxLaunchFifo0UncOrParityErr",
568 SEES(TX_LAUNCH_FIFO0_UNC_OR_PARITY)),
569/*33*/ FLAG_ENTRY0("TxLaunchFifo1UncOrParityErr",
570 SEES(TX_LAUNCH_FIFO1_UNC_OR_PARITY)),
571/*34*/ FLAG_ENTRY0("TxLaunchFifo2UncOrParityErr",
572 SEES(TX_LAUNCH_FIFO2_UNC_OR_PARITY)),
573/*35*/ FLAG_ENTRY0("TxLaunchFifo3UncOrParityErr",
574 SEES(TX_LAUNCH_FIFO3_UNC_OR_PARITY)),
575/*36*/ FLAG_ENTRY0("TxLaunchFifo4UncOrParityErr",
576 SEES(TX_LAUNCH_FIFO4_UNC_OR_PARITY)),
577/*37*/ FLAG_ENTRY0("TxLaunchFifo5UncOrParityErr",
578 SEES(TX_LAUNCH_FIFO5_UNC_OR_PARITY)),
579/*38*/ FLAG_ENTRY0("TxLaunchFifo6UncOrParityErr",
580 SEES(TX_LAUNCH_FIFO6_UNC_OR_PARITY)),
581/*39*/ FLAG_ENTRY0("TxLaunchFifo7UncOrParityErr",
582 SEES(TX_LAUNCH_FIFO7_UNC_OR_PARITY)),
583/*40*/ FLAG_ENTRY0("TxLaunchFifo8UncOrParityErr",
584 SEES(TX_LAUNCH_FIFO8_UNC_OR_PARITY)),
585/*41*/ FLAG_ENTRY0("TxCreditReturnParityErr", SEES(TX_CREDIT_RETURN_PARITY)),
586/*42*/ FLAG_ENTRY0("TxSbHdrUncErr", SEES(TX_SB_HDR_UNC)),
587/*43*/ FLAG_ENTRY0("TxReadSdmaMemoryUncErr", SEES(TX_READ_SDMA_MEMORY_UNC)),
588/*44*/ FLAG_ENTRY0("TxReadPioMemoryUncErr", SEES(TX_READ_PIO_MEMORY_UNC)),
589/*45*/ FLAG_ENTRY0("TxEgressFifoUncErr", SEES(TX_EGRESS_FIFO_UNC)),
590/*46*/ FLAG_ENTRY0("TxHcrcInsertionErr", SEES(TX_HCRC_INSERTION)),
591/*47*/ FLAG_ENTRY0("TxCreditReturnVLErr", SEES(TX_CREDIT_RETURN_VL)),
592/*48*/ FLAG_ENTRY0("TxLaunchFifo0CorErr", SEES(TX_LAUNCH_FIFO0_COR)),
593/*49*/ FLAG_ENTRY0("TxLaunchFifo1CorErr", SEES(TX_LAUNCH_FIFO1_COR)),
594/*50*/ FLAG_ENTRY0("TxLaunchFifo2CorErr", SEES(TX_LAUNCH_FIFO2_COR)),
595/*51*/ FLAG_ENTRY0("TxLaunchFifo3CorErr", SEES(TX_LAUNCH_FIFO3_COR)),
596/*52*/ FLAG_ENTRY0("TxLaunchFifo4CorErr", SEES(TX_LAUNCH_FIFO4_COR)),
597/*53*/ FLAG_ENTRY0("TxLaunchFifo5CorErr", SEES(TX_LAUNCH_FIFO5_COR)),
598/*54*/ FLAG_ENTRY0("TxLaunchFifo6CorErr", SEES(TX_LAUNCH_FIFO6_COR)),
599/*55*/ FLAG_ENTRY0("TxLaunchFifo7CorErr", SEES(TX_LAUNCH_FIFO7_COR)),
600/*56*/ FLAG_ENTRY0("TxLaunchFifo8CorErr", SEES(TX_LAUNCH_FIFO8_COR)),
601/*57*/ FLAG_ENTRY0("TxCreditOverrunErr", SEES(TX_CREDIT_OVERRUN)),
602/*58*/ FLAG_ENTRY0("TxSbHdrCorErr", SEES(TX_SB_HDR_COR)),
603/*59*/ FLAG_ENTRY0("TxReadSdmaMemoryCorErr", SEES(TX_READ_SDMA_MEMORY_COR)),
604/*60*/ FLAG_ENTRY0("TxReadPioMemoryCorErr", SEES(TX_READ_PIO_MEMORY_COR)),
605/*61*/ FLAG_ENTRY0("TxEgressFifoCorErr", SEES(TX_EGRESS_FIFO_COR)),
606/*62*/ FLAG_ENTRY0("TxReadSdmaMemoryCsrUncErr",
607 SEES(TX_READ_SDMA_MEMORY_CSR_UNC)),
608/*63*/ FLAG_ENTRY0("TxReadPioMemoryCsrUncErr",
609 SEES(TX_READ_PIO_MEMORY_CSR_UNC)),
610};
611
612/*
613 * TXE Egress Error Info flags
614 */
615#define SEEI(text) SEND_EGRESS_ERR_INFO_##text##_ERR_SMASK
616static struct flag_table egress_err_info_flags[] = {
617/* 0*/ FLAG_ENTRY0("Reserved", 0ull),
618/* 1*/ FLAG_ENTRY0("VLErr", SEEI(VL)),
619/* 2*/ FLAG_ENTRY0("JobKeyErr", SEEI(JOB_KEY)),
620/* 3*/ FLAG_ENTRY0("JobKeyErr", SEEI(JOB_KEY)),
621/* 4*/ FLAG_ENTRY0("PartitionKeyErr", SEEI(PARTITION_KEY)),
622/* 5*/ FLAG_ENTRY0("SLIDErr", SEEI(SLID)),
623/* 6*/ FLAG_ENTRY0("OpcodeErr", SEEI(OPCODE)),
624/* 7*/ FLAG_ENTRY0("VLMappingErr", SEEI(VL_MAPPING)),
625/* 8*/ FLAG_ENTRY0("RawErr", SEEI(RAW)),
626/* 9*/ FLAG_ENTRY0("RawIPv6Err", SEEI(RAW_IPV6)),
627/*10*/ FLAG_ENTRY0("GRHErr", SEEI(GRH)),
628/*11*/ FLAG_ENTRY0("BypassErr", SEEI(BYPASS)),
629/*12*/ FLAG_ENTRY0("KDETHPacketsErr", SEEI(KDETH_PACKETS)),
630/*13*/ FLAG_ENTRY0("NonKDETHPacketsErr", SEEI(NON_KDETH_PACKETS)),
631/*14*/ FLAG_ENTRY0("TooSmallIBPacketsErr", SEEI(TOO_SMALL_IB_PACKETS)),
632/*15*/ FLAG_ENTRY0("TooSmallBypassPacketsErr", SEEI(TOO_SMALL_BYPASS_PACKETS)),
633/*16*/ FLAG_ENTRY0("PbcTestErr", SEEI(PBC_TEST)),
634/*17*/ FLAG_ENTRY0("BadPktLenErr", SEEI(BAD_PKT_LEN)),
635/*18*/ FLAG_ENTRY0("TooLongIBPacketErr", SEEI(TOO_LONG_IB_PACKET)),
636/*19*/ FLAG_ENTRY0("TooLongBypassPacketsErr", SEEI(TOO_LONG_BYPASS_PACKETS)),
637/*20*/ FLAG_ENTRY0("PbcStaticRateControlErr", SEEI(PBC_STATIC_RATE_CONTROL)),
638/*21*/ FLAG_ENTRY0("BypassBadPktLenErr", SEEI(BAD_PKT_LEN)),
639};
640
641/* TXE Egress errors that cause an SPC freeze */
642#define ALL_TXE_EGRESS_FREEZE_ERR \
643 (SEES(TX_EGRESS_FIFO_UNDERRUN_OR_PARITY) \
644 | SEES(TX_PIO_LAUNCH_INTF_PARITY) \
645 | SEES(TX_SDMA_LAUNCH_INTF_PARITY) \
646 | SEES(TX_SBRD_CTL_STATE_MACHINE_PARITY) \
647 | SEES(TX_LAUNCH_CSR_PARITY) \
648 | SEES(TX_SBRD_CTL_CSR_PARITY) \
649 | SEES(TX_CONFIG_PARITY) \
650 | SEES(TX_LAUNCH_FIFO0_UNC_OR_PARITY) \
651 | SEES(TX_LAUNCH_FIFO1_UNC_OR_PARITY) \
652 | SEES(TX_LAUNCH_FIFO2_UNC_OR_PARITY) \
653 | SEES(TX_LAUNCH_FIFO3_UNC_OR_PARITY) \
654 | SEES(TX_LAUNCH_FIFO4_UNC_OR_PARITY) \
655 | SEES(TX_LAUNCH_FIFO5_UNC_OR_PARITY) \
656 | SEES(TX_LAUNCH_FIFO6_UNC_OR_PARITY) \
657 | SEES(TX_LAUNCH_FIFO7_UNC_OR_PARITY) \
658 | SEES(TX_LAUNCH_FIFO8_UNC_OR_PARITY) \
659 | SEES(TX_CREDIT_RETURN_PARITY))
660
661/*
662 * TXE Send error flags
663 */
664#define SES(name) SEND_ERR_STATUS_SEND_##name##_ERR_SMASK
665static struct flag_table send_err_status_flags[] = {
666/* 0*/ FLAG_ENTRY0("SDmaRpyTagErr", SES(CSR_PARITY)),
667/* 1*/ FLAG_ENTRY0("SendCsrReadBadAddrErr", SES(CSR_READ_BAD_ADDR)),
668/* 2*/ FLAG_ENTRY0("SendCsrWriteBadAddrErr", SES(CSR_WRITE_BAD_ADDR))
669};
670
671/*
672 * TXE Send Context Error flags and consequences
673 */
674static struct flag_table sc_err_status_flags[] = {
675/* 0*/ FLAG_ENTRY("InconsistentSop",
676 SEC_PACKET_DROPPED | SEC_SC_HALTED,
677 SEND_CTXT_ERR_STATUS_PIO_INCONSISTENT_SOP_ERR_SMASK),
678/* 1*/ FLAG_ENTRY("DisallowedPacket",
679 SEC_PACKET_DROPPED | SEC_SC_HALTED,
680 SEND_CTXT_ERR_STATUS_PIO_DISALLOWED_PACKET_ERR_SMASK),
681/* 2*/ FLAG_ENTRY("WriteCrossesBoundary",
682 SEC_WRITE_DROPPED | SEC_SC_HALTED,
683 SEND_CTXT_ERR_STATUS_PIO_WRITE_CROSSES_BOUNDARY_ERR_SMASK),
684/* 3*/ FLAG_ENTRY("WriteOverflow",
685 SEC_WRITE_DROPPED | SEC_SC_HALTED,
686 SEND_CTXT_ERR_STATUS_PIO_WRITE_OVERFLOW_ERR_SMASK),
687/* 4*/ FLAG_ENTRY("WriteOutOfBounds",
688 SEC_WRITE_DROPPED | SEC_SC_HALTED,
689 SEND_CTXT_ERR_STATUS_PIO_WRITE_OUT_OF_BOUNDS_ERR_SMASK),
690/* 5-63 reserved*/
691};
692
693/*
694 * RXE Receive Error flags
695 */
696#define RXES(name) RCV_ERR_STATUS_RX_##name##_ERR_SMASK
697static struct flag_table rxe_err_status_flags[] = {
698/* 0*/ FLAG_ENTRY0("RxDmaCsrCorErr", RXES(DMA_CSR_COR)),
699/* 1*/ FLAG_ENTRY0("RxDcIntfParityErr", RXES(DC_INTF_PARITY)),
700/* 2*/ FLAG_ENTRY0("RxRcvHdrUncErr", RXES(RCV_HDR_UNC)),
701/* 3*/ FLAG_ENTRY0("RxRcvHdrCorErr", RXES(RCV_HDR_COR)),
702/* 4*/ FLAG_ENTRY0("RxRcvDataUncErr", RXES(RCV_DATA_UNC)),
703/* 5*/ FLAG_ENTRY0("RxRcvDataCorErr", RXES(RCV_DATA_COR)),
704/* 6*/ FLAG_ENTRY0("RxRcvQpMapTableUncErr", RXES(RCV_QP_MAP_TABLE_UNC)),
705/* 7*/ FLAG_ENTRY0("RxRcvQpMapTableCorErr", RXES(RCV_QP_MAP_TABLE_COR)),
706/* 8*/ FLAG_ENTRY0("RxRcvCsrParityErr", RXES(RCV_CSR_PARITY)),
707/* 9*/ FLAG_ENTRY0("RxDcSopEopParityErr", RXES(DC_SOP_EOP_PARITY)),
708/*10*/ FLAG_ENTRY0("RxDmaFlagUncErr", RXES(DMA_FLAG_UNC)),
709/*11*/ FLAG_ENTRY0("RxDmaFlagCorErr", RXES(DMA_FLAG_COR)),
710/*12*/ FLAG_ENTRY0("RxRcvFsmEncodingErr", RXES(RCV_FSM_ENCODING)),
711/*13*/ FLAG_ENTRY0("RxRbufFreeListUncErr", RXES(RBUF_FREE_LIST_UNC)),
712/*14*/ FLAG_ENTRY0("RxRbufFreeListCorErr", RXES(RBUF_FREE_LIST_COR)),
713/*15*/ FLAG_ENTRY0("RxRbufLookupDesRegUncErr", RXES(RBUF_LOOKUP_DES_REG_UNC)),
714/*16*/ FLAG_ENTRY0("RxRbufLookupDesRegUncCorErr",
715 RXES(RBUF_LOOKUP_DES_REG_UNC_COR)),
716/*17*/ FLAG_ENTRY0("RxRbufLookupDesUncErr", RXES(RBUF_LOOKUP_DES_UNC)),
717/*18*/ FLAG_ENTRY0("RxRbufLookupDesCorErr", RXES(RBUF_LOOKUP_DES_COR)),
718/*19*/ FLAG_ENTRY0("RxRbufBlockListReadUncErr",
719 RXES(RBUF_BLOCK_LIST_READ_UNC)),
720/*20*/ FLAG_ENTRY0("RxRbufBlockListReadCorErr",
721 RXES(RBUF_BLOCK_LIST_READ_COR)),
722/*21*/ FLAG_ENTRY0("RxRbufCsrQHeadBufNumParityErr",
723 RXES(RBUF_CSR_QHEAD_BUF_NUM_PARITY)),
724/*22*/ FLAG_ENTRY0("RxRbufCsrQEntCntParityErr",
725 RXES(RBUF_CSR_QENT_CNT_PARITY)),
726/*23*/ FLAG_ENTRY0("RxRbufCsrQNextBufParityErr",
727 RXES(RBUF_CSR_QNEXT_BUF_PARITY)),
728/*24*/ FLAG_ENTRY0("RxRbufCsrQVldBitParityErr",
729 RXES(RBUF_CSR_QVLD_BIT_PARITY)),
730/*25*/ FLAG_ENTRY0("RxRbufCsrQHdPtrParityErr", RXES(RBUF_CSR_QHD_PTR_PARITY)),
731/*26*/ FLAG_ENTRY0("RxRbufCsrQTlPtrParityErr", RXES(RBUF_CSR_QTL_PTR_PARITY)),
732/*27*/ FLAG_ENTRY0("RxRbufCsrQNumOfPktParityErr",
733 RXES(RBUF_CSR_QNUM_OF_PKT_PARITY)),
734/*28*/ FLAG_ENTRY0("RxRbufCsrQEOPDWParityErr", RXES(RBUF_CSR_QEOPDW_PARITY)),
735/*29*/ FLAG_ENTRY0("RxRbufCtxIdParityErr", RXES(RBUF_CTX_ID_PARITY)),
736/*30*/ FLAG_ENTRY0("RxRBufBadLookupErr", RXES(RBUF_BAD_LOOKUP)),
737/*31*/ FLAG_ENTRY0("RxRbufFullErr", RXES(RBUF_FULL)),
738/*32*/ FLAG_ENTRY0("RxRbufEmptyErr", RXES(RBUF_EMPTY)),
739/*33*/ FLAG_ENTRY0("RxRbufFlRdAddrParityErr", RXES(RBUF_FL_RD_ADDR_PARITY)),
740/*34*/ FLAG_ENTRY0("RxRbufFlWrAddrParityErr", RXES(RBUF_FL_WR_ADDR_PARITY)),
741/*35*/ FLAG_ENTRY0("RxRbufFlInitdoneParityErr",
742 RXES(RBUF_FL_INITDONE_PARITY)),
743/*36*/ FLAG_ENTRY0("RxRbufFlInitWrAddrParityErr",
744 RXES(RBUF_FL_INIT_WR_ADDR_PARITY)),
745/*37*/ FLAG_ENTRY0("RxRbufNextFreeBufUncErr", RXES(RBUF_NEXT_FREE_BUF_UNC)),
746/*38*/ FLAG_ENTRY0("RxRbufNextFreeBufCorErr", RXES(RBUF_NEXT_FREE_BUF_COR)),
747/*39*/ FLAG_ENTRY0("RxLookupDesPart1UncErr", RXES(LOOKUP_DES_PART1_UNC)),
748/*40*/ FLAG_ENTRY0("RxLookupDesPart1UncCorErr",
749 RXES(LOOKUP_DES_PART1_UNC_COR)),
750/*41*/ FLAG_ENTRY0("RxLookupDesPart2ParityErr",
751 RXES(LOOKUP_DES_PART2_PARITY)),
752/*42*/ FLAG_ENTRY0("RxLookupRcvArrayUncErr", RXES(LOOKUP_RCV_ARRAY_UNC)),
753/*43*/ FLAG_ENTRY0("RxLookupRcvArrayCorErr", RXES(LOOKUP_RCV_ARRAY_COR)),
754/*44*/ FLAG_ENTRY0("RxLookupCsrParityErr", RXES(LOOKUP_CSR_PARITY)),
755/*45*/ FLAG_ENTRY0("RxHqIntrCsrParityErr", RXES(HQ_INTR_CSR_PARITY)),
756/*46*/ FLAG_ENTRY0("RxHqIntrFsmErr", RXES(HQ_INTR_FSM)),
757/*47*/ FLAG_ENTRY0("RxRbufDescPart1UncErr", RXES(RBUF_DESC_PART1_UNC)),
758/*48*/ FLAG_ENTRY0("RxRbufDescPart1CorErr", RXES(RBUF_DESC_PART1_COR)),
759/*49*/ FLAG_ENTRY0("RxRbufDescPart2UncErr", RXES(RBUF_DESC_PART2_UNC)),
760/*50*/ FLAG_ENTRY0("RxRbufDescPart2CorErr", RXES(RBUF_DESC_PART2_COR)),
761/*51*/ FLAG_ENTRY0("RxDmaHdrFifoRdUncErr", RXES(DMA_HDR_FIFO_RD_UNC)),
762/*52*/ FLAG_ENTRY0("RxDmaHdrFifoRdCorErr", RXES(DMA_HDR_FIFO_RD_COR)),
763/*53*/ FLAG_ENTRY0("RxDmaDataFifoRdUncErr", RXES(DMA_DATA_FIFO_RD_UNC)),
764/*54*/ FLAG_ENTRY0("RxDmaDataFifoRdCorErr", RXES(DMA_DATA_FIFO_RD_COR)),
765/*55*/ FLAG_ENTRY0("RxRbufDataUncErr", RXES(RBUF_DATA_UNC)),
766/*56*/ FLAG_ENTRY0("RxRbufDataCorErr", RXES(RBUF_DATA_COR)),
767/*57*/ FLAG_ENTRY0("RxDmaCsrParityErr", RXES(DMA_CSR_PARITY)),
768/*58*/ FLAG_ENTRY0("RxDmaEqFsmEncodingErr", RXES(DMA_EQ_FSM_ENCODING)),
769/*59*/ FLAG_ENTRY0("RxDmaDqFsmEncodingErr", RXES(DMA_DQ_FSM_ENCODING)),
770/*60*/ FLAG_ENTRY0("RxDmaCsrUncErr", RXES(DMA_CSR_UNC)),
771/*61*/ FLAG_ENTRY0("RxCsrReadBadAddrErr", RXES(CSR_READ_BAD_ADDR)),
772/*62*/ FLAG_ENTRY0("RxCsrWriteBadAddrErr", RXES(CSR_WRITE_BAD_ADDR)),
773/*63*/ FLAG_ENTRY0("RxCsrParityErr", RXES(CSR_PARITY))
774};
775
776/* RXE errors that will trigger an SPC freeze */
777#define ALL_RXE_FREEZE_ERR \
778 (RCV_ERR_STATUS_RX_RCV_QP_MAP_TABLE_UNC_ERR_SMASK \
779 | RCV_ERR_STATUS_RX_RCV_CSR_PARITY_ERR_SMASK \
780 | RCV_ERR_STATUS_RX_DMA_FLAG_UNC_ERR_SMASK \
781 | RCV_ERR_STATUS_RX_RCV_FSM_ENCODING_ERR_SMASK \
782 | RCV_ERR_STATUS_RX_RBUF_FREE_LIST_UNC_ERR_SMASK \
783 | RCV_ERR_STATUS_RX_RBUF_LOOKUP_DES_REG_UNC_ERR_SMASK \
784 | RCV_ERR_STATUS_RX_RBUF_LOOKUP_DES_REG_UNC_COR_ERR_SMASK \
785 | RCV_ERR_STATUS_RX_RBUF_LOOKUP_DES_UNC_ERR_SMASK \
786 | RCV_ERR_STATUS_RX_RBUF_BLOCK_LIST_READ_UNC_ERR_SMASK \
787 | RCV_ERR_STATUS_RX_RBUF_CSR_QHEAD_BUF_NUM_PARITY_ERR_SMASK \
788 | RCV_ERR_STATUS_RX_RBUF_CSR_QENT_CNT_PARITY_ERR_SMASK \
789 | RCV_ERR_STATUS_RX_RBUF_CSR_QNEXT_BUF_PARITY_ERR_SMASK \
790 | RCV_ERR_STATUS_RX_RBUF_CSR_QVLD_BIT_PARITY_ERR_SMASK \
791 | RCV_ERR_STATUS_RX_RBUF_CSR_QHD_PTR_PARITY_ERR_SMASK \
792 | RCV_ERR_STATUS_RX_RBUF_CSR_QTL_PTR_PARITY_ERR_SMASK \
793 | RCV_ERR_STATUS_RX_RBUF_CSR_QNUM_OF_PKT_PARITY_ERR_SMASK \
794 | RCV_ERR_STATUS_RX_RBUF_CSR_QEOPDW_PARITY_ERR_SMASK \
795 | RCV_ERR_STATUS_RX_RBUF_CTX_ID_PARITY_ERR_SMASK \
796 | RCV_ERR_STATUS_RX_RBUF_BAD_LOOKUP_ERR_SMASK \
797 | RCV_ERR_STATUS_RX_RBUF_FULL_ERR_SMASK \
798 | RCV_ERR_STATUS_RX_RBUF_EMPTY_ERR_SMASK \
799 | RCV_ERR_STATUS_RX_RBUF_FL_RD_ADDR_PARITY_ERR_SMASK \
800 | RCV_ERR_STATUS_RX_RBUF_FL_WR_ADDR_PARITY_ERR_SMASK \
801 | RCV_ERR_STATUS_RX_RBUF_FL_INITDONE_PARITY_ERR_SMASK \
802 | RCV_ERR_STATUS_RX_RBUF_FL_INIT_WR_ADDR_PARITY_ERR_SMASK \
803 | RCV_ERR_STATUS_RX_RBUF_NEXT_FREE_BUF_UNC_ERR_SMASK \
804 | RCV_ERR_STATUS_RX_LOOKUP_DES_PART1_UNC_ERR_SMASK \
805 | RCV_ERR_STATUS_RX_LOOKUP_DES_PART1_UNC_COR_ERR_SMASK \
806 | RCV_ERR_STATUS_RX_LOOKUP_DES_PART2_PARITY_ERR_SMASK \
807 | RCV_ERR_STATUS_RX_LOOKUP_RCV_ARRAY_UNC_ERR_SMASK \
808 | RCV_ERR_STATUS_RX_LOOKUP_CSR_PARITY_ERR_SMASK \
809 | RCV_ERR_STATUS_RX_HQ_INTR_CSR_PARITY_ERR_SMASK \
810 | RCV_ERR_STATUS_RX_HQ_INTR_FSM_ERR_SMASK \
811 | RCV_ERR_STATUS_RX_RBUF_DESC_PART1_UNC_ERR_SMASK \
812 | RCV_ERR_STATUS_RX_RBUF_DESC_PART1_COR_ERR_SMASK \
813 | RCV_ERR_STATUS_RX_RBUF_DESC_PART2_UNC_ERR_SMASK \
814 | RCV_ERR_STATUS_RX_DMA_HDR_FIFO_RD_UNC_ERR_SMASK \
815 | RCV_ERR_STATUS_RX_DMA_DATA_FIFO_RD_UNC_ERR_SMASK \
816 | RCV_ERR_STATUS_RX_RBUF_DATA_UNC_ERR_SMASK \
817 | RCV_ERR_STATUS_RX_DMA_CSR_PARITY_ERR_SMASK \
818 | RCV_ERR_STATUS_RX_DMA_EQ_FSM_ENCODING_ERR_SMASK \
819 | RCV_ERR_STATUS_RX_DMA_DQ_FSM_ENCODING_ERR_SMASK \
820 | RCV_ERR_STATUS_RX_DMA_CSR_UNC_ERR_SMASK \
821 | RCV_ERR_STATUS_RX_CSR_PARITY_ERR_SMASK)
822
823#define RXE_FREEZE_ABORT_MASK \
824 (RCV_ERR_STATUS_RX_DMA_CSR_UNC_ERR_SMASK | \
825 RCV_ERR_STATUS_RX_DMA_HDR_FIFO_RD_UNC_ERR_SMASK | \
826 RCV_ERR_STATUS_RX_DMA_DATA_FIFO_RD_UNC_ERR_SMASK)
827
828/*
829 * DCC Error Flags
830 */
831#define DCCE(name) DCC_ERR_FLG_##name##_SMASK
832static struct flag_table dcc_err_flags[] = {
833 FLAG_ENTRY0("bad_l2_err", DCCE(BAD_L2_ERR)),
834 FLAG_ENTRY0("bad_sc_err", DCCE(BAD_SC_ERR)),
835 FLAG_ENTRY0("bad_mid_tail_err", DCCE(BAD_MID_TAIL_ERR)),
836 FLAG_ENTRY0("bad_preemption_err", DCCE(BAD_PREEMPTION_ERR)),
837 FLAG_ENTRY0("preemption_err", DCCE(PREEMPTION_ERR)),
838 FLAG_ENTRY0("preemptionvl15_err", DCCE(PREEMPTIONVL15_ERR)),
839 FLAG_ENTRY0("bad_vl_marker_err", DCCE(BAD_VL_MARKER_ERR)),
840 FLAG_ENTRY0("bad_dlid_target_err", DCCE(BAD_DLID_TARGET_ERR)),
841 FLAG_ENTRY0("bad_lver_err", DCCE(BAD_LVER_ERR)),
842 FLAG_ENTRY0("uncorrectable_err", DCCE(UNCORRECTABLE_ERR)),
843 FLAG_ENTRY0("bad_crdt_ack_err", DCCE(BAD_CRDT_ACK_ERR)),
844 FLAG_ENTRY0("unsup_pkt_type", DCCE(UNSUP_PKT_TYPE)),
845 FLAG_ENTRY0("bad_ctrl_flit_err", DCCE(BAD_CTRL_FLIT_ERR)),
846 FLAG_ENTRY0("event_cntr_parity_err", DCCE(EVENT_CNTR_PARITY_ERR)),
847 FLAG_ENTRY0("event_cntr_rollover_err", DCCE(EVENT_CNTR_ROLLOVER_ERR)),
848 FLAG_ENTRY0("link_err", DCCE(LINK_ERR)),
849 FLAG_ENTRY0("misc_cntr_rollover_err", DCCE(MISC_CNTR_ROLLOVER_ERR)),
850 FLAG_ENTRY0("bad_ctrl_dist_err", DCCE(BAD_CTRL_DIST_ERR)),
851 FLAG_ENTRY0("bad_tail_dist_err", DCCE(BAD_TAIL_DIST_ERR)),
852 FLAG_ENTRY0("bad_head_dist_err", DCCE(BAD_HEAD_DIST_ERR)),
853 FLAG_ENTRY0("nonvl15_state_err", DCCE(NONVL15_STATE_ERR)),
854 FLAG_ENTRY0("vl15_multi_err", DCCE(VL15_MULTI_ERR)),
855 FLAG_ENTRY0("bad_pkt_length_err", DCCE(BAD_PKT_LENGTH_ERR)),
856 FLAG_ENTRY0("unsup_vl_err", DCCE(UNSUP_VL_ERR)),
857 FLAG_ENTRY0("perm_nvl15_err", DCCE(PERM_NVL15_ERR)),
858 FLAG_ENTRY0("slid_zero_err", DCCE(SLID_ZERO_ERR)),
859 FLAG_ENTRY0("dlid_zero_err", DCCE(DLID_ZERO_ERR)),
860 FLAG_ENTRY0("length_mtu_err", DCCE(LENGTH_MTU_ERR)),
861 FLAG_ENTRY0("rx_early_drop_err", DCCE(RX_EARLY_DROP_ERR)),
862 FLAG_ENTRY0("late_short_err", DCCE(LATE_SHORT_ERR)),
863 FLAG_ENTRY0("late_long_err", DCCE(LATE_LONG_ERR)),
864 FLAG_ENTRY0("late_ebp_err", DCCE(LATE_EBP_ERR)),
865 FLAG_ENTRY0("fpe_tx_fifo_ovflw_err", DCCE(FPE_TX_FIFO_OVFLW_ERR)),
866 FLAG_ENTRY0("fpe_tx_fifo_unflw_err", DCCE(FPE_TX_FIFO_UNFLW_ERR)),
867 FLAG_ENTRY0("csr_access_blocked_host", DCCE(CSR_ACCESS_BLOCKED_HOST)),
868 FLAG_ENTRY0("csr_access_blocked_uc", DCCE(CSR_ACCESS_BLOCKED_UC)),
869 FLAG_ENTRY0("tx_ctrl_parity_err", DCCE(TX_CTRL_PARITY_ERR)),
870 FLAG_ENTRY0("tx_ctrl_parity_mbe_err", DCCE(TX_CTRL_PARITY_MBE_ERR)),
871 FLAG_ENTRY0("tx_sc_parity_err", DCCE(TX_SC_PARITY_ERR)),
872 FLAG_ENTRY0("rx_ctrl_parity_mbe_err", DCCE(RX_CTRL_PARITY_MBE_ERR)),
873 FLAG_ENTRY0("csr_parity_err", DCCE(CSR_PARITY_ERR)),
874 FLAG_ENTRY0("csr_inval_addr", DCCE(CSR_INVAL_ADDR)),
875 FLAG_ENTRY0("tx_byte_shft_parity_err", DCCE(TX_BYTE_SHFT_PARITY_ERR)),
876 FLAG_ENTRY0("rx_byte_shft_parity_err", DCCE(RX_BYTE_SHFT_PARITY_ERR)),
877 FLAG_ENTRY0("fmconfig_err", DCCE(FMCONFIG_ERR)),
878 FLAG_ENTRY0("rcvport_err", DCCE(RCVPORT_ERR)),
879};
880
881/*
882 * LCB error flags
883 */
884#define LCBE(name) DC_LCB_ERR_FLG_##name##_SMASK
885static struct flag_table lcb_err_flags[] = {
886/* 0*/ FLAG_ENTRY0("CSR_PARITY_ERR", LCBE(CSR_PARITY_ERR)),
887/* 1*/ FLAG_ENTRY0("INVALID_CSR_ADDR", LCBE(INVALID_CSR_ADDR)),
888/* 2*/ FLAG_ENTRY0("RST_FOR_FAILED_DESKEW", LCBE(RST_FOR_FAILED_DESKEW)),
889/* 3*/ FLAG_ENTRY0("ALL_LNS_FAILED_REINIT_TEST",
890 LCBE(ALL_LNS_FAILED_REINIT_TEST)),
891/* 4*/ FLAG_ENTRY0("LOST_REINIT_STALL_OR_TOS", LCBE(LOST_REINIT_STALL_OR_TOS)),
892/* 5*/ FLAG_ENTRY0("TX_LESS_THAN_FOUR_LNS", LCBE(TX_LESS_THAN_FOUR_LNS)),
893/* 6*/ FLAG_ENTRY0("RX_LESS_THAN_FOUR_LNS", LCBE(RX_LESS_THAN_FOUR_LNS)),
894/* 7*/ FLAG_ENTRY0("SEQ_CRC_ERR", LCBE(SEQ_CRC_ERR)),
895/* 8*/ FLAG_ENTRY0("REINIT_FROM_PEER", LCBE(REINIT_FROM_PEER)),
896/* 9*/ FLAG_ENTRY0("REINIT_FOR_LN_DEGRADE", LCBE(REINIT_FOR_LN_DEGRADE)),
897/*10*/ FLAG_ENTRY0("CRC_ERR_CNT_HIT_LIMIT", LCBE(CRC_ERR_CNT_HIT_LIMIT)),
898/*11*/ FLAG_ENTRY0("RCLK_STOPPED", LCBE(RCLK_STOPPED)),
899/*12*/ FLAG_ENTRY0("UNEXPECTED_REPLAY_MARKER", LCBE(UNEXPECTED_REPLAY_MARKER)),
900/*13*/ FLAG_ENTRY0("UNEXPECTED_ROUND_TRIP_MARKER",
901 LCBE(UNEXPECTED_ROUND_TRIP_MARKER)),
902/*14*/ FLAG_ENTRY0("ILLEGAL_NULL_LTP", LCBE(ILLEGAL_NULL_LTP)),
903/*15*/ FLAG_ENTRY0("ILLEGAL_FLIT_ENCODING", LCBE(ILLEGAL_FLIT_ENCODING)),
904/*16*/ FLAG_ENTRY0("FLIT_INPUT_BUF_OFLW", LCBE(FLIT_INPUT_BUF_OFLW)),
905/*17*/ FLAG_ENTRY0("VL_ACK_INPUT_BUF_OFLW", LCBE(VL_ACK_INPUT_BUF_OFLW)),
906/*18*/ FLAG_ENTRY0("VL_ACK_INPUT_PARITY_ERR", LCBE(VL_ACK_INPUT_PARITY_ERR)),
907/*19*/ FLAG_ENTRY0("VL_ACK_INPUT_WRONG_CRC_MODE",
908 LCBE(VL_ACK_INPUT_WRONG_CRC_MODE)),
909/*20*/ FLAG_ENTRY0("FLIT_INPUT_BUF_MBE", LCBE(FLIT_INPUT_BUF_MBE)),
910/*21*/ FLAG_ENTRY0("FLIT_INPUT_BUF_SBE", LCBE(FLIT_INPUT_BUF_SBE)),
911/*22*/ FLAG_ENTRY0("REPLAY_BUF_MBE", LCBE(REPLAY_BUF_MBE)),
912/*23*/ FLAG_ENTRY0("REPLAY_BUF_SBE", LCBE(REPLAY_BUF_SBE)),
913/*24*/ FLAG_ENTRY0("CREDIT_RETURN_FLIT_MBE", LCBE(CREDIT_RETURN_FLIT_MBE)),
914/*25*/ FLAG_ENTRY0("RST_FOR_LINK_TIMEOUT", LCBE(RST_FOR_LINK_TIMEOUT)),
915/*26*/ FLAG_ENTRY0("RST_FOR_INCOMPLT_RND_TRIP",
916 LCBE(RST_FOR_INCOMPLT_RND_TRIP)),
917/*27*/ FLAG_ENTRY0("HOLD_REINIT", LCBE(HOLD_REINIT)),
918/*28*/ FLAG_ENTRY0("NEG_EDGE_LINK_TRANSFER_ACTIVE",
919 LCBE(NEG_EDGE_LINK_TRANSFER_ACTIVE)),
920/*29*/ FLAG_ENTRY0("REDUNDANT_FLIT_PARITY_ERR",
921 LCBE(REDUNDANT_FLIT_PARITY_ERR))
922};
923
924/*
925 * DC8051 Error Flags
926 */
927#define D8E(name) DC_DC8051_ERR_FLG_##name##_SMASK
928static struct flag_table dc8051_err_flags[] = {
929 FLAG_ENTRY0("SET_BY_8051", D8E(SET_BY_8051)),
930 FLAG_ENTRY0("LOST_8051_HEART_BEAT", D8E(LOST_8051_HEART_BEAT)),
931 FLAG_ENTRY0("CRAM_MBE", D8E(CRAM_MBE)),
932 FLAG_ENTRY0("CRAM_SBE", D8E(CRAM_SBE)),
933 FLAG_ENTRY0("DRAM_MBE", D8E(DRAM_MBE)),
934 FLAG_ENTRY0("DRAM_SBE", D8E(DRAM_SBE)),
935 FLAG_ENTRY0("IRAM_MBE", D8E(IRAM_MBE)),
936 FLAG_ENTRY0("IRAM_SBE", D8E(IRAM_SBE)),
937 FLAG_ENTRY0("UNMATCHED_SECURE_MSG_ACROSS_BCC_LANES",
938 D8E(UNMATCHED_SECURE_MSG_ACROSS_BCC_LANES)),
939 FLAG_ENTRY0("INVALID_CSR_ADDR", D8E(INVALID_CSR_ADDR)),
940};
941
942/*
943 * DC8051 Information Error flags
944 *
945 * Flags in DC8051_DBG_ERR_INFO_SET_BY_8051.ERROR field.
946 */
947static struct flag_table dc8051_info_err_flags[] = {
948 FLAG_ENTRY0("Spico ROM check failed", SPICO_ROM_FAILED),
949 FLAG_ENTRY0("Unknown frame received", UNKNOWN_FRAME),
950 FLAG_ENTRY0("Target BER not met", TARGET_BER_NOT_MET),
951 FLAG_ENTRY0("Serdes internal loopback failure",
952 FAILED_SERDES_INTERNAL_LOOPBACK),
953 FLAG_ENTRY0("Failed SerDes init", FAILED_SERDES_INIT),
954 FLAG_ENTRY0("Failed LNI(Polling)", FAILED_LNI_POLLING),
955 FLAG_ENTRY0("Failed LNI(Debounce)", FAILED_LNI_DEBOUNCE),
956 FLAG_ENTRY0("Failed LNI(EstbComm)", FAILED_LNI_ESTBCOMM),
957 FLAG_ENTRY0("Failed LNI(OptEq)", FAILED_LNI_OPTEQ),
958 FLAG_ENTRY0("Failed LNI(VerifyCap_1)", FAILED_LNI_VERIFY_CAP1),
959 FLAG_ENTRY0("Failed LNI(VerifyCap_2)", FAILED_LNI_VERIFY_CAP2),
960 FLAG_ENTRY0("Failed LNI(ConfigLT)", FAILED_LNI_CONFIGLT)
961};
962
963/*
964 * DC8051 Information Host Information flags
965 *
966 * Flags in DC8051_DBG_ERR_INFO_SET_BY_8051.HOST_MSG field.
967 */
968static struct flag_table dc8051_info_host_msg_flags[] = {
969 FLAG_ENTRY0("Host request done", 0x0001),
970 FLAG_ENTRY0("BC SMA message", 0x0002),
971 FLAG_ENTRY0("BC PWR_MGM message", 0x0004),
972 FLAG_ENTRY0("BC Unknown message (BCC)", 0x0008),
973 FLAG_ENTRY0("BC Unknown message (LCB)", 0x0010),
974 FLAG_ENTRY0("External device config request", 0x0020),
975 FLAG_ENTRY0("VerifyCap all frames received", 0x0040),
976 FLAG_ENTRY0("LinkUp achieved", 0x0080),
977 FLAG_ENTRY0("Link going down", 0x0100),
978};
979
980
981static u32 encoded_size(u32 size);
982static u32 chip_to_opa_lstate(struct hfi1_devdata *dd, u32 chip_lstate);
983static int set_physical_link_state(struct hfi1_devdata *dd, u64 state);
984static void read_vc_remote_phy(struct hfi1_devdata *dd, u8 *power_management,
985 u8 *continuous);
986static void read_vc_remote_fabric(struct hfi1_devdata *dd, u8 *vau, u8 *z,
987 u8 *vcu, u16 *vl15buf, u8 *crc_sizes);
988static void read_vc_remote_link_width(struct hfi1_devdata *dd,
989 u8 *remote_tx_rate, u16 *link_widths);
990static void read_vc_local_link_width(struct hfi1_devdata *dd, u8 *misc_bits,
991 u8 *flag_bits, u16 *link_widths);
992static void read_remote_device_id(struct hfi1_devdata *dd, u16 *device_id,
993 u8 *device_rev);
994static void read_mgmt_allowed(struct hfi1_devdata *dd, u8 *mgmt_allowed);
995static void read_local_lni(struct hfi1_devdata *dd, u8 *enable_lane_rx);
996static int read_tx_settings(struct hfi1_devdata *dd, u8 *enable_lane_tx,
997 u8 *tx_polarity_inversion,
998 u8 *rx_polarity_inversion, u8 *max_rate);
999static void handle_sdma_eng_err(struct hfi1_devdata *dd,
1000 unsigned int context, u64 err_status);
1001static void handle_qsfp_int(struct hfi1_devdata *dd, u32 source, u64 reg);
1002static void handle_dcc_err(struct hfi1_devdata *dd,
1003 unsigned int context, u64 err_status);
1004static void handle_lcb_err(struct hfi1_devdata *dd,
1005 unsigned int context, u64 err_status);
1006static void handle_8051_interrupt(struct hfi1_devdata *dd, u32 unused, u64 reg);
1007static void handle_cce_err(struct hfi1_devdata *dd, u32 unused, u64 reg);
1008static void handle_rxe_err(struct hfi1_devdata *dd, u32 unused, u64 reg);
1009static void handle_misc_err(struct hfi1_devdata *dd, u32 unused, u64 reg);
1010static void handle_pio_err(struct hfi1_devdata *dd, u32 unused, u64 reg);
1011static void handle_sdma_err(struct hfi1_devdata *dd, u32 unused, u64 reg);
1012static void handle_egress_err(struct hfi1_devdata *dd, u32 unused, u64 reg);
1013static void handle_txe_err(struct hfi1_devdata *dd, u32 unused, u64 reg);
1014static void set_partition_keys(struct hfi1_pportdata *);
1015static const char *link_state_name(u32 state);
1016static const char *link_state_reason_name(struct hfi1_pportdata *ppd,
1017 u32 state);
1018static int do_8051_command(struct hfi1_devdata *dd, u32 type, u64 in_data,
1019 u64 *out_data);
1020static int read_idle_sma(struct hfi1_devdata *dd, u64 *data);
1021static int thermal_init(struct hfi1_devdata *dd);
1022
1023static int wait_logical_linkstate(struct hfi1_pportdata *ppd, u32 state,
1024 int msecs);
1025static void read_planned_down_reason_code(struct hfi1_devdata *dd, u8 *pdrrc);
1026static void handle_temp_err(struct hfi1_devdata *);
1027static void dc_shutdown(struct hfi1_devdata *);
1028static void dc_start(struct hfi1_devdata *);
1029
1030/*
1031 * Error interrupt table entry. This is used as input to the interrupt
1032 * "clear down" routine used for all second tier error interrupt register.
1033 * Second tier interrupt registers have a single bit representing them
1034 * in the top-level CceIntStatus.
1035 */
1036struct err_reg_info {
1037 u32 status; /* status CSR offset */
1038 u32 clear; /* clear CSR offset */
1039 u32 mask; /* mask CSR offset */
1040 void (*handler)(struct hfi1_devdata *dd, u32 source, u64 reg);
1041 const char *desc;
1042};
1043
1044#define NUM_MISC_ERRS (IS_GENERAL_ERR_END - IS_GENERAL_ERR_START)
1045#define NUM_DC_ERRS (IS_DC_END - IS_DC_START)
1046#define NUM_VARIOUS (IS_VARIOUS_END - IS_VARIOUS_START)
1047
1048/*
1049 * Helpers for building HFI and DC error interrupt table entries. Different
1050 * helpers are needed because of inconsistent register names.
1051 */
1052#define EE(reg, handler, desc) \
1053 { reg##_STATUS, reg##_CLEAR, reg##_MASK, \
1054 handler, desc }
1055#define DC_EE1(reg, handler, desc) \
1056 { reg##_FLG, reg##_FLG_CLR, reg##_FLG_EN, handler, desc }
1057#define DC_EE2(reg, handler, desc) \
1058 { reg##_FLG, reg##_CLR, reg##_EN, handler, desc }
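/*
 * Example expansion, for reference: EE(CCE_ERR, handle_cce_err, "CceErr")
 * becomes { CCE_ERR_STATUS, CCE_ERR_CLEAR, CCE_ERR_MASK, handle_cce_err,
 * "CceErr" }, i.e. the status/clear/mask CSR triple plus the handler the
 * common clear-down code calls for that second-tier source. DC_EE1/DC_EE2
 * exist only because the DC blocks name their clear/enable CSRs
 * differently.
 */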
1059
1060/*
1061 * Table of the "misc" grouping of error interrupts. Each entry refers to
1062 * another register containing more information.
1063 */
1064static const struct err_reg_info misc_errs[NUM_MISC_ERRS] = {
1065/* 0*/ EE(CCE_ERR, handle_cce_err, "CceErr"),
1066/* 1*/ EE(RCV_ERR, handle_rxe_err, "RxeErr"),
1067/* 2*/ EE(MISC_ERR, handle_misc_err, "MiscErr"),
1068/* 3*/ { 0, 0, 0, NULL }, /* reserved */
1069/* 4*/ EE(SEND_PIO_ERR, handle_pio_err, "PioErr"),
1070/* 5*/ EE(SEND_DMA_ERR, handle_sdma_err, "SDmaErr"),
1071/* 6*/ EE(SEND_EGRESS_ERR, handle_egress_err, "EgressErr"),
1072/* 7*/ EE(SEND_ERR, handle_txe_err, "TxeErr")
1073 /* the rest are reserved */
1074};
1075
1076/*
1077 * Index into the Various section of the interrupt sources
1078 * corresponding to the Critical Temperature interrupt.
1079 */
1080#define TCRIT_INT_SOURCE 4
1081
1082/*
1083 * SDMA error interrupt entry - refers to another register containing more
1084 * information.
1085 */
1086static const struct err_reg_info sdma_eng_err =
1087 EE(SEND_DMA_ENG_ERR, handle_sdma_eng_err, "SDmaEngErr");
1088
1089static const struct err_reg_info various_err[NUM_VARIOUS] = {
1090/* 0*/ { 0, 0, 0, NULL }, /* PbcInt */
1091/* 1*/ { 0, 0, 0, NULL }, /* GpioAssertInt */
1092/* 2*/ EE(ASIC_QSFP1, handle_qsfp_int, "QSFP1"),
1093/* 3*/ EE(ASIC_QSFP2, handle_qsfp_int, "QSFP2"),
1094/* 4*/ { 0, 0, 0, NULL }, /* TCritInt */
1095 /* rest are reserved */
1096};
1097
1098/*
1099 * The DC encoding of mtu_cap for 10K MTU in the DCC_CFG_PORT_CONFIG
1100 * register can not be derived from the MTU value because 10K is not
1101 * a power of 2. Therefore, we need a constant. Everything else can
1102 * be calculated.
1103 */
1104#define DCC_CFG_PORT_MTU_CAP_10240 7
1105
1106/*
1107 * Table of the DC grouping of error interrupts. Each entry refers to
1108 * another register containing more information.
1109 */
1110static const struct err_reg_info dc_errs[NUM_DC_ERRS] = {
1111/* 0*/ DC_EE1(DCC_ERR, handle_dcc_err, "DCC Err"),
1112/* 1*/ DC_EE2(DC_LCB_ERR, handle_lcb_err, "LCB Err"),
1113/* 2*/ DC_EE2(DC_DC8051_ERR, handle_8051_interrupt, "DC8051 Interrupt"),
1114/* 3*/ /* dc_lbm_int - special, see is_dc_int() */
1115 /* the rest are reserved */
1116};
1117
1118struct cntr_entry {
1119 /*
1120 * counter name
1121 */
1122 char *name;
1123
1124 /*
1125 * csr to read for name (if applicable)
1126 */
1127 u64 csr;
1128
1129 /*
1130 * offset into dd or ppd to store the counter's value
1131 */
1132 int offset;
1133
1134 /*
1135 * flags
1136 */
1137 u8 flags;
1138
1139 /*
1140 * accessor for stat element, context either dd or ppd
1141 */
1142 u64 (*rw_cntr)(const struct cntr_entry *,
1143 void *context,
1144 int vl,
1145 int mode,
1146 u64 data);
1147};
1148
1149#define C_RCV_HDR_OVF_FIRST C_RCV_HDR_OVF_0
1150#define C_RCV_HDR_OVF_LAST C_RCV_HDR_OVF_159
1151
1152#define CNTR_ELEM(name, csr, offset, flags, accessor) \
1153{ \
1154 name, \
1155 csr, \
1156 offset, \
1157 flags, \
1158 accessor \
1159}
1160
1161/* 32bit RXE */
1162#define RXE32_PORT_CNTR_ELEM(name, counter, flags) \
1163CNTR_ELEM(#name, \
1164 (counter * 8 + RCV_COUNTER_ARRAY32), \
1165 0, flags | CNTR_32BIT, \
1166 port_access_u32_csr)
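/*
 * Note on addressing: each hardware counter occupies an 8-byte CSR slot,
 * so "counter * 8 + <array base>" is the byte offset of that entry in the
 * RcvCounterArray32 block, and CNTR_32BIT marks the value as a 32-bit
 * counter for the generic counter code. The 64-bit RXE and the TXE/CCE
 * helpers below follow the same pattern against their own counter arrays.
 */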
1167
1168#define RXE32_DEV_CNTR_ELEM(name, counter, flags) \
1169CNTR_ELEM(#name, \
1170 (counter * 8 + RCV_COUNTER_ARRAY32), \
1171 0, flags | CNTR_32BIT, \
1172 dev_access_u32_csr)
1173
1174/* 64bit RXE */
1175#define RXE64_PORT_CNTR_ELEM(name, counter, flags) \
1176CNTR_ELEM(#name, \
1177 (counter * 8 + RCV_COUNTER_ARRAY64), \
1178 0, flags, \
1179 port_access_u64_csr)
1180
1181#define RXE64_DEV_CNTR_ELEM(name, counter, flags) \
1182CNTR_ELEM(#name, \
1183 (counter * 8 + RCV_COUNTER_ARRAY64), \
1184 0, flags, \
1185 dev_access_u64_csr)
1186
1187#define OVR_LBL(ctx) C_RCV_HDR_OVF_ ## ctx
1188#define OVR_ELM(ctx) \
1189CNTR_ELEM("RcvHdrOvr" #ctx, \
1190 (RCV_HDR_OVFL_CNT + ctx*0x100), \
1191 0, CNTR_NORMAL, port_access_u64_csr)
1192
1193/* 32bit TXE */
1194#define TXE32_PORT_CNTR_ELEM(name, counter, flags) \
1195CNTR_ELEM(#name, \
1196 (counter * 8 + SEND_COUNTER_ARRAY32), \
1197 0, flags | CNTR_32BIT, \
1198 port_access_u32_csr)
1199
1200/* 64bit TXE */
1201#define TXE64_PORT_CNTR_ELEM(name, counter, flags) \
1202CNTR_ELEM(#name, \
1203 (counter * 8 + SEND_COUNTER_ARRAY64), \
1204 0, flags, \
1205 port_access_u64_csr)
1206
1207# define TX64_DEV_CNTR_ELEM(name, counter, flags) \
1208CNTR_ELEM(#name,\
1209 counter * 8 + SEND_COUNTER_ARRAY64, \
1210 0, \
1211 flags, \
1212 dev_access_u64_csr)
1213
1214/* CCE */
1215#define CCE_PERF_DEV_CNTR_ELEM(name, counter, flags) \
1216CNTR_ELEM(#name, \
1217 (counter * 8 + CCE_COUNTER_ARRAY32), \
1218 0, flags | CNTR_32BIT, \
1219 dev_access_u32_csr)
1220
1221#define CCE_INT_DEV_CNTR_ELEM(name, counter, flags) \
1222CNTR_ELEM(#name, \
1223 (counter * 8 + CCE_INT_COUNTER_ARRAY32), \
1224 0, flags | CNTR_32BIT, \
1225 dev_access_u32_csr)
1226
1227/* DC */
1228#define DC_PERF_CNTR(name, counter, flags) \
1229CNTR_ELEM(#name, \
1230 counter, \
1231 0, \
1232 flags, \
1233 dev_access_u64_csr)
1234
1235#define DC_PERF_CNTR_LCB(name, counter, flags) \
1236CNTR_ELEM(#name, \
1237 counter, \
1238 0, \
1239 flags, \
1240 dc_access_lcb_cntr)
1241
1242/* ibp counters */
1243#define SW_IBP_CNTR(name, cntr) \
1244CNTR_ELEM(#name, \
1245 0, \
1246 0, \
1247 CNTR_SYNTH, \
1248 access_ibp_##cntr)
1249
1250u64 read_csr(const struct hfi1_devdata *dd, u32 offset)
1251{
1252 u64 val;
1253
1254 if (dd->flags & HFI1_PRESENT) {
1255 val = readq((void __iomem *)dd->kregbase + offset);
1256 return val;
1257 }
1258 return -1;
1259}
1260
1261void write_csr(const struct hfi1_devdata *dd, u32 offset, u64 value)
1262{
1263 if (dd->flags & HFI1_PRESENT)
1264 writeq(value, (void __iomem *)dd->kregbase + offset);
1265}
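/*
 * Both accessors above tolerate a missing device: when HFI1_PRESENT is
 * clear (e.g. after a reset or removal), read_csr() returns all ones and
 * write_csr() is a no-op, so callers need not guard each CSR access.
 * Minimal usage sketch, assuming an offset from chip_registers.h:
 *
 *	u64 rev = read_csr(dd, CCE_REVISION);
 */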
1266
1267void __iomem *get_csr_addr(
1268 struct hfi1_devdata *dd,
1269 u32 offset)
1270{
1271 return (void __iomem *)dd->kregbase + offset;
1272}
1273
1274static inline u64 read_write_csr(const struct hfi1_devdata *dd, u32 csr,
1275 int mode, u64 value)
1276{
1277 u64 ret;
1278
1279
1280 if (mode == CNTR_MODE_R) {
1281 ret = read_csr(dd, csr);
1282 } else if (mode == CNTR_MODE_W) {
1283 write_csr(dd, csr, value);
1284 ret = value;
1285 } else {
1286 dd_dev_err(dd, "Invalid cntr register access mode");
1287 return 0;
1288 }
1289
1290 hfi1_cdbg(CNTR, "csr 0x%x val 0x%llx mode %d", csr, ret, mode);
1291 return ret;
1292}
1293
1294/* Dev Access */
1295static u64 dev_access_u32_csr(const struct cntr_entry *entry,
1296 void *context, int vl, int mode, u64 data)
1297{
1298 struct hfi1_devdata *dd = context;
1299
1300 if (vl != CNTR_INVALID_VL)
1301 return 0;
1302 return read_write_csr(dd, entry->csr, mode, data);
1303}
1304
1305static u64 dev_access_u64_csr(const struct cntr_entry *entry, void *context,
1306 int vl, int mode, u64 data)
1307{
1308 struct hfi1_devdata *dd = context;
1309
1310 u64 val = 0;
1311 u64 csr = entry->csr;
1312
1313 if (entry->flags & CNTR_VL) {
1314 if (vl == CNTR_INVALID_VL)
1315 return 0;
1316 csr += 8 * vl;
1317 } else {
1318 if (vl != CNTR_INVALID_VL)
1319 return 0;
1320 }
1321
1322 val = read_write_csr(dd, csr, mode, data);
1323 return val;
1324}
1325
1326static u64 dc_access_lcb_cntr(const struct cntr_entry *entry, void *context,
1327 int vl, int mode, u64 data)
1328{
1329 struct hfi1_devdata *dd = context;
1330 u32 csr = entry->csr;
1331 int ret = 0;
1332
1333 if (vl != CNTR_INVALID_VL)
1334 return 0;
1335 if (mode == CNTR_MODE_R)
1336 ret = read_lcb_csr(dd, csr, &data);
1337 else if (mode == CNTR_MODE_W)
1338 ret = write_lcb_csr(dd, csr, data);
1339
1340 if (ret) {
1341 dd_dev_err(dd, "Could not acquire LCB for counter 0x%x", csr);
1342 return 0;
1343 }
1344
1345 hfi1_cdbg(CNTR, "csr 0x%x val 0x%llx mode %d", csr, data, mode);
1346 return data;
1347}
1348
1349/* Port Access */
1350static u64 port_access_u32_csr(const struct cntr_entry *entry, void *context,
1351 int vl, int mode, u64 data)
1352{
1353 struct hfi1_pportdata *ppd = context;
1354
1355 if (vl != CNTR_INVALID_VL)
1356 return 0;
1357 return read_write_csr(ppd->dd, entry->csr, mode, data);
1358}
1359
1360static u64 port_access_u64_csr(const struct cntr_entry *entry,
1361 void *context, int vl, int mode, u64 data)
1362{
1363 struct hfi1_pportdata *ppd = context;
1364 u64 val;
1365 u64 csr = entry->csr;
1366
1367 if (entry->flags & CNTR_VL) {
1368 if (vl == CNTR_INVALID_VL)
1369 return 0;
1370 csr += 8 * vl;
1371 } else {
1372 if (vl != CNTR_INVALID_VL)
1373 return 0;
1374 }
1375 val = read_write_csr(ppd->dd, csr, mode, data);
1376 return val;
1377}
1378
1379/* Software defined */
1380static inline u64 read_write_sw(struct hfi1_devdata *dd, u64 *cntr, int mode,
1381 u64 data)
1382{
1383 u64 ret;
1384
1385 if (mode == CNTR_MODE_R) {
1386 ret = *cntr;
1387 } else if (mode == CNTR_MODE_W) {
1388 *cntr = data;
1389 ret = data;
1390 } else {
1391 dd_dev_err(dd, "Invalid cntr sw access mode");
1392 return 0;
1393 }
1394
1395 hfi1_cdbg(CNTR, "val 0x%llx mode %d", ret, mode);
1396
1397 return ret;
1398}
1399
1400static u64 access_sw_link_dn_cnt(const struct cntr_entry *entry, void *context,
1401 int vl, int mode, u64 data)
1402{
1403 struct hfi1_pportdata *ppd = context;
1404
1405 if (vl != CNTR_INVALID_VL)
1406 return 0;
1407 return read_write_sw(ppd->dd, &ppd->link_downed, mode, data);
1408}
1409
1410static u64 access_sw_link_up_cnt(const struct cntr_entry *entry, void *context,
1411 int vl, int mode, u64 data)
1412{
1413 struct hfi1_pportdata *ppd = context;
1414
1415 if (vl != CNTR_INVALID_VL)
1416 return 0;
1417 return read_write_sw(ppd->dd, &ppd->link_up, mode, data);
1418}
1419
1420static u64 access_sw_xmit_discards(const struct cntr_entry *entry,
1421 void *context, int vl, int mode, u64 data)
1422{
1423 struct hfi1_pportdata *ppd = context;
1424
1425 if (vl != CNTR_INVALID_VL)
1426 return 0;
1427
1428 return read_write_sw(ppd->dd, &ppd->port_xmit_discards, mode, data);
1429}
1430
1431static u64 access_xmit_constraint_errs(const struct cntr_entry *entry,
1432 void *context, int vl, int mode, u64 data)
1433{
1434 struct hfi1_pportdata *ppd = context;
1435
1436 if (vl != CNTR_INVALID_VL)
1437 return 0;
1438
1439 return read_write_sw(ppd->dd, &ppd->port_xmit_constraint_errors,
1440 mode, data);
1441}
1442
1443static u64 access_rcv_constraint_errs(const struct cntr_entry *entry,
1444 void *context, int vl, int mode, u64 data)
1445{
1446 struct hfi1_pportdata *ppd = context;
1447
1448 if (vl != CNTR_INVALID_VL)
1449 return 0;
1450
1451 return read_write_sw(ppd->dd, &ppd->port_rcv_constraint_errors,
1452 mode, data);
1453}
1454
1455u64 get_all_cpu_total(u64 __percpu *cntr)
1456{
1457 int cpu;
1458 u64 counter = 0;
1459
1460 for_each_possible_cpu(cpu)
1461 counter += *per_cpu_ptr(cntr, cpu);
1462 return counter;
1463}
1464
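/*
 * The per-CPU counters are never cleared in place.  A read reports the
 * aggregate total across all possible CPUs minus the saved baseline
 * (*z_val); a write of zero simply advances the baseline to the current
 * total.
 */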
1465static u64 read_write_cpu(struct hfi1_devdata *dd, u64 *z_val,
1466 u64 __percpu *cntr,
1467 int vl, int mode, u64 data)
1468{
1469
1470 u64 ret = 0;
1471
1472 if (vl != CNTR_INVALID_VL)
1473 return 0;
1474
1475 if (mode == CNTR_MODE_R) {
1476 ret = get_all_cpu_total(cntr) - *z_val;
1477 } else if (mode == CNTR_MODE_W) {
1478 /* A write can only zero the counter */
1479 if (data == 0)
1480 *z_val = get_all_cpu_total(cntr);
1481 else
1482 dd_dev_err(dd, "Per CPU cntrs can only be zeroed");
1483 } else {
1484 dd_dev_err(dd, "Invalid cntr sw cpu access mode");
1485 return 0;
1486 }
1487
1488 return ret;
1489}
1490
1491static u64 access_sw_cpu_intr(const struct cntr_entry *entry,
1492 void *context, int vl, int mode, u64 data)
1493{
1494 struct hfi1_devdata *dd = context;
1495
1496 return read_write_cpu(dd, &dd->z_int_counter, dd->int_counter, vl,
1497 mode, data);
1498}
1499
1500static u64 access_sw_cpu_rcv_limit(const struct cntr_entry *entry,
1501 void *context, int vl, int mode, u64 data)
1502{
1503 struct hfi1_devdata *dd = context;
1504
1505 return read_write_cpu(dd, &dd->z_rcv_limit, dd->rcv_limit, vl,
1506 mode, data);
1507}
1508
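/*
 * The verbs wait counters below are plain software totals taken from
 * verbs_dev; vl and mode are ignored, so they cannot be zeroed through
 * this interface.
 */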
1509static u64 access_sw_pio_wait(const struct cntr_entry *entry,
1510 void *context, int vl, int mode, u64 data)
1511{
1512 struct hfi1_devdata *dd = context;
1513
1514 return dd->verbs_dev.n_piowait;
1515}
1516
1517static u64 access_sw_vtx_wait(const struct cntr_entry *entry,
1518 void *context, int vl, int mode, u64 data)
1519{
1520 struct hfi1_devdata *dd = context;
1521
1522 return dd->verbs_dev.n_txwait;
1523}
1524
1525static u64 access_sw_kmem_wait(const struct cntr_entry *entry,
1526 void *context, int vl, int mode, u64 data)
1527{
1528 struct hfi1_devdata *dd = context;
1529
1530 return dd->verbs_dev.n_kmem_wait;
1531}
1532
1533static u64 access_sw_send_schedule(const struct cntr_entry *entry,
1534 void *context, int vl, int mode, u64 data)
1535{
1536 struct hfi1_devdata *dd = (struct hfi1_devdata *)context;
1537
1538 return dd->verbs_dev.n_send_schedule;
1539}
1540
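/*
 * Generate a per-CPU counter accessor for a per-port ibport_data field;
 * the zero baseline for <cntr> is kept in ibport_data.z_<cntr>.
 */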
1541#define def_access_sw_cpu(cntr) \
1542static u64 access_sw_cpu_##cntr(const struct cntr_entry *entry, \
1543 void *context, int vl, int mode, u64 data) \
1544{ \
1545 struct hfi1_pportdata *ppd = (struct hfi1_pportdata *)context; \
1546 return read_write_cpu(ppd->dd, &ppd->ibport_data.z_ ##cntr, \
1547 ppd->ibport_data.cntr, vl, \
1548 mode, data); \
1549}
1550
1551def_access_sw_cpu(rc_acks);
1552def_access_sw_cpu(rc_qacks);
1553def_access_sw_cpu(rc_delayed_comp);
1554
1555#define def_access_ibp_counter(cntr) \
1556static u64 access_ibp_##cntr(const struct cntr_entry *entry, \
1557 void *context, int vl, int mode, u64 data) \
1558{ \
1559 struct hfi1_pportdata *ppd = (struct hfi1_pportdata *)context; \
1560 \
1561 if (vl != CNTR_INVALID_VL) \
1562 return 0; \
1563 \
1564 return read_write_sw(ppd->dd, &ppd->ibport_data.n_ ##cntr, \
1565 mode, data); \
1566}
1567
1568def_access_ibp_counter(loop_pkts);
1569def_access_ibp_counter(rc_resends);
1570def_access_ibp_counter(rnr_naks);
1571def_access_ibp_counter(other_naks);
1572def_access_ibp_counter(rc_timeouts);
1573def_access_ibp_counter(pkt_drops);
1574def_access_ibp_counter(dmawait);
1575def_access_ibp_counter(rc_seqnak);
1576def_access_ibp_counter(rc_dupreq);
1577def_access_ibp_counter(rdma_seq);
1578def_access_ibp_counter(unaligned);
1579def_access_ibp_counter(seq_naks);
1580
1581static struct cntr_entry dev_cntrs[DEV_CNTR_LAST] = {
1582[C_RCV_OVF] = RXE32_DEV_CNTR_ELEM(RcvOverflow, RCV_BUF_OVFL_CNT, CNTR_SYNTH),
1583[C_RX_TID_FULL] = RXE32_DEV_CNTR_ELEM(RxTIDFullEr, RCV_TID_FULL_ERR_CNT,
1584 CNTR_NORMAL),
1585[C_RX_TID_INVALID] = RXE32_DEV_CNTR_ELEM(RxTIDInvalid, RCV_TID_VALID_ERR_CNT,
1586 CNTR_NORMAL),
1587[C_RX_TID_FLGMS] = RXE32_DEV_CNTR_ELEM(RxTidFLGMs,
1588 RCV_TID_FLOW_GEN_MISMATCH_CNT,
1589 CNTR_NORMAL),
1590[C_RX_CTX_RHQS] = RXE32_DEV_CNTR_ELEM(RxCtxRHQS, RCV_CONTEXT_RHQ_STALL,
1591 CNTR_NORMAL),
1592[C_RX_CTX_EGRS] = RXE32_DEV_CNTR_ELEM(RxCtxEgrS, RCV_CONTEXT_EGR_STALL,
1593 CNTR_NORMAL),
1594[C_RCV_TID_FLSMS] = RXE32_DEV_CNTR_ELEM(RxTidFLSMs,
1595 RCV_TID_FLOW_SEQ_MISMATCH_CNT, CNTR_NORMAL),
1596[C_CCE_PCI_CR_ST] = CCE_PERF_DEV_CNTR_ELEM(CcePciCrSt,
1597 CCE_PCIE_POSTED_CRDT_STALL_CNT, CNTR_NORMAL),
1598[C_CCE_PCI_TR_ST] = CCE_PERF_DEV_CNTR_ELEM(CcePciTrSt, CCE_PCIE_TRGT_STALL_CNT,
1599 CNTR_NORMAL),
1600[C_CCE_PIO_WR_ST] = CCE_PERF_DEV_CNTR_ELEM(CcePioWrSt, CCE_PIO_WR_STALL_CNT,
1601 CNTR_NORMAL),
1602[C_CCE_ERR_INT] = CCE_INT_DEV_CNTR_ELEM(CceErrInt, CCE_ERR_INT_CNT,
1603 CNTR_NORMAL),
1604[C_CCE_SDMA_INT] = CCE_INT_DEV_CNTR_ELEM(CceSdmaInt, CCE_SDMA_INT_CNT,
1605 CNTR_NORMAL),
1606[C_CCE_MISC_INT] = CCE_INT_DEV_CNTR_ELEM(CceMiscInt, CCE_MISC_INT_CNT,
1607 CNTR_NORMAL),
1608[C_CCE_RCV_AV_INT] = CCE_INT_DEV_CNTR_ELEM(CceRcvAvInt, CCE_RCV_AVAIL_INT_CNT,
1609 CNTR_NORMAL),
1610[C_CCE_RCV_URG_INT] = CCE_INT_DEV_CNTR_ELEM(CceRcvUrgInt,
1611 CCE_RCV_URGENT_INT_CNT, CNTR_NORMAL),
1612[C_CCE_SEND_CR_INT] = CCE_INT_DEV_CNTR_ELEM(CceSndCrInt,
1613 CCE_SEND_CREDIT_INT_CNT, CNTR_NORMAL),
1614[C_DC_UNC_ERR] = DC_PERF_CNTR(DcUnctblErr, DCC_ERR_UNCORRECTABLE_CNT,
1615 CNTR_SYNTH),
1616[C_DC_RCV_ERR] = DC_PERF_CNTR(DcRecvErr, DCC_ERR_PORTRCV_ERR_CNT, CNTR_SYNTH),
1617[C_DC_FM_CFG_ERR] = DC_PERF_CNTR(DcFmCfgErr, DCC_ERR_FMCONFIG_ERR_CNT,
1618 CNTR_SYNTH),
1619[C_DC_RMT_PHY_ERR] = DC_PERF_CNTR(DcRmtPhyErr, DCC_ERR_RCVREMOTE_PHY_ERR_CNT,
1620 CNTR_SYNTH),
1621[C_DC_DROPPED_PKT] = DC_PERF_CNTR(DcDroppedPkt, DCC_ERR_DROPPED_PKT_CNT,
1622 CNTR_SYNTH),
1623[C_DC_MC_XMIT_PKTS] = DC_PERF_CNTR(DcMcXmitPkts,
1624 DCC_PRF_PORT_XMIT_MULTICAST_CNT, CNTR_SYNTH),
1625[C_DC_MC_RCV_PKTS] = DC_PERF_CNTR(DcMcRcvPkts,
1626 DCC_PRF_PORT_RCV_MULTICAST_PKT_CNT,
1627 CNTR_SYNTH),
1628[C_DC_XMIT_CERR] = DC_PERF_CNTR(DcXmitCorr,
1629 DCC_PRF_PORT_XMIT_CORRECTABLE_CNT, CNTR_SYNTH),
1630[C_DC_RCV_CERR] = DC_PERF_CNTR(DcRcvCorrCnt, DCC_PRF_PORT_RCV_CORRECTABLE_CNT,
1631 CNTR_SYNTH),
1632[C_DC_RCV_FCC] = DC_PERF_CNTR(DcRxFCntl, DCC_PRF_RX_FLOW_CRTL_CNT,
1633 CNTR_SYNTH),
1634[C_DC_XMIT_FCC] = DC_PERF_CNTR(DcXmitFCntl, DCC_PRF_TX_FLOW_CRTL_CNT,
1635 CNTR_SYNTH),
1636[C_DC_XMIT_FLITS] = DC_PERF_CNTR(DcXmitFlits, DCC_PRF_PORT_XMIT_DATA_CNT,
1637 CNTR_SYNTH),
1638[C_DC_RCV_FLITS] = DC_PERF_CNTR(DcRcvFlits, DCC_PRF_PORT_RCV_DATA_CNT,
1639 CNTR_SYNTH),
1640[C_DC_XMIT_PKTS] = DC_PERF_CNTR(DcXmitPkts, DCC_PRF_PORT_XMIT_PKTS_CNT,
1641 CNTR_SYNTH),
1642[C_DC_RCV_PKTS] = DC_PERF_CNTR(DcRcvPkts, DCC_PRF_PORT_RCV_PKTS_CNT,
1643 CNTR_SYNTH),
1644[C_DC_RX_FLIT_VL] = DC_PERF_CNTR(DcRxFlitVl, DCC_PRF_PORT_VL_RCV_DATA_CNT,
1645 CNTR_SYNTH | CNTR_VL),
1646[C_DC_RX_PKT_VL] = DC_PERF_CNTR(DcRxPktVl, DCC_PRF_PORT_VL_RCV_PKTS_CNT,
1647 CNTR_SYNTH | CNTR_VL),
1648[C_DC_RCV_FCN] = DC_PERF_CNTR(DcRcvFcn, DCC_PRF_PORT_RCV_FECN_CNT, CNTR_SYNTH),
1649[C_DC_RCV_FCN_VL] = DC_PERF_CNTR(DcRcvFcnVl, DCC_PRF_PORT_VL_RCV_FECN_CNT,
1650 CNTR_SYNTH | CNTR_VL),
1651[C_DC_RCV_BCN] = DC_PERF_CNTR(DcRcvBcn, DCC_PRF_PORT_RCV_BECN_CNT, CNTR_SYNTH),
1652[C_DC_RCV_BCN_VL] = DC_PERF_CNTR(DcRcvBcnVl, DCC_PRF_PORT_VL_RCV_BECN_CNT,
1653 CNTR_SYNTH | CNTR_VL),
1654[C_DC_RCV_BBL] = DC_PERF_CNTR(DcRcvBbl, DCC_PRF_PORT_RCV_BUBBLE_CNT,
1655 CNTR_SYNTH),
1656[C_DC_RCV_BBL_VL] = DC_PERF_CNTR(DcRcvBblVl, DCC_PRF_PORT_VL_RCV_BUBBLE_CNT,
1657 CNTR_SYNTH | CNTR_VL),
1658[C_DC_MARK_FECN] = DC_PERF_CNTR(DcMarkFcn, DCC_PRF_PORT_MARK_FECN_CNT,
1659 CNTR_SYNTH),
1660[C_DC_MARK_FECN_VL] = DC_PERF_CNTR(DcMarkFcnVl, DCC_PRF_PORT_VL_MARK_FECN_CNT,
1661 CNTR_SYNTH | CNTR_VL),
1662[C_DC_TOTAL_CRC] =
1663 DC_PERF_CNTR_LCB(DcTotCrc, DC_LCB_ERR_INFO_TOTAL_CRC_ERR,
1664 CNTR_SYNTH),
1665[C_DC_CRC_LN0] = DC_PERF_CNTR_LCB(DcCrcLn0, DC_LCB_ERR_INFO_CRC_ERR_LN0,
1666 CNTR_SYNTH),
1667[C_DC_CRC_LN1] = DC_PERF_CNTR_LCB(DcCrcLn1, DC_LCB_ERR_INFO_CRC_ERR_LN1,
1668 CNTR_SYNTH),
1669[C_DC_CRC_LN2] = DC_PERF_CNTR_LCB(DcCrcLn2, DC_LCB_ERR_INFO_CRC_ERR_LN2,
1670 CNTR_SYNTH),
1671[C_DC_CRC_LN3] = DC_PERF_CNTR_LCB(DcCrcLn3, DC_LCB_ERR_INFO_CRC_ERR_LN3,
1672 CNTR_SYNTH),
1673[C_DC_CRC_MULT_LN] =
1674 DC_PERF_CNTR_LCB(DcMultLn, DC_LCB_ERR_INFO_CRC_ERR_MULTI_LN,
1675 CNTR_SYNTH),
1676[C_DC_TX_REPLAY] = DC_PERF_CNTR_LCB(DcTxReplay, DC_LCB_ERR_INFO_TX_REPLAY_CNT,
1677 CNTR_SYNTH),
1678[C_DC_RX_REPLAY] = DC_PERF_CNTR_LCB(DcRxReplay, DC_LCB_ERR_INFO_RX_REPLAY_CNT,
1679 CNTR_SYNTH),
1680[C_DC_SEQ_CRC_CNT] =
1681 DC_PERF_CNTR_LCB(DcLinkSeqCrc, DC_LCB_ERR_INFO_SEQ_CRC_CNT,
1682 CNTR_SYNTH),
1683[C_DC_ESC0_ONLY_CNT] =
1684 DC_PERF_CNTR_LCB(DcEsc0, DC_LCB_ERR_INFO_ESCAPE_0_ONLY_CNT,
1685 CNTR_SYNTH),
1686[C_DC_ESC0_PLUS1_CNT] =
1687 DC_PERF_CNTR_LCB(DcEsc1, DC_LCB_ERR_INFO_ESCAPE_0_PLUS1_CNT,
1688 CNTR_SYNTH),
1689[C_DC_ESC0_PLUS2_CNT] =
1690 DC_PERF_CNTR_LCB(DcEsc0Plus2, DC_LCB_ERR_INFO_ESCAPE_0_PLUS2_CNT,
1691 CNTR_SYNTH),
1692[C_DC_REINIT_FROM_PEER_CNT] =
1693 DC_PERF_CNTR_LCB(DcReinitPeer, DC_LCB_ERR_INFO_REINIT_FROM_PEER_CNT,
1694 CNTR_SYNTH),
1695[C_DC_SBE_CNT] = DC_PERF_CNTR_LCB(DcSbe, DC_LCB_ERR_INFO_SBE_CNT,
1696 CNTR_SYNTH),
1697[C_DC_MISC_FLG_CNT] =
1698 DC_PERF_CNTR_LCB(DcMiscFlg, DC_LCB_ERR_INFO_MISC_FLG_CNT,
1699 CNTR_SYNTH),
1700[C_DC_PRF_GOOD_LTP_CNT] =
1701 DC_PERF_CNTR_LCB(DcGoodLTP, DC_LCB_PRF_GOOD_LTP_CNT, CNTR_SYNTH),
1702[C_DC_PRF_ACCEPTED_LTP_CNT] =
1703 DC_PERF_CNTR_LCB(DcAccLTP, DC_LCB_PRF_ACCEPTED_LTP_CNT,
1704 CNTR_SYNTH),
1705[C_DC_PRF_RX_FLIT_CNT] =
1706 DC_PERF_CNTR_LCB(DcPrfRxFlit, DC_LCB_PRF_RX_FLIT_CNT, CNTR_SYNTH),
1707[C_DC_PRF_TX_FLIT_CNT] =
1708 DC_PERF_CNTR_LCB(DcPrfTxFlit, DC_LCB_PRF_TX_FLIT_CNT, CNTR_SYNTH),
1709[C_DC_PRF_CLK_CNTR] =
1710 DC_PERF_CNTR_LCB(DcPrfClk, DC_LCB_PRF_CLK_CNTR, CNTR_SYNTH),
1711[C_DC_PG_DBG_FLIT_CRDTS_CNT] =
1712 DC_PERF_CNTR_LCB(DcFltCrdts, DC_LCB_PG_DBG_FLIT_CRDTS_CNT, CNTR_SYNTH),
1713[C_DC_PG_STS_PAUSE_COMPLETE_CNT] =
1714 DC_PERF_CNTR_LCB(DcPauseComp, DC_LCB_PG_STS_PAUSE_COMPLETE_CNT,
1715 CNTR_SYNTH),
1716[C_DC_PG_STS_TX_SBE_CNT] =
1717 DC_PERF_CNTR_LCB(DcStsTxSbe, DC_LCB_PG_STS_TX_SBE_CNT, CNTR_SYNTH),
1718[C_DC_PG_STS_TX_MBE_CNT] =
1719 DC_PERF_CNTR_LCB(DcStsTxMbe, DC_LCB_PG_STS_TX_MBE_CNT,
1720 CNTR_SYNTH),
1721[C_SW_CPU_INTR] = CNTR_ELEM("Intr", 0, 0, CNTR_NORMAL,
1722 access_sw_cpu_intr),
1723[C_SW_CPU_RCV_LIM] = CNTR_ELEM("RcvLimit", 0, 0, CNTR_NORMAL,
1724 access_sw_cpu_rcv_limit),
1725[C_SW_VTX_WAIT] = CNTR_ELEM("vTxWait", 0, 0, CNTR_NORMAL,
1726 access_sw_vtx_wait),
1727[C_SW_PIO_WAIT] = CNTR_ELEM("PioWait", 0, 0, CNTR_NORMAL,
1728 access_sw_pio_wait),
1729[C_SW_KMEM_WAIT] = CNTR_ELEM("KmemWait", 0, 0, CNTR_NORMAL,
1730 access_sw_kmem_wait),
1731[C_SW_SEND_SCHED] = CNTR_ELEM("SendSched", 0, 0, CNTR_NORMAL,
1732 access_sw_send_schedule),
1733};
1734
1735static struct cntr_entry port_cntrs[PORT_CNTR_LAST] = {
1736[C_TX_UNSUP_VL] = TXE32_PORT_CNTR_ELEM(TxUnVLErr, SEND_UNSUP_VL_ERR_CNT,
1737 CNTR_NORMAL),
1738[C_TX_INVAL_LEN] = TXE32_PORT_CNTR_ELEM(TxInvalLen, SEND_LEN_ERR_CNT,
1739 CNTR_NORMAL),
1740[C_TX_MM_LEN_ERR] = TXE32_PORT_CNTR_ELEM(TxMMLenErr, SEND_MAX_MIN_LEN_ERR_CNT,
1741 CNTR_NORMAL),
1742[C_TX_UNDERRUN] = TXE32_PORT_CNTR_ELEM(TxUnderrun, SEND_UNDERRUN_CNT,
1743 CNTR_NORMAL),
1744[C_TX_FLOW_STALL] = TXE32_PORT_CNTR_ELEM(TxFlowStall, SEND_FLOW_STALL_CNT,
1745 CNTR_NORMAL),
1746[C_TX_DROPPED] = TXE32_PORT_CNTR_ELEM(TxDropped, SEND_DROPPED_PKT_CNT,
1747 CNTR_NORMAL),
1748[C_TX_HDR_ERR] = TXE32_PORT_CNTR_ELEM(TxHdrErr, SEND_HEADERS_ERR_CNT,
1749 CNTR_NORMAL),
1750[C_TX_PKT] = TXE64_PORT_CNTR_ELEM(TxPkt, SEND_DATA_PKT_CNT, CNTR_NORMAL),
1751[C_TX_WORDS] = TXE64_PORT_CNTR_ELEM(TxWords, SEND_DWORD_CNT, CNTR_NORMAL),
1752[C_TX_WAIT] = TXE64_PORT_CNTR_ELEM(TxWait, SEND_WAIT_CNT, CNTR_SYNTH),
1753[C_TX_FLIT_VL] = TXE64_PORT_CNTR_ELEM(TxFlitVL, SEND_DATA_VL0_CNT,
1754 CNTR_SYNTH | CNTR_VL),
1755[C_TX_PKT_VL] = TXE64_PORT_CNTR_ELEM(TxPktVL, SEND_DATA_PKT_VL0_CNT,
1756 CNTR_SYNTH | CNTR_VL),
1757[C_TX_WAIT_VL] = TXE64_PORT_CNTR_ELEM(TxWaitVL, SEND_WAIT_VL0_CNT,
1758 CNTR_SYNTH | CNTR_VL),
1759[C_RX_PKT] = RXE64_PORT_CNTR_ELEM(RxPkt, RCV_DATA_PKT_CNT, CNTR_NORMAL),
1760[C_RX_WORDS] = RXE64_PORT_CNTR_ELEM(RxWords, RCV_DWORD_CNT, CNTR_NORMAL),
1761[C_SW_LINK_DOWN] = CNTR_ELEM("SwLinkDown", 0, 0, CNTR_SYNTH | CNTR_32BIT,
1762 access_sw_link_dn_cnt),
1763[C_SW_LINK_UP] = CNTR_ELEM("SwLinkUp", 0, 0, CNTR_SYNTH | CNTR_32BIT,
1764 access_sw_link_up_cnt),
1765[C_SW_XMIT_DSCD] = CNTR_ELEM("XmitDscd", 0, 0, CNTR_SYNTH | CNTR_32BIT,
1766 access_sw_xmit_discards),
1767[C_SW_XMIT_DSCD_VL] = CNTR_ELEM("XmitDscdVl", 0, 0,
1768 CNTR_SYNTH | CNTR_32BIT | CNTR_VL,
1769 access_sw_xmit_discards),
1770[C_SW_XMIT_CSTR_ERR] = CNTR_ELEM("XmitCstrErr", 0, 0, CNTR_SYNTH,
1771 access_xmit_constraint_errs),
1772[C_SW_RCV_CSTR_ERR] = CNTR_ELEM("RcvCstrErr", 0, 0, CNTR_SYNTH,
1773 access_rcv_constraint_errs),
1774[C_SW_IBP_LOOP_PKTS] = SW_IBP_CNTR(LoopPkts, loop_pkts),
1775[C_SW_IBP_RC_RESENDS] = SW_IBP_CNTR(RcResend, rc_resends),
1776[C_SW_IBP_RNR_NAKS] = SW_IBP_CNTR(RnrNak, rnr_naks),
1777[C_SW_IBP_OTHER_NAKS] = SW_IBP_CNTR(OtherNak, other_naks),
1778[C_SW_IBP_RC_TIMEOUTS] = SW_IBP_CNTR(RcTimeOut, rc_timeouts),
1779[C_SW_IBP_PKT_DROPS] = SW_IBP_CNTR(PktDrop, pkt_drops),
1780[C_SW_IBP_DMA_WAIT] = SW_IBP_CNTR(DmaWait, dmawait),
1781[C_SW_IBP_RC_SEQNAK] = SW_IBP_CNTR(RcSeqNak, rc_seqnak),
1782[C_SW_IBP_RC_DUPREQ] = SW_IBP_CNTR(RcDupRew, rc_dupreq),
1783[C_SW_IBP_RDMA_SEQ] = SW_IBP_CNTR(RdmaSeq, rdma_seq),
1784[C_SW_IBP_UNALIGNED] = SW_IBP_CNTR(Unaligned, unaligned),
1785[C_SW_IBP_SEQ_NAK] = SW_IBP_CNTR(SeqNak, seq_naks),
1786[C_SW_CPU_RC_ACKS] = CNTR_ELEM("RcAcks", 0, 0, CNTR_NORMAL,
1787 access_sw_cpu_rc_acks),
1788[C_SW_CPU_RC_QACKS] = CNTR_ELEM("RcQacks", 0, 0, CNTR_NORMAL,
1789 access_sw_cpu_rc_qacks),
1790[C_SW_CPU_RC_DELAYED_COMP] = CNTR_ELEM("RcDelayComp", 0, 0, CNTR_NORMAL,
1791 access_sw_cpu_rc_delayed_comp),
1792[OVR_LBL(0)] = OVR_ELM(0), [OVR_LBL(1)] = OVR_ELM(1),
1793[OVR_LBL(2)] = OVR_ELM(2), [OVR_LBL(3)] = OVR_ELM(3),
1794[OVR_LBL(4)] = OVR_ELM(4), [OVR_LBL(5)] = OVR_ELM(5),
1795[OVR_LBL(6)] = OVR_ELM(6), [OVR_LBL(7)] = OVR_ELM(7),
1796[OVR_LBL(8)] = OVR_ELM(8), [OVR_LBL(9)] = OVR_ELM(9),
1797[OVR_LBL(10)] = OVR_ELM(10), [OVR_LBL(11)] = OVR_ELM(11),
1798[OVR_LBL(12)] = OVR_ELM(12), [OVR_LBL(13)] = OVR_ELM(13),
1799[OVR_LBL(14)] = OVR_ELM(14), [OVR_LBL(15)] = OVR_ELM(15),
1800[OVR_LBL(16)] = OVR_ELM(16), [OVR_LBL(17)] = OVR_ELM(17),
1801[OVR_LBL(18)] = OVR_ELM(18), [OVR_LBL(19)] = OVR_ELM(19),
1802[OVR_LBL(20)] = OVR_ELM(20), [OVR_LBL(21)] = OVR_ELM(21),
1803[OVR_LBL(22)] = OVR_ELM(22), [OVR_LBL(23)] = OVR_ELM(23),
1804[OVR_LBL(24)] = OVR_ELM(24), [OVR_LBL(25)] = OVR_ELM(25),
1805[OVR_LBL(26)] = OVR_ELM(26), [OVR_LBL(27)] = OVR_ELM(27),
1806[OVR_LBL(28)] = OVR_ELM(28), [OVR_LBL(29)] = OVR_ELM(29),
1807[OVR_LBL(30)] = OVR_ELM(30), [OVR_LBL(31)] = OVR_ELM(31),
1808[OVR_LBL(32)] = OVR_ELM(32), [OVR_LBL(33)] = OVR_ELM(33),
1809[OVR_LBL(34)] = OVR_ELM(34), [OVR_LBL(35)] = OVR_ELM(35),
1810[OVR_LBL(36)] = OVR_ELM(36), [OVR_LBL(37)] = OVR_ELM(37),
1811[OVR_LBL(38)] = OVR_ELM(38), [OVR_LBL(39)] = OVR_ELM(39),
1812[OVR_LBL(40)] = OVR_ELM(40), [OVR_LBL(41)] = OVR_ELM(41),
1813[OVR_LBL(42)] = OVR_ELM(42), [OVR_LBL(43)] = OVR_ELM(43),
1814[OVR_LBL(44)] = OVR_ELM(44), [OVR_LBL(45)] = OVR_ELM(45),
1815[OVR_LBL(46)] = OVR_ELM(46), [OVR_LBL(47)] = OVR_ELM(47),
1816[OVR_LBL(48)] = OVR_ELM(48), [OVR_LBL(49)] = OVR_ELM(49),
1817[OVR_LBL(50)] = OVR_ELM(50), [OVR_LBL(51)] = OVR_ELM(51),
1818[OVR_LBL(52)] = OVR_ELM(52), [OVR_LBL(53)] = OVR_ELM(53),
1819[OVR_LBL(54)] = OVR_ELM(54), [OVR_LBL(55)] = OVR_ELM(55),
1820[OVR_LBL(56)] = OVR_ELM(56), [OVR_LBL(57)] = OVR_ELM(57),
1821[OVR_LBL(58)] = OVR_ELM(58), [OVR_LBL(59)] = OVR_ELM(59),
1822[OVR_LBL(60)] = OVR_ELM(60), [OVR_LBL(61)] = OVR_ELM(61),
1823[OVR_LBL(62)] = OVR_ELM(62), [OVR_LBL(63)] = OVR_ELM(63),
1824[OVR_LBL(64)] = OVR_ELM(64), [OVR_LBL(65)] = OVR_ELM(65),
1825[OVR_LBL(66)] = OVR_ELM(66), [OVR_LBL(67)] = OVR_ELM(67),
1826[OVR_LBL(68)] = OVR_ELM(68), [OVR_LBL(69)] = OVR_ELM(69),
1827[OVR_LBL(70)] = OVR_ELM(70), [OVR_LBL(71)] = OVR_ELM(71),
1828[OVR_LBL(72)] = OVR_ELM(72), [OVR_LBL(73)] = OVR_ELM(73),
1829[OVR_LBL(74)] = OVR_ELM(74), [OVR_LBL(75)] = OVR_ELM(75),
1830[OVR_LBL(76)] = OVR_ELM(76), [OVR_LBL(77)] = OVR_ELM(77),
1831[OVR_LBL(78)] = OVR_ELM(78), [OVR_LBL(79)] = OVR_ELM(79),
1832[OVR_LBL(80)] = OVR_ELM(80), [OVR_LBL(81)] = OVR_ELM(81),
1833[OVR_LBL(82)] = OVR_ELM(82), [OVR_LBL(83)] = OVR_ELM(83),
1834[OVR_LBL(84)] = OVR_ELM(84), [OVR_LBL(85)] = OVR_ELM(85),
1835[OVR_LBL(86)] = OVR_ELM(86), [OVR_LBL(87)] = OVR_ELM(87),
1836[OVR_LBL(88)] = OVR_ELM(88), [OVR_LBL(89)] = OVR_ELM(89),
1837[OVR_LBL(90)] = OVR_ELM(90), [OVR_LBL(91)] = OVR_ELM(91),
1838[OVR_LBL(92)] = OVR_ELM(92), [OVR_LBL(93)] = OVR_ELM(93),
1839[OVR_LBL(94)] = OVR_ELM(94), [OVR_LBL(95)] = OVR_ELM(95),
1840[OVR_LBL(96)] = OVR_ELM(96), [OVR_LBL(97)] = OVR_ELM(97),
1841[OVR_LBL(98)] = OVR_ELM(98), [OVR_LBL(99)] = OVR_ELM(99),
1842[OVR_LBL(100)] = OVR_ELM(100), [OVR_LBL(101)] = OVR_ELM(101),
1843[OVR_LBL(102)] = OVR_ELM(102), [OVR_LBL(103)] = OVR_ELM(103),
1844[OVR_LBL(104)] = OVR_ELM(104), [OVR_LBL(105)] = OVR_ELM(105),
1845[OVR_LBL(106)] = OVR_ELM(106), [OVR_LBL(107)] = OVR_ELM(107),
1846[OVR_LBL(108)] = OVR_ELM(108), [OVR_LBL(109)] = OVR_ELM(109),
1847[OVR_LBL(110)] = OVR_ELM(110), [OVR_LBL(111)] = OVR_ELM(111),
1848[OVR_LBL(112)] = OVR_ELM(112), [OVR_LBL(113)] = OVR_ELM(113),
1849[OVR_LBL(114)] = OVR_ELM(114), [OVR_LBL(115)] = OVR_ELM(115),
1850[OVR_LBL(116)] = OVR_ELM(116), [OVR_LBL(117)] = OVR_ELM(117),
1851[OVR_LBL(118)] = OVR_ELM(118), [OVR_LBL(119)] = OVR_ELM(119),
1852[OVR_LBL(120)] = OVR_ELM(120), [OVR_LBL(121)] = OVR_ELM(121),
1853[OVR_LBL(122)] = OVR_ELM(122), [OVR_LBL(123)] = OVR_ELM(123),
1854[OVR_LBL(124)] = OVR_ELM(124), [OVR_LBL(125)] = OVR_ELM(125),
1855[OVR_LBL(126)] = OVR_ELM(126), [OVR_LBL(127)] = OVR_ELM(127),
1856[OVR_LBL(128)] = OVR_ELM(128), [OVR_LBL(129)] = OVR_ELM(129),
1857[OVR_LBL(130)] = OVR_ELM(130), [OVR_LBL(131)] = OVR_ELM(131),
1858[OVR_LBL(132)] = OVR_ELM(132), [OVR_LBL(133)] = OVR_ELM(133),
1859[OVR_LBL(134)] = OVR_ELM(134), [OVR_LBL(135)] = OVR_ELM(135),
1860[OVR_LBL(136)] = OVR_ELM(136), [OVR_LBL(137)] = OVR_ELM(137),
1861[OVR_LBL(138)] = OVR_ELM(138), [OVR_LBL(139)] = OVR_ELM(139),
1862[OVR_LBL(140)] = OVR_ELM(140), [OVR_LBL(141)] = OVR_ELM(141),
1863[OVR_LBL(142)] = OVR_ELM(142), [OVR_LBL(143)] = OVR_ELM(143),
1864[OVR_LBL(144)] = OVR_ELM(144), [OVR_LBL(145)] = OVR_ELM(145),
1865[OVR_LBL(146)] = OVR_ELM(146), [OVR_LBL(147)] = OVR_ELM(147),
1866[OVR_LBL(148)] = OVR_ELM(148), [OVR_LBL(149)] = OVR_ELM(149),
1867[OVR_LBL(150)] = OVR_ELM(150), [OVR_LBL(151)] = OVR_ELM(151),
1868[OVR_LBL(152)] = OVR_ELM(152), [OVR_LBL(153)] = OVR_ELM(153),
1869[OVR_LBL(154)] = OVR_ELM(154), [OVR_LBL(155)] = OVR_ELM(155),
1870[OVR_LBL(156)] = OVR_ELM(156), [OVR_LBL(157)] = OVR_ELM(157),
1871[OVR_LBL(158)] = OVR_ELM(158), [OVR_LBL(159)] = OVR_ELM(159),
1872};
1873
1874/* ======================================================================== */
1875
1876/* return true if this is chip revision a0 */
1877int is_a0(struct hfi1_devdata *dd)
1878{
1879 return ((dd->revision >> CCE_REVISION_CHIP_REV_MINOR_SHIFT)
1880 & CCE_REVISION_CHIP_REV_MINOR_MASK) == 0;
1881}
1882
1883/* return true if this is chip revision a (any A step) */
1884int is_ax(struct hfi1_devdata *dd)
1885{
1886 u8 chip_rev_minor =
1887 dd->revision >> CCE_REVISION_CHIP_REV_MINOR_SHIFT
1888 & CCE_REVISION_CHIP_REV_MINOR_MASK;
1889 return (chip_rev_minor & 0xf0) == 0;
1890}
1891
1892/* return true if this is chip revision b (any B step) */
1893int is_bx(struct hfi1_devdata *dd)
1894{
1895 u8 chip_rev_minor =
1896 dd->revision >> CCE_REVISION_CHIP_REV_MINOR_SHIFT
1897 & CCE_REVISION_CHIP_REV_MINOR_MASK;
1898 return !!(chip_rev_minor & 0x10);
1899}
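
/*
 * Read together, is_a0(), is_ax() and is_bx() treat ChipRevMinor as:
 * high nibble 0 means an A-step part (0x00 being A0), and bit 0x10 set
 * means a B-step part.
 */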
1900
1901/*
1902 * Append string s to buffer buf. Arguments curp and lenp point to the
1903 * current position and remaining length, respectively.
1904 *
1905 * return 0 on success, 1 on out of room
1906 */
1907static int append_str(char *buf, char **curp, int *lenp, const char *s)
1908{
1909 char *p = *curp;
1910 int len = *lenp;
1911 int result = 0; /* success */
1912 char c;
1913
1914 /* add a comma, if not first in the buffer */
1915 if (p != buf) {
1916 if (len == 0) {
1917 result = 1; /* out of room */
1918 goto done;
1919 }
1920 *p++ = ',';
1921 len--;
1922 }
1923
1924 /* copy the string */
1925 while ((c = *s++) != 0) {
1926 if (len == 0) {
1927 result = 1; /* out of room */
1928 goto done;
1929 }
1930 *p++ = c;
1931 len--;
1932 }
1933
1934done:
1935 /* write return values */
1936 *curp = p;
1937 *lenp = len;
1938
1939 return result;
1940}
1941
1942/*
1943 * Using the given flag table, print a comma separated string into
1944 * the buffer. End in '*' if the buffer is too short.
1945 */
1946static char *flag_string(char *buf, int buf_len, u64 flags,
1947 struct flag_table *table, int table_size)
1948{
1949 char extra[32];
1950 char *p = buf;
1951 int len = buf_len;
1952 int no_room = 0;
1953 int i;
1954
1955 /* make sure there are at least 2 bytes so we can form "*" */
1956 if (len < 2)
1957 return "";
1958
1959 len--; /* leave room for a nul */
1960 for (i = 0; i < table_size; i++) {
1961 if (flags & table[i].flag) {
1962 no_room = append_str(buf, &p, &len, table[i].str);
1963 if (no_room)
1964 break;
1965 flags &= ~table[i].flag;
1966 }
1967 }
1968
1969 /* any undocumented bits left? */
1970 if (!no_room && flags) {
1971 snprintf(extra, sizeof(extra), "bits 0x%llx", flags);
1972 no_room = append_str(buf, &p, &len, extra);
1973 }
1974
1975 /* add * if ran out of room */
1976 if (no_room) {
1977 /* may need to back up to add space for a '*' */
1978 if (len == 0)
1979 --p;
1980 *p++ = '*';
1981 }
1982
1983 /* add final nul - space already allocated above */
1984 *p = 0;
1985 return buf;
1986}
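
/*
 * Illustrative example with a hypothetical table: given entries for bit
 * 0x1 ("Foo") and bit 0x2 ("Bar"), flags 0x7 render as "Foo,Bar,bits 0x4";
 * a too-short buffer is terminated with '*'.
 */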
1987
1988/* first 8 CCE error interrupt source names */
1989static const char * const cce_misc_names[] = {
1990 "CceErrInt", /* 0 */
1991 "RxeErrInt", /* 1 */
1992 "MiscErrInt", /* 2 */
1993 "Reserved3", /* 3 */
1994 "PioErrInt", /* 4 */
1995 "SDmaErrInt", /* 5 */
1996 "EgressErrInt", /* 6 */
1997 "TxeErrInt" /* 7 */
1998};
1999
2000/*
2001 * Return the miscellaneous error interrupt name.
2002 */
2003static char *is_misc_err_name(char *buf, size_t bsize, unsigned int source)
2004{
2005 if (source < ARRAY_SIZE(cce_misc_names))
2006 strncpy(buf, cce_misc_names[source], bsize);
2007 else
2008 snprintf(buf,
2009 bsize,
2010 "Reserved%u",
2011 source + IS_GENERAL_ERR_START);
2012
2013 return buf;
2014}
2015
2016/*
2017 * Return the SDMA engine error interrupt name.
2018 */
2019static char *is_sdma_eng_err_name(char *buf, size_t bsize, unsigned int source)
2020{
2021 snprintf(buf, bsize, "SDmaEngErrInt%u", source);
2022 return buf;
2023}
2024
2025/*
2026 * Return the send context error interrupt name.
2027 */
2028static char *is_sendctxt_err_name(char *buf, size_t bsize, unsigned int source)
2029{
2030 snprintf(buf, bsize, "SendCtxtErrInt%u", source);
2031 return buf;
2032}
2033
2034static const char * const various_names[] = {
2035 "PbcInt",
2036 "GpioAssertInt",
2037 "Qsfp1Int",
2038 "Qsfp2Int",
2039 "TCritInt"
2040};
2041
2042/*
2043 * Return the various interrupt name.
2044 */
2045static char *is_various_name(char *buf, size_t bsize, unsigned int source)
2046{
2047 if (source < ARRAY_SIZE(various_names))
2048 strncpy(buf, various_names[source], bsize);
2049 else
2050 snprintf(buf, bsize, "Reserved%u", source+IS_VARIOUS_START);
2051 return buf;
2052}
2053
2054/*
2055 * Return the DC interrupt name.
2056 */
2057static char *is_dc_name(char *buf, size_t bsize, unsigned int source)
2058{
2059 static const char * const dc_int_names[] = {
2060 "common",
2061 "lcb",
2062 "8051",
2063 "lbm" /* local block merge */
2064 };
2065
2066 if (source < ARRAY_SIZE(dc_int_names))
2067 snprintf(buf, bsize, "dc_%s_int", dc_int_names[source]);
2068 else
2069 snprintf(buf, bsize, "DCInt%u", source);
2070 return buf;
2071}
2072
2073static const char * const sdma_int_names[] = {
2074 "SDmaInt",
2075 "SdmaIdleInt",
2076 "SdmaProgressInt",
2077};
2078
2079/*
2080 * Return the SDMA engine interrupt name.
2081 */
2082static char *is_sdma_eng_name(char *buf, size_t bsize, unsigned int source)
2083{
2084 /* what interrupt */
2085 unsigned int what = source / TXE_NUM_SDMA_ENGINES;
2086 /* which engine */
2087 unsigned int which = source % TXE_NUM_SDMA_ENGINES;
2088
2089 if (likely(what < 3))
2090 snprintf(buf, bsize, "%s%u", sdma_int_names[what], which);
2091 else
2092 snprintf(buf, bsize, "Invalid SDMA interrupt %u", source);
2093 return buf;
2094}
2095
2096/*
2097 * Return the receive available interrupt name.
2098 */
2099static char *is_rcv_avail_name(char *buf, size_t bsize, unsigned int source)
2100{
2101 snprintf(buf, bsize, "RcvAvailInt%u", source);
2102 return buf;
2103}
2104
2105/*
2106 * Return the receive urgent interrupt name.
2107 */
2108static char *is_rcv_urgent_name(char *buf, size_t bsize, unsigned int source)
2109{
2110 snprintf(buf, bsize, "RcvUrgentInt%u", source);
2111 return buf;
2112}
2113
2114/*
2115 * Return the send credit interrupt name.
2116 */
2117static char *is_send_credit_name(char *buf, size_t bsize, unsigned int source)
2118{
2119 snprintf(buf, bsize, "SendCreditInt%u", source);
2120 return buf;
2121}
2122
2123/*
2124 * Return the reserved interrupt name.
2125 */
2126static char *is_reserved_name(char *buf, size_t bsize, unsigned int source)
2127{
2128 snprintf(buf, bsize, "Reserved%u", source + IS_RESERVED_START);
2129 return buf;
2130}
2131
2132static char *cce_err_status_string(char *buf, int buf_len, u64 flags)
2133{
2134 return flag_string(buf, buf_len, flags,
2135 cce_err_status_flags, ARRAY_SIZE(cce_err_status_flags));
2136}
2137
2138static char *rxe_err_status_string(char *buf, int buf_len, u64 flags)
2139{
2140 return flag_string(buf, buf_len, flags,
2141 rxe_err_status_flags, ARRAY_SIZE(rxe_err_status_flags));
2142}
2143
2144static char *misc_err_status_string(char *buf, int buf_len, u64 flags)
2145{
2146 return flag_string(buf, buf_len, flags, misc_err_status_flags,
2147 ARRAY_SIZE(misc_err_status_flags));
2148}
2149
2150static char *pio_err_status_string(char *buf, int buf_len, u64 flags)
2151{
2152 return flag_string(buf, buf_len, flags,
2153 pio_err_status_flags, ARRAY_SIZE(pio_err_status_flags));
2154}
2155
2156static char *sdma_err_status_string(char *buf, int buf_len, u64 flags)
2157{
2158 return flag_string(buf, buf_len, flags,
2159 sdma_err_status_flags,
2160 ARRAY_SIZE(sdma_err_status_flags));
2161}
2162
2163static char *egress_err_status_string(char *buf, int buf_len, u64 flags)
2164{
2165 return flag_string(buf, buf_len, flags,
2166 egress_err_status_flags, ARRAY_SIZE(egress_err_status_flags));
2167}
2168
2169static char *egress_err_info_string(char *buf, int buf_len, u64 flags)
2170{
2171 return flag_string(buf, buf_len, flags,
2172 egress_err_info_flags, ARRAY_SIZE(egress_err_info_flags));
2173}
2174
2175static char *send_err_status_string(char *buf, int buf_len, u64 flags)
2176{
2177 return flag_string(buf, buf_len, flags,
2178 send_err_status_flags,
2179 ARRAY_SIZE(send_err_status_flags));
2180}
2181
2182static void handle_cce_err(struct hfi1_devdata *dd, u32 unused, u64 reg)
2183{
2184 char buf[96];
2185
2186 /*
2187 * For most of these errors, there is nothing that can be done except
2188 * report or record it.
2189 */
2190 dd_dev_info(dd, "CCE Error: %s\n",
2191 cce_err_status_string(buf, sizeof(buf), reg));
2192
2193 if ((reg & CCE_ERR_STATUS_CCE_CLI2_ASYNC_FIFO_PARITY_ERR_SMASK)
2194 && is_a0(dd)
2195 && (dd->icode != ICODE_FUNCTIONAL_SIMULATOR)) {
2196 /* this error requires a manual drop into SPC freeze mode */
2197 /* then a fix up */
2198 start_freeze_handling(dd->pport, FREEZE_SELF);
2199 }
2200}
2201
2202/*
2203 * Check counters for receive errors that do not have an interrupt
2204 * associated with them.
2205 */
2206#define RCVERR_CHECK_TIME 10
2207static void update_rcverr_timer(unsigned long opaque)
2208{
2209 struct hfi1_devdata *dd = (struct hfi1_devdata *)opaque;
2210 struct hfi1_pportdata *ppd = dd->pport;
2211 u32 cur_ovfl_cnt = read_dev_cntr(dd, C_RCV_OVF, CNTR_INVALID_VL);
2212
2213 if (dd->rcv_ovfl_cnt < cur_ovfl_cnt &&
2214 ppd->port_error_action & OPA_PI_MASK_EX_BUFFER_OVERRUN) {
2215 dd_dev_info(dd, "%s: PortErrorAction bounce\n", __func__);
2216 set_link_down_reason(ppd,
2217 OPA_LINKDOWN_REASON_EXCESSIVE_BUFFER_OVERRUN, 0,
2218 OPA_LINKDOWN_REASON_EXCESSIVE_BUFFER_OVERRUN);
2219 queue_work(ppd->hfi1_wq, &ppd->link_bounce_work);
2220 }
2221 dd->rcv_ovfl_cnt = (u32) cur_ovfl_cnt;
2222
2223 mod_timer(&dd->rcverr_timer, jiffies + HZ * RCVERR_CHECK_TIME);
2224}
2225
2226static int init_rcverr(struct hfi1_devdata *dd)
2227{
2228 setup_timer(&dd->rcverr_timer, update_rcverr_timer, (unsigned long)dd);
2229 /* Assume the hardware counter has been reset */
2230 dd->rcv_ovfl_cnt = 0;
2231 return mod_timer(&dd->rcverr_timer, jiffies + HZ * RCVERR_CHECK_TIME);
2232}
2233
2234static void free_rcverr(struct hfi1_devdata *dd)
2235{
2236 if (dd->rcverr_timer.data)
2237 del_timer_sync(&dd->rcverr_timer);
2238 dd->rcverr_timer.data = 0;
2239}
2240
2241static void handle_rxe_err(struct hfi1_devdata *dd, u32 unused, u64 reg)
2242{
2243 char buf[96];
2244
2245 dd_dev_info(dd, "Receive Error: %s\n",
2246 rxe_err_status_string(buf, sizeof(buf), reg));
2247
2248 if (reg & ALL_RXE_FREEZE_ERR) {
2249 int flags = 0;
2250
2251 /*
2252 * Freeze mode recovery is disabled for the errors
2253 * in RXE_FREEZE_ABORT_MASK
2254 */
2255 if (is_a0(dd) && (reg & RXE_FREEZE_ABORT_MASK))
2256 flags = FREEZE_ABORT;
2257
2258 start_freeze_handling(dd->pport, flags);
2259 }
2260}
2261
2262static void handle_misc_err(struct hfi1_devdata *dd, u32 unused, u64 reg)
2263{
2264 char buf[96];
2265
2266 dd_dev_info(dd, "Misc Error: %s",
2267 misc_err_status_string(buf, sizeof(buf), reg));
2268}
2269
2270static void handle_pio_err(struct hfi1_devdata *dd, u32 unused, u64 reg)
2271{
2272 char buf[96];
2273
2274 dd_dev_info(dd, "PIO Error: %s\n",
2275 pio_err_status_string(buf, sizeof(buf), reg));
2276
2277 if (reg & ALL_PIO_FREEZE_ERR)
2278 start_freeze_handling(dd->pport, 0);
2279}
2280
2281static void handle_sdma_err(struct hfi1_devdata *dd, u32 unused, u64 reg)
2282{
2283 char buf[96];
2284
2285 dd_dev_info(dd, "SDMA Error: %s\n",
2286 sdma_err_status_string(buf, sizeof(buf), reg));
2287
2288 if (reg & ALL_SDMA_FREEZE_ERR)
2289 start_freeze_handling(dd->pport, 0);
2290}
2291
2292static void count_port_inactive(struct hfi1_devdata *dd)
2293{
2294 struct hfi1_pportdata *ppd = dd->pport;
2295
2296 if (ppd->port_xmit_discards < ~(u64)0)
2297 ppd->port_xmit_discards++;
2298}
2299
2300/*
2301 * We have had a "disallowed packet" error during egress. Determine the
2302 * integrity check which failed, and update relevant error counter, etc.
2303 *
2304 * Note that the SEND_EGRESS_ERR_INFO register has only a single
2305 * bit of state per integrity check, and so we can miss the reason for an
2306 * egress error if more than one packet fails the same integrity check
2307 * since we cleared the corresponding bit in SEND_EGRESS_ERR_INFO.
2308 */
2309static void handle_send_egress_err_info(struct hfi1_devdata *dd)
2310{
2311 struct hfi1_pportdata *ppd = dd->pport;
2312 u64 src = read_csr(dd, SEND_EGRESS_ERR_SOURCE); /* read first */
2313 u64 info = read_csr(dd, SEND_EGRESS_ERR_INFO);
2314 char buf[96];
2315
2316 /* clear down all observed info as quickly as possible after read */
2317 write_csr(dd, SEND_EGRESS_ERR_INFO, info);
2318
2319 dd_dev_info(dd,
2320 "Egress Error Info: 0x%llx, %s Egress Error Src 0x%llx\n",
2321 info, egress_err_info_string(buf, sizeof(buf), info), src);
2322
2323 /* Eventually add other counters for each bit */
2324
2325 if (info & SEND_EGRESS_ERR_INFO_TOO_LONG_IB_PACKET_ERR_SMASK) {
2326 if (ppd->port_xmit_discards < ~(u64)0)
2327 ppd->port_xmit_discards++;
2328 }
2329}
2330
2331/*
2332 * Input value is a bit position within the SEND_EGRESS_ERR_STATUS
2333 * register. Does it represent a 'port inactive' error?
2334 */
2335static inline int port_inactive_err(u64 posn)
2336{
2337 return (posn >= SEES(TX_LINKDOWN) &&
2338 posn <= SEES(TX_INCORRECT_LINK_STATE));
2339}
2340
2341/*
2342 * Input value is a bit position within the SEND_EGRESS_ERR_STATUS
2343 * register. Does it represent a 'disallowed packet' error?
2344 */
2345static inline int disallowed_pkt_err(u64 posn)
2346{
2347 return (posn >= SEES(TX_SDMA0_DISALLOWED_PACKET) &&
2348 posn <= SEES(TX_SDMA15_DISALLOWED_PACKET));
2349}
2350
2351static void handle_egress_err(struct hfi1_devdata *dd, u32 unused, u64 reg)
2352{
2353 u64 reg_copy = reg, handled = 0;
2354 char buf[96];
2355
2356 if (reg & ALL_TXE_EGRESS_FREEZE_ERR)
2357 start_freeze_handling(dd->pport, 0);
2358 if (is_a0(dd) && (reg &
2359 SEND_EGRESS_ERR_STATUS_TX_CREDIT_RETURN_VL_ERR_SMASK)
2360 && (dd->icode != ICODE_FUNCTIONAL_SIMULATOR))
2361 start_freeze_handling(dd->pport, 0);
2362
2363 while (reg_copy) {
2364 int posn = fls64(reg_copy);
2365 /*
2366 * fls64() returns a 1-based offset, but we generally
2367 * want 0-based offsets.
2368 */
2369 int shift = posn - 1;
2370
2371 if (port_inactive_err(shift)) {
2372 count_port_inactive(dd);
2373 handled |= (1ULL << shift);
2374 } else if (disallowed_pkt_err(shift)) {
2375 handle_send_egress_err_info(dd);
2376 handled |= (1ULL << shift);
2377 }
2378 clear_bit(shift, (unsigned long *)&reg_copy);
2379 }
2380
2381 reg &= ~handled;
2382
2383 if (reg)
2384 dd_dev_info(dd, "Egress Error: %s\n",
2385 egress_err_status_string(buf, sizeof(buf), reg));
2386}
2387
2388static void handle_txe_err(struct hfi1_devdata *dd, u32 unused, u64 reg)
2389{
2390 char buf[96];
2391
2392 dd_dev_info(dd, "Send Error: %s\n",
2393 send_err_status_string(buf, sizeof(buf), reg));
2394
2395}
2396
2397/*
2398 * The maximum number of times the error clear down will loop before
2399 * blocking a repeating error. This value is arbitrary.
2400 */
2401#define MAX_CLEAR_COUNT 20
2402
2403/*
2404 * Clear and handle an error register. All error interrupts are funneled
2405 * through here to have a central location to correctly handle single-
2406 * or multi-shot errors.
2407 *
2408 * For non per-context registers, call this routine with a context value
2409 * of 0 so the per-context offset is zero.
2410 *
2411 * If the handler loops too many times, assume that something is wrong
2412 * and can't be fixed, so mask the error bits.
2413 */
2414static void interrupt_clear_down(struct hfi1_devdata *dd,
2415 u32 context,
2416 const struct err_reg_info *eri)
2417{
2418 u64 reg;
2419 u32 count;
2420
2421 /* read in a loop until no more errors are seen */
2422 count = 0;
2423 while (1) {
2424 reg = read_kctxt_csr(dd, context, eri->status);
2425 if (reg == 0)
2426 break;
2427 write_kctxt_csr(dd, context, eri->clear, reg);
2428 if (likely(eri->handler))
2429 eri->handler(dd, context, reg);
2430 count++;
2431 if (count > MAX_CLEAR_COUNT) {
2432 u64 mask;
2433
2434 dd_dev_err(dd, "Repeating %s bits 0x%llx - masking\n",
2435 eri->desc, reg);
2436 /*
2437 * Read-modify-write so any other masked bits
2438 * remain masked.
2439 */
2440 mask = read_kctxt_csr(dd, context, eri->mask);
2441 mask &= ~reg;
2442 write_kctxt_csr(dd, context, eri->mask, mask);
2443 break;
2444 }
2445 }
2446}
2447
2448/*
2449 * CCE block "misc" interrupt. Source is < 16.
2450 */
2451static void is_misc_err_int(struct hfi1_devdata *dd, unsigned int source)
2452{
2453 const struct err_reg_info *eri = &misc_errs[source];
2454
2455 if (eri->handler) {
2456 interrupt_clear_down(dd, 0, eri);
2457 } else {
2458 dd_dev_err(dd, "Unexpected misc interrupt (%u) - reserved\n",
2459 source);
2460 }
2461}
2462
2463static char *send_context_err_status_string(char *buf, int buf_len, u64 flags)
2464{
2465 return flag_string(buf, buf_len, flags,
2466 sc_err_status_flags, ARRAY_SIZE(sc_err_status_flags));
2467}
2468
2469/*
2470 * Send context error interrupt. Source (hw_context) is < 160.
2471 *
2472 * All send context errors cause the send context to halt. The normal
2473 * clear-down mechanism cannot be used because we cannot clear the
2474 * error bits until several other long-running items are done first.
2475 * This is OK because with the context halted, nothing else is going
2476 * to happen on it anyway.
2477 */
2478static void is_sendctxt_err_int(struct hfi1_devdata *dd,
2479 unsigned int hw_context)
2480{
2481 struct send_context_info *sci;
2482 struct send_context *sc;
2483 char flags[96];
2484 u64 status;
2485 u32 sw_index;
2486
2487 sw_index = dd->hw_to_sw[hw_context];
2488 if (sw_index >= dd->num_send_contexts) {
2489 dd_dev_err(dd,
2490 "out of range sw index %u for send context %u\n",
2491 sw_index, hw_context);
2492 return;
2493 }
2494 sci = &dd->send_contexts[sw_index];
2495 sc = sci->sc;
2496 if (!sc) {
2497 dd_dev_err(dd, "%s: context %u(%u): no sc?\n", __func__,
2498 sw_index, hw_context);
2499 return;
2500 }
2501
2502 /* tell the software that a halt has begun */
2503 sc_stop(sc, SCF_HALTED);
2504
2505 status = read_kctxt_csr(dd, hw_context, SEND_CTXT_ERR_STATUS);
2506
2507 dd_dev_info(dd, "Send Context %u(%u) Error: %s\n", sw_index, hw_context,
2508 send_context_err_status_string(flags, sizeof(flags), status));
2509
2510 if (status & SEND_CTXT_ERR_STATUS_PIO_DISALLOWED_PACKET_ERR_SMASK)
2511 handle_send_egress_err_info(dd);
2512
2513 /*
2514 * Automatically restart halted kernel contexts out of interrupt
2515 * context. User contexts must ask the driver to restart the context.
2516 */
2517 if (sc->type != SC_USER)
2518 queue_work(dd->pport->hfi1_wq, &sc->halt_work);
2519}
2520
2521static void handle_sdma_eng_err(struct hfi1_devdata *dd,
2522 unsigned int source, u64 status)
2523{
2524 struct sdma_engine *sde;
2525
2526 sde = &dd->per_sdma[source];
2527#ifdef CONFIG_SDMA_VERBOSITY
2528 dd_dev_err(sde->dd, "CONFIG SDMA(%u) %s:%d %s()\n", sde->this_idx,
2529 slashstrip(__FILE__), __LINE__, __func__);
2530 dd_dev_err(sde->dd, "CONFIG SDMA(%u) source: %u status 0x%llx\n",
2531 sde->this_idx, source, (unsigned long long)status);
2532#endif
2533 sdma_engine_error(sde, status);
2534}
2535
2536/*
2537 * CCE block SDMA error interrupt. Source is < 16.
2538 */
2539static void is_sdma_eng_err_int(struct hfi1_devdata *dd, unsigned int source)
2540{
2541#ifdef CONFIG_SDMA_VERBOSITY
2542 struct sdma_engine *sde = &dd->per_sdma[source];
2543
2544 dd_dev_err(dd, "CONFIG SDMA(%u) %s:%d %s()\n", sde->this_idx,
2545 slashstrip(__FILE__), __LINE__, __func__);
2546 dd_dev_err(dd, "CONFIG SDMA(%u) source: %u\n", sde->this_idx,
2547 source);
2548 sdma_dumpstate(sde);
2549#endif
2550 interrupt_clear_down(dd, source, &sdma_eng_err);
2551}
2552
2553/*
2554 * CCE block "various" interrupt. Source is < 8.
2555 */
2556static void is_various_int(struct hfi1_devdata *dd, unsigned int source)
2557{
2558 const struct err_reg_info *eri = &various_err[source];
2559
2560 /*
2561 * TCritInt cannot go through interrupt_clear_down()
2562 * because it is not a second tier interrupt. The handler
2563 * should be called directly.
2564 */
2565 if (source == TCRIT_INT_SOURCE)
2566 handle_temp_err(dd);
2567 else if (eri->handler)
2568 interrupt_clear_down(dd, 0, eri);
2569 else
2570 dd_dev_info(dd,
2571 "%s: Unimplemented/reserved interrupt %d\n",
2572 __func__, source);
2573}
2574
2575static void handle_qsfp_int(struct hfi1_devdata *dd, u32 src_ctx, u64 reg)
2576{
2577 /* source is always zero */
2578 struct hfi1_pportdata *ppd = dd->pport;
2579 unsigned long flags;
2580 u64 qsfp_int_mgmt = (u64)(QSFP_HFI0_INT_N | QSFP_HFI0_MODPRST_N);
2581
2582 if (reg & QSFP_HFI0_MODPRST_N) {
2583
2584 dd_dev_info(dd, "%s: ModPresent triggered QSFP interrupt\n",
2585 __func__);
2586
2587 if (!qsfp_mod_present(ppd)) {
2588 ppd->driver_link_ready = 0;
2589 /*
2590 * Cable removed, reset all our information about the
2591 * cache and cable capabilities
2592 */
2593
2594 spin_lock_irqsave(&ppd->qsfp_info.qsfp_lock, flags);
2595 /*
2596 * We don't set cache_refresh_required here as we expect
2597 * an interrupt when a cable is inserted
2598 */
2599 ppd->qsfp_info.cache_valid = 0;
2600 ppd->qsfp_info.qsfp_interrupt_functional = 0;
2601 spin_unlock_irqrestore(&ppd->qsfp_info.qsfp_lock,
2602 flags);
2603 write_csr(dd,
2604 dd->hfi1_id ?
2605 ASIC_QSFP2_INVERT :
2606 ASIC_QSFP1_INVERT,
2607 qsfp_int_mgmt);
2608 if (ppd->host_link_state == HLS_DN_POLL) {
2609 /*
2610 * The link is still in POLL. This means
2611 * that the normal link down processing
2612 * will not happen. We have to do it here
2613 * before turning the DC off.
2614 */
2615 queue_work(ppd->hfi1_wq, &ppd->link_down_work);
2616 }
2617 } else {
2618 spin_lock_irqsave(&ppd->qsfp_info.qsfp_lock, flags);
2619 ppd->qsfp_info.cache_valid = 0;
2620 ppd->qsfp_info.cache_refresh_required = 1;
2621 spin_unlock_irqrestore(&ppd->qsfp_info.qsfp_lock,
2622 flags);
2623
2624 qsfp_int_mgmt &= ~(u64)QSFP_HFI0_MODPRST_N;
2625 write_csr(dd,
2626 dd->hfi1_id ?
2627 ASIC_QSFP2_INVERT :
2628 ASIC_QSFP1_INVERT,
2629 qsfp_int_mgmt);
2630 }
2631 }
2632
2633 if (reg & QSFP_HFI0_INT_N) {
2634
2635 dd_dev_info(dd, "%s: IntN triggered QSFP interrupt\n",
2636 __func__);
2637 spin_lock_irqsave(&ppd->qsfp_info.qsfp_lock, flags);
2638 ppd->qsfp_info.check_interrupt_flags = 1;
2639 ppd->qsfp_info.qsfp_interrupt_functional = 1;
2640 spin_unlock_irqrestore(&ppd->qsfp_info.qsfp_lock, flags);
2641 }
2642
2643 /* Schedule the QSFP work only if there is a cable attached. */
2644 if (qsfp_mod_present(ppd))
2645 queue_work(ppd->hfi1_wq, &ppd->qsfp_info.qsfp_work);
2646}
2647
2648static int request_host_lcb_access(struct hfi1_devdata *dd)
2649{
2650 int ret;
2651
2652 ret = do_8051_command(dd, HCMD_MISC,
2653 (u64)HCMD_MISC_REQUEST_LCB_ACCESS << LOAD_DATA_FIELD_ID_SHIFT,
2654 NULL);
2655 if (ret != HCMD_SUCCESS) {
2656 dd_dev_err(dd, "%s: command failed with error %d\n",
2657 __func__, ret);
2658 }
2659 return ret == HCMD_SUCCESS ? 0 : -EBUSY;
2660}
2661
2662static int request_8051_lcb_access(struct hfi1_devdata *dd)
2663{
2664 int ret;
2665
2666 ret = do_8051_command(dd, HCMD_MISC,
2667 (u64)HCMD_MISC_GRANT_LCB_ACCESS << LOAD_DATA_FIELD_ID_SHIFT,
2668 NULL);
2669 if (ret != HCMD_SUCCESS) {
2670 dd_dev_err(dd, "%s: command failed with error %d\n",
2671 __func__, ret);
2672 }
2673 return ret == HCMD_SUCCESS ? 0 : -EBUSY;
2674}
2675
2676/*
2677 * Set the LCB selector - allow host access. The DCC selector always
2678 * points to the host.
2679 */
2680static inline void set_host_lcb_access(struct hfi1_devdata *dd)
2681{
2682 write_csr(dd, DC_DC8051_CFG_CSR_ACCESS_SEL,
2683 DC_DC8051_CFG_CSR_ACCESS_SEL_DCC_SMASK
2684 | DC_DC8051_CFG_CSR_ACCESS_SEL_LCB_SMASK);
2685}
2686
2687/*
2688 * Clear the LCB selector - allow 8051 access. The DCC selector always
2689 * points to the host.
2690 */
2691static inline void set_8051_lcb_access(struct hfi1_devdata *dd)
2692{
2693 write_csr(dd, DC_DC8051_CFG_CSR_ACCESS_SEL,
2694 DC_DC8051_CFG_CSR_ACCESS_SEL_DCC_SMASK);
2695}
2696
2697/*
2698 * Acquire LCB access from the 8051. If the host already has access,
2699 * just increment a counter. Otherwise, inform the 8051 that the
2700 * host is taking access.
2701 *
2702 * Returns:
2703 * 0 on success
2704 * -EBUSY if the 8051 has control and cannot be disturbed
2705 * -errno if unable to acquire access from the 8051
2706 */
2707int acquire_lcb_access(struct hfi1_devdata *dd, int sleep_ok)
2708{
2709 struct hfi1_pportdata *ppd = dd->pport;
2710 int ret = 0;
2711
2712 /*
2713 * Use the host link state lock so the operation of this routine
2714 * { link state check, selector change, count increment } can occur
2715 * as a unit against a link state change. Otherwise there is a
2716 * race between the state change and the count increment.
2717 */
2718 if (sleep_ok) {
2719 mutex_lock(&ppd->hls_lock);
2720 } else {
2721 while (!mutex_trylock(&ppd->hls_lock))
2722 udelay(1);
2723 }
2724
2725 /* this access is valid only when the link is up */
2726 if ((ppd->host_link_state & HLS_UP) == 0) {
2727 dd_dev_info(dd, "%s: link state %s not up\n",
2728 __func__, link_state_name(ppd->host_link_state));
2729 ret = -EBUSY;
2730 goto done;
2731 }
2732
2733 if (dd->lcb_access_count == 0) {
2734 ret = request_host_lcb_access(dd);
2735 if (ret) {
2736 dd_dev_err(dd,
2737 "%s: unable to acquire LCB access, err %d\n",
2738 __func__, ret);
2739 goto done;
2740 }
2741 set_host_lcb_access(dd);
2742 }
2743 dd->lcb_access_count++;
2744done:
2745 mutex_unlock(&ppd->hls_lock);
2746 return ret;
2747}
2748
2749/*
2750 * Release LCB access by decrementing the use count. If the count is moving
2751 * from 1 to 0, inform the 8051 that it has control back.
2752 *
2753 * Returns:
2754 * 0 on success
2755 * -errno if unable to release access to the 8051
2756 */
2757int release_lcb_access(struct hfi1_devdata *dd, int sleep_ok)
2758{
2759 int ret = 0;
2760
2761 /*
2762 * Use the host link state lock because the acquire needed it.
2763 * Here, we only need to keep { selector change, count decrement }
2764 * as a unit.
2765 */
2766 if (sleep_ok) {
2767 mutex_lock(&dd->pport->hls_lock);
2768 } else {
2769 while (!mutex_trylock(&dd->pport->hls_lock))
2770 udelay(1);
2771 }
2772
2773 if (dd->lcb_access_count == 0) {
2774 dd_dev_err(dd, "%s: LCB access count is zero. Skipping.\n",
2775 __func__);
2776 goto done;
2777 }
2778
2779 if (dd->lcb_access_count == 1) {
2780 set_8051_lcb_access(dd);
2781 ret = request_8051_lcb_access(dd);
2782 if (ret) {
2783 dd_dev_err(dd,
2784 "%s: unable to release LCB access, err %d\n",
2785 __func__, ret);
2786 /* restore host access if the grant didn't work */
2787 set_host_lcb_access(dd);
2788 goto done;
2789 }
2790 }
2791 dd->lcb_access_count--;
2792done:
2793 mutex_unlock(&dd->pport->hls_lock);
2794 return ret;
2795}
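
/*
 * Illustrative usage (not taken from a caller in this file): read an LCB
 * CSR from process context while the link is up.
 *
 *	if (acquire_lcb_access(dd, 1) == 0) {
 *		u64 val = read_csr(dd, DC_LCB_ERR_EN);
 *		...
 *		release_lcb_access(dd, 1);
 *	}
 */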
2796
2797/*
2798 * Initialize LCB access variables and state. Called during driver load,
2799 * after most of the initialization is finished.
2800 *
2801 * The DC default is LCB access on for the host. The driver defaults to
2802 * leaving access to the 8051. Assign access now - this constrains the call
2803 * to this routine to be after all LCB set-up is done. In particular, after
2804 * hfi1_init_dd() -> set_up_interrupts() -> clear_all_interrupts()
2805 */
2806static void init_lcb_access(struct hfi1_devdata *dd)
2807{
2808 dd->lcb_access_count = 0;
2809}
2810
2811/*
2812 * Write a response back to an 8051 request.
2813 */
2814static void hreq_response(struct hfi1_devdata *dd, u8 return_code, u16 rsp_data)
2815{
2816 write_csr(dd, DC_DC8051_CFG_EXT_DEV_0,
2817 DC_DC8051_CFG_EXT_DEV_0_COMPLETED_SMASK
2818 | (u64)return_code << DC_DC8051_CFG_EXT_DEV_0_RETURN_CODE_SHIFT
2819 | (u64)rsp_data << DC_DC8051_CFG_EXT_DEV_0_RSP_DATA_SHIFT);
2820}
2821
2822/*
2823 * Handle requests from the 8051.
2824 */
2825static void handle_8051_request(struct hfi1_devdata *dd)
2826{
2827 u64 reg;
2828 u16 data;
2829 u8 type;
2830
2831 reg = read_csr(dd, DC_DC8051_CFG_EXT_DEV_1);
2832 if ((reg & DC_DC8051_CFG_EXT_DEV_1_REQ_NEW_SMASK) == 0)
2833 return; /* no request */
2834
2835 /* zero out COMPLETED so the response is seen */
2836 write_csr(dd, DC_DC8051_CFG_EXT_DEV_0, 0);
2837
2838 /* extract request details */
2839 type = (reg >> DC_DC8051_CFG_EXT_DEV_1_REQ_TYPE_SHIFT)
2840 & DC_DC8051_CFG_EXT_DEV_1_REQ_TYPE_MASK;
2841 data = (reg >> DC_DC8051_CFG_EXT_DEV_1_REQ_DATA_SHIFT)
2842 & DC_DC8051_CFG_EXT_DEV_1_REQ_DATA_MASK;
2843
2844 switch (type) {
2845 case HREQ_LOAD_CONFIG:
2846 case HREQ_SAVE_CONFIG:
2847 case HREQ_READ_CONFIG:
2848 case HREQ_SET_TX_EQ_ABS:
2849 case HREQ_SET_TX_EQ_REL:
2850 case HREQ_ENABLE:
2851 dd_dev_info(dd, "8051 request: request 0x%x not supported\n",
2852 type);
2853 hreq_response(dd, HREQ_NOT_SUPPORTED, 0);
2854 break;
2855
2856 case HREQ_CONFIG_DONE:
2857 hreq_response(dd, HREQ_SUCCESS, 0);
2858 break;
2859
2860 case HREQ_INTERFACE_TEST:
2861 hreq_response(dd, HREQ_SUCCESS, data);
2862 break;
2863
2864 default:
2865 dd_dev_err(dd, "8051 request: unknown request 0x%x\n", type);
2866 hreq_response(dd, HREQ_NOT_SUPPORTED, 0);
2867 break;
2868 }
2869}
2870
2871static void write_global_credit(struct hfi1_devdata *dd,
2872 u8 vau, u16 total, u16 shared)
2873{
2874 write_csr(dd, SEND_CM_GLOBAL_CREDIT,
2875 ((u64)total
2876 << SEND_CM_GLOBAL_CREDIT_TOTAL_CREDIT_LIMIT_SHIFT)
2877 | ((u64)shared
2878 << SEND_CM_GLOBAL_CREDIT_SHARED_LIMIT_SHIFT)
2879 | ((u64)vau << SEND_CM_GLOBAL_CREDIT_AU_SHIFT));
2880}
2881
2882/*
2883 * Set up initial VL15 credits of the remote. Assumes the rest of
2884 * the CM credit registers are zero from a previous global or credit reset.
2885 */
2886void set_up_vl15(struct hfi1_devdata *dd, u8 vau, u16 vl15buf)
2887{
2888 /* leave shared count at zero for both global and VL15 */
2889 write_global_credit(dd, vau, vl15buf, 0);
2890
2891 /* We may need some credits for another VL when sending packets
2892 * with the snoop interface. Dividing it down the middle for VL15
2893 * and VL0 should suffice.
2894 */
2895 if (unlikely(dd->hfi1_snoop.mode_flag == HFI1_PORT_SNOOP_MODE)) {
2896 write_csr(dd, SEND_CM_CREDIT_VL15, (u64)(vl15buf >> 1)
2897 << SEND_CM_CREDIT_VL15_DEDICATED_LIMIT_VL_SHIFT);
2898 write_csr(dd, SEND_CM_CREDIT_VL, (u64)(vl15buf >> 1)
2899 << SEND_CM_CREDIT_VL_DEDICATED_LIMIT_VL_SHIFT);
2900 } else {
2901 write_csr(dd, SEND_CM_CREDIT_VL15, (u64)vl15buf
2902 << SEND_CM_CREDIT_VL15_DEDICATED_LIMIT_VL_SHIFT);
2903 }
2904}
2905
2906/*
2907 * Zero all credit details from the previous connection and
2908 * reset the CM manager's internal counters.
2909 */
2910void reset_link_credits(struct hfi1_devdata *dd)
2911{
2912 int i;
2913
2914 /* remove all previous VL credit limits */
2915 for (i = 0; i < TXE_NUM_DATA_VL; i++)
2916 write_csr(dd, SEND_CM_CREDIT_VL + (8*i), 0);
2917 write_csr(dd, SEND_CM_CREDIT_VL15, 0);
2918 write_global_credit(dd, 0, 0, 0);
2919 /* reset the CM block */
2920 pio_send_control(dd, PSC_CM_RESET);
2921}
2922
2923/* convert a vCU to a CU */
2924static u32 vcu_to_cu(u8 vcu)
2925{
2926 return 1 << vcu;
2927}
2928
2929/* convert a CU to a vCU */
2930static u8 cu_to_vcu(u32 cu)
2931{
2932 return ilog2(cu);
2933}
2934
2935/* convert a vAU to an AU */
2936static u32 vau_to_au(u8 vau)
2937{
2938 return 8 * (1 << vau);
2939}
2940
2941static void set_linkup_defaults(struct hfi1_pportdata *ppd)
2942{
2943 ppd->sm_trap_qp = 0x0;
2944 ppd->sa_qp = 0x1;
2945}
2946
2947/*
2948 * Graceful LCB shutdown. This leaves the LCB FIFOs in reset.
2949 */
2950static void lcb_shutdown(struct hfi1_devdata *dd, int abort)
2951{
2952 u64 reg;
2953
2954 /* clear lcb run: LCB_CFG_RUN.EN = 0 */
2955 write_csr(dd, DC_LCB_CFG_RUN, 0);
2956 /* set tx fifo reset: LCB_CFG_TX_FIFOS_RESET.VAL = 1 */
2957 write_csr(dd, DC_LCB_CFG_TX_FIFOS_RESET,
2958 1ull << DC_LCB_CFG_TX_FIFOS_RESET_VAL_SHIFT);
2959 /* set dcc reset csr: DCC_CFG_RESET.{reset_lcb,reset_rx_fpe} = 1 */
2960 dd->lcb_err_en = read_csr(dd, DC_LCB_ERR_EN);
2961 reg = read_csr(dd, DCC_CFG_RESET);
2962 write_csr(dd, DCC_CFG_RESET,
2963 reg
2964 | (1ull << DCC_CFG_RESET_RESET_LCB_SHIFT)
2965 | (1ull << DCC_CFG_RESET_RESET_RX_FPE_SHIFT));
2966 (void) read_csr(dd, DCC_CFG_RESET); /* make sure the write completed */
2967 if (!abort) {
2968 udelay(1); /* must hold for the longer of 16cclks or 20ns */
2969 write_csr(dd, DCC_CFG_RESET, reg);
2970 write_csr(dd, DC_LCB_ERR_EN, dd->lcb_err_en);
2971 }
2972}
2973
2974/*
2975 * This routine should be called after the link has been transitioned to
2976 * OFFLINE (OFFLINE state has the side effect of putting the SerDes into
2977 * reset).
2978 *
2979 * The expectation is that the caller of this routine would have taken
2980 * care of properly transitioning the link into the correct state.
2981 */
2982static void dc_shutdown(struct hfi1_devdata *dd)
2983{
2984 unsigned long flags;
2985
2986 spin_lock_irqsave(&dd->dc8051_lock, flags);
2987 if (dd->dc_shutdown) {
2988 spin_unlock_irqrestore(&dd->dc8051_lock, flags);
2989 return;
2990 }
2991 dd->dc_shutdown = 1;
2992 spin_unlock_irqrestore(&dd->dc8051_lock, flags);
2993 /* Shutdown the LCB */
2994 lcb_shutdown(dd, 1);
2995 /* Going to OFFLINE would have caused the 8051 to put the
2996 * SerDes into reset already. Just need to shut down the 8051
2997 * itself. */
2998 write_csr(dd, DC_DC8051_CFG_RST, 0x1);
2999}
3000
3001/* Calling this after the DC has been brought out of reset should not
3002 * do any damage. */
3003static void dc_start(struct hfi1_devdata *dd)
3004{
3005 unsigned long flags;
3006 int ret;
3007
3008 spin_lock_irqsave(&dd->dc8051_lock, flags);
3009 if (!dd->dc_shutdown)
3010 goto done;
3011 spin_unlock_irqrestore(&dd->dc8051_lock, flags);
3012 /* Take the 8051 out of reset */
3013 write_csr(dd, DC_DC8051_CFG_RST, 0ull);
3014 /* Wait until 8051 is ready */
3015 ret = wait_fm_ready(dd, TIMEOUT_8051_START);
3016 if (ret) {
3017 dd_dev_err(dd, "%s: timeout starting 8051 firmware\n",
3018 __func__);
3019 }
3020 /* Take away reset for LCB and RX FPE (set in lcb_shutdown). */
3021 write_csr(dd, DCC_CFG_RESET, 0x10);
3022 /* lcb_shutdown() with abort=1 does not restore these */
3023 write_csr(dd, DC_LCB_ERR_EN, dd->lcb_err_en);
3024 spin_lock_irqsave(&dd->dc8051_lock, flags);
3025 dd->dc_shutdown = 0;
3026done:
3027 spin_unlock_irqrestore(&dd->dc8051_lock, flags);
3028}
3029
3030/*
3031 * These LCB adjustments are for the Aurora SerDes core in the FPGA.
3032 */
3033static void adjust_lcb_for_fpga_serdes(struct hfi1_devdata *dd)
3034{
3035 u64 rx_radr, tx_radr;
3036 u32 version;
3037
3038 if (dd->icode != ICODE_FPGA_EMULATION)
3039 return;
3040
3041 /*
3042 * These LCB defaults on emulator _s are good, nothing to do here:
3043 * LCB_CFG_TX_FIFOS_RADR
3044 * LCB_CFG_RX_FIFOS_RADR
3045 * LCB_CFG_LN_DCLK
3046 * LCB_CFG_IGNORE_LOST_RCLK
3047 */
3048 if (is_emulator_s(dd))
3049 return;
3050 /* else this is _p */
3051
3052 version = emulator_rev(dd);
3053 if (!is_a0(dd))
3054 version = 0x2d; /* all B0 use 0x2d or higher settings */
3055
3056 if (version <= 0x12) {
3057 /* release 0x12 and below */
3058
3059 /*
3060 * LCB_CFG_RX_FIFOS_RADR.RST_VAL = 0x9
3061 * LCB_CFG_RX_FIFOS_RADR.OK_TO_JUMP_VAL = 0x9
3062 * LCB_CFG_RX_FIFOS_RADR.DO_NOT_JUMP_VAL = 0xa
3063 */
3064 rx_radr =
3065 0xaull << DC_LCB_CFG_RX_FIFOS_RADR_DO_NOT_JUMP_VAL_SHIFT
3066 | 0x9ull << DC_LCB_CFG_RX_FIFOS_RADR_OK_TO_JUMP_VAL_SHIFT
3067 | 0x9ull << DC_LCB_CFG_RX_FIFOS_RADR_RST_VAL_SHIFT;
3068 /*
3069 * LCB_CFG_TX_FIFOS_RADR.ON_REINIT = 0 (default)
3070 * LCB_CFG_TX_FIFOS_RADR.RST_VAL = 6
3071 */
3072 tx_radr = 6ull << DC_LCB_CFG_TX_FIFOS_RADR_RST_VAL_SHIFT;
3073 } else if (version <= 0x18) {
3074 /* release 0x13 up to 0x18 */
3075 /* LCB_CFG_RX_FIFOS_RADR = 0x988 */
3076 rx_radr =
3077 0x9ull << DC_LCB_CFG_RX_FIFOS_RADR_DO_NOT_JUMP_VAL_SHIFT
3078 | 0x8ull << DC_LCB_CFG_RX_FIFOS_RADR_OK_TO_JUMP_VAL_SHIFT
3079 | 0x8ull << DC_LCB_CFG_RX_FIFOS_RADR_RST_VAL_SHIFT;
3080 tx_radr = 7ull << DC_LCB_CFG_TX_FIFOS_RADR_RST_VAL_SHIFT;
3081 } else if (version == 0x19) {
3082 /* release 0x19 */
3083 /* LCB_CFG_RX_FIFOS_RADR = 0xa99 */
3084 rx_radr =
3085 0xAull << DC_LCB_CFG_RX_FIFOS_RADR_DO_NOT_JUMP_VAL_SHIFT
3086 | 0x9ull << DC_LCB_CFG_RX_FIFOS_RADR_OK_TO_JUMP_VAL_SHIFT
3087 | 0x9ull << DC_LCB_CFG_RX_FIFOS_RADR_RST_VAL_SHIFT;
3088 tx_radr = 3ull << DC_LCB_CFG_TX_FIFOS_RADR_RST_VAL_SHIFT;
3089 } else if (version == 0x1a) {
3090 /* release 0x1a */
3091 /* LCB_CFG_RX_FIFOS_RADR = 0x988 */
3092 rx_radr =
3093 0x9ull << DC_LCB_CFG_RX_FIFOS_RADR_DO_NOT_JUMP_VAL_SHIFT
3094 | 0x8ull << DC_LCB_CFG_RX_FIFOS_RADR_OK_TO_JUMP_VAL_SHIFT
3095 | 0x8ull << DC_LCB_CFG_RX_FIFOS_RADR_RST_VAL_SHIFT;
3096 tx_radr = 7ull << DC_LCB_CFG_TX_FIFOS_RADR_RST_VAL_SHIFT;
3097 write_csr(dd, DC_LCB_CFG_LN_DCLK, 1ull);
3098 } else {
3099 /* release 0x1b and higher */
3100 /* LCB_CFG_RX_FIFOS_RADR = 0x877 */
3101 rx_radr =
3102 0x8ull << DC_LCB_CFG_RX_FIFOS_RADR_DO_NOT_JUMP_VAL_SHIFT
3103 | 0x7ull << DC_LCB_CFG_RX_FIFOS_RADR_OK_TO_JUMP_VAL_SHIFT
3104 | 0x7ull << DC_LCB_CFG_RX_FIFOS_RADR_RST_VAL_SHIFT;
3105 tx_radr = 3ull << DC_LCB_CFG_TX_FIFOS_RADR_RST_VAL_SHIFT;
3106 }
3107
3108 write_csr(dd, DC_LCB_CFG_RX_FIFOS_RADR, rx_radr);
3109 /* LCB_CFG_IGNORE_LOST_RCLK.EN = 1 */
3110 write_csr(dd, DC_LCB_CFG_IGNORE_LOST_RCLK,
3111 DC_LCB_CFG_IGNORE_LOST_RCLK_EN_SMASK);
3112 write_csr(dd, DC_LCB_CFG_TX_FIFOS_RADR, tx_radr);
3113}
3114
3115/*
3116 * Handle a SMA idle message
3117 *
3118 * This is a work-queue function outside of the interrupt.
3119 */
3120void handle_sma_message(struct work_struct *work)
3121{
3122 struct hfi1_pportdata *ppd = container_of(work, struct hfi1_pportdata,
3123 sma_message_work);
3124 struct hfi1_devdata *dd = ppd->dd;
3125 u64 msg;
3126 int ret;
3127
3128 /* msg is bytes 1-4 of the 40-bit idle message - the command code
3129 * is stripped off */
3130 ret = read_idle_sma(dd, &msg);
3131 if (ret)
3132 return;
3133 dd_dev_info(dd, "%s: SMA message 0x%llx\n", __func__, msg);
3134 /*
3135 * React to the SMA message. Byte[1] (0 for us) is the command.
3136 */
3137 switch (msg & 0xff) {
3138 case SMA_IDLE_ARM:
3139 /*
3140 * See OPAv1 table 9-14 - HFI and External Switch Ports Key
3141 * State Transitions
3142 *
3143 * Only expected in INIT or ARMED, discard otherwise.
3144 */
3145 if (ppd->host_link_state & (HLS_UP_INIT | HLS_UP_ARMED))
3146 ppd->neighbor_normal = 1;
3147 break;
3148 case SMA_IDLE_ACTIVE:
3149 /*
3150 * See OPAv1 table 9-14 - HFI and External Switch Ports Key
3151 * State Transitions
3152 *
3153 * Can activate the node. Discard otherwise.
3154 */
3155 if (ppd->host_link_state == HLS_UP_ARMED
3156 && ppd->is_active_optimize_enabled) {
3157 ppd->neighbor_normal = 1;
3158 ret = set_link_state(ppd, HLS_UP_ACTIVE);
3159 if (ret)
3160 dd_dev_err(
3161 dd,
3162 "%s: received Active SMA idle message, couldn't set link to Active\n",
3163 __func__);
3164 }
3165 break;
3166 default:
3167 dd_dev_err(dd,
3168 "%s: received unexpected SMA idle message 0x%llx\n",
3169 __func__, msg);
3170 break;
3171 }
3172}
3173
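/*
 * Read-modify-write RCV_CTRL under the rcvctrl lock: set the bits in
 * 'add', then clear the bits in 'clear'. add_rcvctrl() and
 * clear_rcvctrl() below are convenience wrappers.
 */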
3174static void adjust_rcvctrl(struct hfi1_devdata *dd, u64 add, u64 clear)
3175{
3176 u64 rcvctrl;
3177 unsigned long flags;
3178
3179 spin_lock_irqsave(&dd->rcvctrl_lock, flags);
3180 rcvctrl = read_csr(dd, RCV_CTRL);
3181 rcvctrl |= add;
3182 rcvctrl &= ~clear;
3183 write_csr(dd, RCV_CTRL, rcvctrl);
3184 spin_unlock_irqrestore(&dd->rcvctrl_lock, flags);
3185}
3186
3187static inline void add_rcvctrl(struct hfi1_devdata *dd, u64 add)
3188{
3189 adjust_rcvctrl(dd, add, 0);
3190}
3191
3192static inline void clear_rcvctrl(struct hfi1_devdata *dd, u64 clear)
3193{
3194 adjust_rcvctrl(dd, 0, clear);
3195}
3196
3197/*
3198 * Called from all interrupt handlers to start handling an SPC freeze.
3199 */
3200void start_freeze_handling(struct hfi1_pportdata *ppd, int flags)
3201{
3202 struct hfi1_devdata *dd = ppd->dd;
3203 struct send_context *sc;
3204 int i;
3205
3206 if (flags & FREEZE_SELF)
3207 write_csr(dd, CCE_CTRL, CCE_CTRL_SPC_FREEZE_SMASK);
3208
3209 /* enter frozen mode */
3210 dd->flags |= HFI1_FROZEN;
3211
3212 /* notify all SDMA engines that they are going into a freeze */
3213 sdma_freeze_notify(dd, !!(flags & FREEZE_LINK_DOWN));
3214
3215 /* do halt pre-handling on all enabled send contexts */
3216 for (i = 0; i < dd->num_send_contexts; i++) {
3217 sc = dd->send_contexts[i].sc;
3218 if (sc && (sc->flags & SCF_ENABLED))
3219 sc_stop(sc, SCF_FROZEN | SCF_HALTED);
3220 }
3221
3222 /* Send contexts are frozen. Notify user space */
3223 hfi1_set_uevent_bits(ppd, _HFI1_EVENT_FROZEN_BIT);
3224
3225 if (flags & FREEZE_ABORT) {
3226 dd_dev_err(dd,
3227 "Aborted freeze recovery. Please REBOOT system\n");
3228 return;
3229 }
3230 /* queue non-interrupt handler */
3231 queue_work(ppd->hfi1_wq, &ppd->freeze_work);
3232}
3233
3234/*
3235 * Wait until all 4 sub-blocks indicate that they have frozen or unfrozen,
3236 * depending on the "freeze" parameter.
3237 *
3238 * No need to return an error if it times out; our only option
3239 * is to proceed anyway.
3240 */
3241static void wait_for_freeze_status(struct hfi1_devdata *dd, int freeze)
3242{
3243 unsigned long timeout;
3244 u64 reg;
3245
3246 timeout = jiffies + msecs_to_jiffies(FREEZE_STATUS_TIMEOUT);
3247 while (1) {
3248 reg = read_csr(dd, CCE_STATUS);
3249 if (freeze) {
3250 /* waiting until all indicators are set */
3251 if ((reg & ALL_FROZE) == ALL_FROZE)
3252 return; /* all done */
3253 } else {
3254 /* waiting until all indicators are clear */
3255 if ((reg & ALL_FROZE) == 0)
3256 return; /* all done */
3257 }
3258
3259 if (time_after(jiffies, timeout)) {
3260 dd_dev_err(dd,
3261 "Time out waiting for SPC %sfreeze, bits 0x%llx, expecting 0x%llx, continuing",
3262 freeze ? "" : "un",
3263 reg & ALL_FROZE,
3264 freeze ? ALL_FROZE : 0ull);
3265 return;
3266 }
3267 usleep_range(80, 120);
3268 }
3269}
3270
3271/*
3272 * Do all freeze handling for the RXE block.
3273 */
3274static void rxe_freeze(struct hfi1_devdata *dd)
3275{
3276 int i;
3277
3278 /* disable port */
3279 clear_rcvctrl(dd, RCV_CTRL_RCV_PORT_ENABLE_SMASK);
3280
3281 /* disable all receive contexts */
3282 for (i = 0; i < dd->num_rcv_contexts; i++)
3283 hfi1_rcvctrl(dd, HFI1_RCVCTRL_CTXT_DIS, i);
3284}
3285
3286/*
3287 * Unfreeze handling for the RXE block - kernel contexts only.
3288 * This will also enable the port. User contexts will do unfreeze
3289 * handling on a per-context basis as they call into the driver.
3290 *
3291 */
3292static void rxe_kernel_unfreeze(struct hfi1_devdata *dd)
3293{
3294 int i;
3295
3296 /* enable all kernel contexts */
3297 for (i = 0; i < dd->n_krcv_queues; i++)
3298 hfi1_rcvctrl(dd, HFI1_RCVCTRL_CTXT_ENB, i);
3299
3300 /* enable port */
3301 add_rcvctrl(dd, RCV_CTRL_RCV_PORT_ENABLE_SMASK);
3302}
3303
3304/*
3305 * Non-interrupt SPC freeze handling.
3306 *
3307 * This is a work-queue function outside of the triggering interrupt.
3308 */
3309void handle_freeze(struct work_struct *work)
3310{
3311 struct hfi1_pportdata *ppd = container_of(work, struct hfi1_pportdata,
3312 freeze_work);
3313 struct hfi1_devdata *dd = ppd->dd;
3314
3315 /* wait for freeze indicators on all affected blocks */
3316 dd_dev_info(dd, "Entering SPC freeze\n");
3317 wait_for_freeze_status(dd, 1);
3318
3319 /* SPC is now frozen */
3320
3321 /* do send PIO freeze steps */
3322 pio_freeze(dd);
3323
3324 /* do send DMA freeze steps */
3325 sdma_freeze(dd);
3326
3327 /* do send egress freeze steps - nothing to do */
3328
3329 /* do receive freeze steps */
3330 rxe_freeze(dd);
3331
3332 /*
3333 * Unfreeze the hardware - clear the freeze, wait for each
3334 * block's frozen bit to clear, then clear the frozen flag.
3335 */
3336 write_csr(dd, CCE_CTRL, CCE_CTRL_SPC_UNFREEZE_SMASK);
3337 wait_for_freeze_status(dd, 0);
3338
3339 if (is_a0(dd)) {
3340 write_csr(dd, CCE_CTRL, CCE_CTRL_SPC_FREEZE_SMASK);
3341 wait_for_freeze_status(dd, 1);
3342 write_csr(dd, CCE_CTRL, CCE_CTRL_SPC_UNFREEZE_SMASK);
3343 wait_for_freeze_status(dd, 0);
3344 }
3345
3346 /* do send PIO unfreeze steps for kernel contexts */
3347 pio_kernel_unfreeze(dd);
3348
3349 /* do send DMA unfreeze steps */
3350 sdma_unfreeze(dd);
3351
3352 /* do send egress unfreeze steps - nothing to do */
3353
3354 /* do receive unfreeze steps for kernel contexts */
3355 rxe_kernel_unfreeze(dd);
3356
3357 /*
3358 * The unfreeze procedure touches global device registers when
3359 * it disables and re-enables RXE. Mark the device unfrozen
3360 * after all that is done so other parts of the driver waiting
3361 * for the device to unfreeze don't do things out of order.
3362 *
3363 * The above implies that the meaning of HFI1_FROZEN flag is
3364 * "Device has gone into freeze mode and freeze mode handling
3365 * is still in progress."
3366 *
3367 * The flag will be removed when freeze mode processing has
3368 * completed.
3369 */
3370 dd->flags &= ~HFI1_FROZEN;
3371 wake_up(&dd->event_queue);
3372
3373 /* no longer frozen */
3374 dd_dev_info(dd, "Exiting SPC freeze\n");
3375}
3376
3377/*
3378 * Handle a link up interrupt from the 8051.
3379 *
3380 * This is a work-queue function outside of the interrupt.
3381 */
3382void handle_link_up(struct work_struct *work)
3383{
3384 struct hfi1_pportdata *ppd = container_of(work, struct hfi1_pportdata,
3385 link_up_work);
3386 set_link_state(ppd, HLS_UP_INIT);
3387
3388 /* cache the read of DC_LCB_STS_ROUND_TRIP_LTP_CNT */
3389 read_ltp_rtt(ppd->dd);
3390 /*
3391 * OPA specifies that certain counters are cleared on a transition
3392 * to link up, so do that.
3393 */
3394 clear_linkup_counters(ppd->dd);
3395 /*
3396 * And (re)set link up default values.
3397 */
3398 set_linkup_defaults(ppd);
3399
3400 /* enforce link speed enabled */
3401 if ((ppd->link_speed_active & ppd->link_speed_enabled) == 0) {
3402 /* oops - current speed is not enabled, bounce */
3403 dd_dev_err(ppd->dd,
3404 "Link speed active 0x%x is outside enabled 0x%x, downing link\n",
3405 ppd->link_speed_active, ppd->link_speed_enabled);
3406 set_link_down_reason(ppd, OPA_LINKDOWN_REASON_SPEED_POLICY, 0,
3407 OPA_LINKDOWN_REASON_SPEED_POLICY);
3408 set_link_state(ppd, HLS_DN_OFFLINE);
3409 start_link(ppd);
3410 }
3411}
3412
3413/* Several pieces of LNI information were cached for SMA in ppd.
3414 * Reset these on link down */
3415static void reset_neighbor_info(struct hfi1_pportdata *ppd)
3416{
3417 ppd->neighbor_guid = 0;
3418 ppd->neighbor_port_number = 0;
3419 ppd->neighbor_type = 0;
3420 ppd->neighbor_fm_security = 0;
3421}
3422
3423/*
3424 * Handle a link down interrupt from the 8051.
3425 *
3426 * This is a work-queue function outside of the interrupt.
3427 */
3428void handle_link_down(struct work_struct *work)
3429{
3430 u8 lcl_reason, neigh_reason = 0;
3431 struct hfi1_pportdata *ppd = container_of(work, struct hfi1_pportdata,
3432 link_down_work);
3433
3434 /* go offline first, then deal with reasons */
3435 set_link_state(ppd, HLS_DN_OFFLINE);
3436
3437 lcl_reason = 0;
3438 read_planned_down_reason_code(ppd->dd, &neigh_reason);
3439
3440 /*
3441 * If no reason, assume peer-initiated but missed
3442 * LinkGoingDown idle flits.
3443 */
3444 if (neigh_reason == 0)
3445 lcl_reason = OPA_LINKDOWN_REASON_NEIGHBOR_UNKNOWN;
3446
3447 set_link_down_reason(ppd, lcl_reason, neigh_reason, 0);
3448
3449 reset_neighbor_info(ppd);
3450
3451 /* disable the port */
3452 clear_rcvctrl(ppd->dd, RCV_CTRL_RCV_PORT_ENABLE_SMASK);
3453
3454 /* If there is no cable attached, turn the DC off. Otherwise,
3455 * start the link bring-up. */
3456 if (!qsfp_mod_present(ppd))
3457 dc_shutdown(ppd->dd);
3458 else
3459 start_link(ppd);
3460}
3461
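/*
 * Bounce the link: if it is currently up, take it offline and restart
 * the link bring-up.
 *
 * This is a work-queue function outside of the interrupt.
 */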
3462void handle_link_bounce(struct work_struct *work)
3463{
3464 struct hfi1_pportdata *ppd = container_of(work, struct hfi1_pportdata,
3465 link_bounce_work);
3466
3467 /*
3468 * Only do something if the link is currently up.
3469 */
3470 if (ppd->host_link_state & HLS_UP) {
3471 set_link_state(ppd, HLS_DN_OFFLINE);
3472 start_link(ppd);
3473 } else {
3474 dd_dev_info(ppd->dd, "%s: link not up (%s), nothing to do\n",
3475 __func__, link_state_name(ppd->host_link_state));
3476 }
3477}
3478
3479/*
3480 * Mask conversion: Capability exchange to Port LTP. The capability
3481 * exchange has an implicit 16b CRC that is mandatory.
3482 */
3483static int cap_to_port_ltp(int cap)
3484{
3485 int port_ltp = PORT_LTP_CRC_MODE_16; /* this mode is mandatory */
3486
3487 if (cap & CAP_CRC_14B)
3488 port_ltp |= PORT_LTP_CRC_MODE_14;
3489 if (cap & CAP_CRC_48B)
3490 port_ltp |= PORT_LTP_CRC_MODE_48;
3491 if (cap & CAP_CRC_12B_16B_PER_LANE)
3492 port_ltp |= PORT_LTP_CRC_MODE_PER_LANE;
3493
3494 return port_ltp;
3495}
3496
3497/*
3498 * Convert an OPA Port LTP mask to capability mask
3499 */
3500int port_ltp_to_cap(int port_ltp)
3501{
3502 int cap_mask = 0;
3503
3504 if (port_ltp & PORT_LTP_CRC_MODE_14)
3505 cap_mask |= CAP_CRC_14B;
3506 if (port_ltp & PORT_LTP_CRC_MODE_48)
3507 cap_mask |= CAP_CRC_48B;
3508 if (port_ltp & PORT_LTP_CRC_MODE_PER_LANE)
3509 cap_mask |= CAP_CRC_12B_16B_PER_LANE;
3510
3511 return cap_mask;
3512}
3513
3514/*
3515 * Convert a single DC LCB CRC mode to an OPA Port LTP mask.
3516 */
3517static int lcb_to_port_ltp(int lcb_crc)
3518{
3519 int port_ltp = 0;
3520
3521 if (lcb_crc == LCB_CRC_12B_16B_PER_LANE)
3522 port_ltp = PORT_LTP_CRC_MODE_PER_LANE;
3523 else if (lcb_crc == LCB_CRC_48B)
3524 port_ltp = PORT_LTP_CRC_MODE_48;
3525 else if (lcb_crc == LCB_CRC_14B)
3526 port_ltp = PORT_LTP_CRC_MODE_14;
3527 else
3528 port_ltp = PORT_LTP_CRC_MODE_16;
3529
3530 return port_ltp;
3531}
3532
3533/*
3534 * Our neighbor has indicated that we are allowed to act as a fabric
3535 * manager, so place the full management partition key in the second
3536 * (0-based) pkey array position (see OPAv1, section 20.2.2.6.8). Note
3537 * that we should already have the limited management partition key in
3538 * array element 1, and also that the port is not yet up when
3539 * add_full_mgmt_pkey() is invoked.
3540 */
3541static void add_full_mgmt_pkey(struct hfi1_pportdata *ppd)
3542{
3543 struct hfi1_devdata *dd = ppd->dd;
3544
3545 /* Sanity check - ppd->pkeys[2] should be 0 */
3546 if (ppd->pkeys[2] != 0)
3547 dd_dev_err(dd, "%s pkey[2] already set to 0x%x, resetting it to 0x%x\n",
3548 __func__, ppd->pkeys[2], FULL_MGMT_P_KEY);
3549 ppd->pkeys[2] = FULL_MGMT_P_KEY;
3550 (void)hfi1_set_ib_cfg(ppd, HFI1_IB_CFG_PKEYS, 0);
3551}
3552
3553/*
3554 * Convert the given link width to the OPA link width bitmask.
3555 */
3556static u16 link_width_to_bits(struct hfi1_devdata *dd, u16 width)
3557{
3558 switch (width) {
3559 case 0:
3560 /*
3561 * Simulator and quick linkup do not set the width.
3562 * Just set it to 4x without complaint.
3563 */
3564 if (dd->icode == ICODE_FUNCTIONAL_SIMULATOR || quick_linkup)
3565 return OPA_LINK_WIDTH_4X;
3566 return 0; /* no lanes up */
3567 case 1: return OPA_LINK_WIDTH_1X;
3568 case 2: return OPA_LINK_WIDTH_2X;
3569 case 3: return OPA_LINK_WIDTH_3X;
3570 default:
3571 dd_dev_info(dd, "%s: invalid width %d, using 4\n",
3572 __func__, width);
3573 /* fall through */
3574 case 4: return OPA_LINK_WIDTH_4X;
3575 }
3576}
3577
3578/*
3579 * Do a population count on the bottom nibble.
3580 */
3581static const u8 bit_counts[16] = {
3582 0, 1, 1, 2, 1, 2, 2, 3, 1, 2, 2, 3, 2, 3, 3, 4
3583};
3584static inline u8 nibble_to_count(u8 nibble)
3585{
3586 return bit_counts[nibble & 0xf];
3587}
3588
3589/*
3590 * Read the active lane information from the 8051 registers and return
3591 * their widths.
3592 *
3593 * Active lane information is found in these 8051 registers:
3594 * enable_lane_tx
3595 * enable_lane_rx
3596 */
3597static void get_link_widths(struct hfi1_devdata *dd, u16 *tx_width,
3598 u16 *rx_width)
3599{
3600 u16 tx, rx;
3601 u8 enable_lane_rx;
3602 u8 enable_lane_tx;
3603 u8 tx_polarity_inversion;
3604 u8 rx_polarity_inversion;
3605 u8 max_rate;
3606
3607 /* read the active lanes */
3608 read_tx_settings(dd, &enable_lane_tx, &tx_polarity_inversion,
3609 &rx_polarity_inversion, &max_rate);
3610 read_local_lni(dd, &enable_lane_rx);
3611
3612 /* convert to counts */
3613 tx = nibble_to_count(enable_lane_tx);
3614 rx = nibble_to_count(enable_lane_rx);
3615
3616 /*
3617 * Set link_speed_active here, overriding what was set in
3618 * handle_verify_cap(). The ASIC 8051 firmware does not correctly
3619 * set the max_rate field in handle_verify_cap until v0.19.
3620 */
3621 if ((dd->icode == ICODE_RTL_SILICON)
3622 && (dd->dc8051_ver < dc8051_ver(0, 19))) {
3623 /* max_rate: 0 = 12.5G, 1 = 25G */
3624 switch (max_rate) {
3625 case 0:
3626 dd->pport[0].link_speed_active = OPA_LINK_SPEED_12_5G;
3627 break;
3628 default:
3629 dd_dev_err(dd,
3630 "%s: unexpected max rate %d, using 25Gb\n",
3631 __func__, (int)max_rate);
3632 /* fall through */
3633 case 1:
3634 dd->pport[0].link_speed_active = OPA_LINK_SPEED_25G;
3635 break;
3636 }
3637 }
3638
3639 dd_dev_info(dd,
3640 "Fabric active lanes (width): tx 0x%x (%d), rx 0x%x (%d)\n",
3641 enable_lane_tx, tx, enable_lane_rx, rx);
3642 *tx_width = link_width_to_bits(dd, tx);
3643 *rx_width = link_width_to_bits(dd, rx);
3644}
3645
3646/*
3647 * Read verify_cap_local_fm_link_width[1] to obtain the link widths.
3648 * Valid after the end of VerifyCap and during LinkUp. Does not change
3649 * after link up. I.e. look elsewhere for downgrade information.
3650 *
3651 * Bits are:
3652 * + bits [7:4] contain the number of active transmitters
3653 * + bits [3:0] contain the number of active receivers
3654 * These are numbers 1 through 4 and can be different values if the
3655 * link is asymmetric.
3656 *
3657 * verify_cap_local_fm_link_width[0] retains its original value.
3658 */
3659static void get_linkup_widths(struct hfi1_devdata *dd, u16 *tx_width,
3660 u16 *rx_width)
3661{
3662 u16 widths, tx, rx;
3663 u8 misc_bits, local_flags;
3664 u16 active_tx, active_rx;
3665
3666 read_vc_local_link_width(dd, &misc_bits, &local_flags, &widths);
3667 tx = widths >> 12;
3668 rx = (widths >> 8) & 0xf;
3669
3670 *tx_width = link_width_to_bits(dd, tx);
3671 *rx_width = link_width_to_bits(dd, rx);
3672
3673 /* print the active widths */
3674 get_link_widths(dd, &active_tx, &active_rx);
3675}
3676
3677/*
3678 * Set ppd->link_width_active and ppd->link_width_downgrade_active using
3679 * hardware information when the link first comes up.
3680 *
3681 * The link width is not available until after VerifyCap.AllFramesReceived
3682 * (the trigger for handle_verify_cap), so this is outside that routine
3683 * and should be called when the 8051 signals linkup.
3684 */
3685void get_linkup_link_widths(struct hfi1_pportdata *ppd)
3686{
3687 u16 tx_width, rx_width;
3688
3689 /* get end-of-LNI link widths */
3690 get_linkup_widths(ppd->dd, &tx_width, &rx_width);
3691
3692 /* use tx_width as the link is supposed to be symmetric on link up */
3693 ppd->link_width_active = tx_width;
3694 /* link width downgrade active (LWD.A) starts out matching LW.A */
3695 ppd->link_width_downgrade_tx_active = ppd->link_width_active;
3696 ppd->link_width_downgrade_rx_active = ppd->link_width_active;
3697 /* per OPA spec, on link up LWD.E resets to LWD.S */
3698 ppd->link_width_downgrade_enabled = ppd->link_width_downgrade_supported;
3699 /* cache the active egress rate (units [10^6 bits/sec]) */
3700 ppd->current_egress_rate = active_egress_rate(ppd);
3701}
3702
3703/*
3704 * Handle a verify capabilities interrupt from the 8051.
3705 *
3706 * This is a work-queue function outside of the interrupt.
3707 */
3708void handle_verify_cap(struct work_struct *work)
3709{
3710 struct hfi1_pportdata *ppd = container_of(work, struct hfi1_pportdata,
3711 link_vc_work);
3712 struct hfi1_devdata *dd = ppd->dd;
3713 u64 reg;
3714 u8 power_management;
3715 u8 continuous;
3716 u8 vcu;
3717 u8 vau;
3718 u8 z;
3719 u16 vl15buf;
3720 u16 link_widths;
3721 u16 crc_mask;
3722 u16 crc_val;
3723 u16 device_id;
3724 u16 active_tx, active_rx;
3725 u8 partner_supported_crc;
3726 u8 remote_tx_rate;
3727 u8 device_rev;
3728
3729 set_link_state(ppd, HLS_VERIFY_CAP);
3730
3731 lcb_shutdown(dd, 0);
3732 adjust_lcb_for_fpga_serdes(dd);
3733
3734 /*
3735 * These are now valid:
3736 * remote VerifyCap fields in the general LNI config
3737 * CSR DC8051_STS_REMOTE_GUID
3738 * CSR DC8051_STS_REMOTE_NODE_TYPE
3739 * CSR DC8051_STS_REMOTE_FM_SECURITY
3740 * CSR DC8051_STS_REMOTE_PORT_NO
3741 */
3742
3743 read_vc_remote_phy(dd, &power_management, &continuous);
3744 read_vc_remote_fabric(
3745 dd,
3746 &vau,
3747 &z,
3748 &vcu,
3749 &vl15buf,
3750 &partner_supported_crc);
3751 read_vc_remote_link_width(dd, &remote_tx_rate, &link_widths);
3752 read_remote_device_id(dd, &device_id, &device_rev);
3753 /*
3754 * And the 'MgmtAllowed' information, which is exchanged during
3755 * LNI, is also available at this point.
3756 */
3757 read_mgmt_allowed(dd, &ppd->mgmt_allowed);
3758 /* print the active widths */
3759 get_link_widths(dd, &active_tx, &active_rx);
3760 dd_dev_info(dd,
3761 "Peer PHY: power management 0x%x, continuous updates 0x%x\n",
3762 (int)power_management, (int)continuous);
3763 dd_dev_info(dd,
3764 "Peer Fabric: vAU %d, Z %d, vCU %d, vl15 credits 0x%x, CRC sizes 0x%x\n",
3765 (int)vau,
3766 (int)z,
3767 (int)vcu,
3768 (int)vl15buf,
3769 (int)partner_supported_crc);
3770 dd_dev_info(dd, "Peer Link Width: tx rate 0x%x, widths 0x%x\n",
3771 (u32)remote_tx_rate, (u32)link_widths);
3772 dd_dev_info(dd, "Peer Device ID: 0x%04x, Revision 0x%02x\n",
3773 (u32)device_id, (u32)device_rev);
3774 /*
3775 * The peer vAU value just read is the peer receiver value. HFI does
3776 * not support a transmit vAU of 0 (AU == 8). We advertised that
3777 * with Z=1 in the fabric capabilities sent to the peer. The peer
3778 * will see our Z=1, and, if it advertised a vAU of 0, will move its
3779 * receive to vAU of 1 (AU == 16). Do the same here. We do not care
3780 * about the peer Z value - our sent vAU is 3 (hardwired) and is not
3781 * subject to the Z value exception.
3782 */
3783 if (vau == 0)
3784 vau = 1;
3785 set_up_vl15(dd, vau, vl15buf);
3786
3787 /* set up the LCB CRC mode */
3788 crc_mask = ppd->port_crc_mode_enabled & partner_supported_crc;
3789
3790 /* order is important: use the lowest bit in common */
3791 if (crc_mask & CAP_CRC_14B)
3792 crc_val = LCB_CRC_14B;
3793 else if (crc_mask & CAP_CRC_48B)
3794 crc_val = LCB_CRC_48B;
3795 else if (crc_mask & CAP_CRC_12B_16B_PER_LANE)
3796 crc_val = LCB_CRC_12B_16B_PER_LANE;
3797 else
3798 crc_val = LCB_CRC_16B;
3799
3800 dd_dev_info(dd, "Final LCB CRC mode: %d\n", (int)crc_val);
3801 write_csr(dd, DC_LCB_CFG_CRC_MODE,
3802 (u64)crc_val << DC_LCB_CFG_CRC_MODE_TX_VAL_SHIFT);
3803
3804 /* set (14b only) or clear sideband credit */
3805 reg = read_csr(dd, SEND_CM_CTRL);
3806 if (crc_val == LCB_CRC_14B && crc_14b_sideband) {
3807 write_csr(dd, SEND_CM_CTRL,
3808 reg | SEND_CM_CTRL_FORCE_CREDIT_MODE_SMASK);
3809 } else {
3810 write_csr(dd, SEND_CM_CTRL,
3811 reg & ~SEND_CM_CTRL_FORCE_CREDIT_MODE_SMASK);
3812 }
3813
3814 ppd->link_speed_active = 0; /* invalid value */
3815 if (dd->dc8051_ver < dc8051_ver(0, 20)) {
3816 /* remote_tx_rate: 0 = 12.5G, 1 = 25G */
3817 switch (remote_tx_rate) {
3818 case 0:
3819 ppd->link_speed_active = OPA_LINK_SPEED_12_5G;
3820 break;
3821 case 1:
3822 ppd->link_speed_active = OPA_LINK_SPEED_25G;
3823 break;
3824 }
3825 } else {
3826 /* actual rate is highest bit of the ANDed rates */
3827 u8 rate = remote_tx_rate & ppd->local_tx_rate;
3828
3829 if (rate & 2)
3830 ppd->link_speed_active = OPA_LINK_SPEED_25G;
3831 else if (rate & 1)
3832 ppd->link_speed_active = OPA_LINK_SPEED_12_5G;
3833 }
3834 if (ppd->link_speed_active == 0) {
3835 dd_dev_err(dd, "%s: unexpected remote tx rate %d, using 25Gb\n",
3836 __func__, (int)remote_tx_rate);
3837 ppd->link_speed_active = OPA_LINK_SPEED_25G;
3838 }
3839
3840 /*
3841 * Cache the values of the supported, enabled, and active
3842 * LTP CRC modes to return in 'portinfo' queries. But the bit
3843 * flags that are returned in the portinfo query differ from
3844 * what's in the link_crc_mask, crc_sizes, and crc_val
3845 * variables. Convert these here.
3846 */
3847 ppd->port_ltp_crc_mode = cap_to_port_ltp(link_crc_mask) << 8;
3848 /* supported crc modes */
3849 ppd->port_ltp_crc_mode |=
3850 cap_to_port_ltp(ppd->port_crc_mode_enabled) << 4;
3851 /* enabled crc modes */
3852 ppd->port_ltp_crc_mode |= lcb_to_port_ltp(crc_val);
3853 /* active crc mode */
3854
3855 /* set up the remote credit return table */
3856 assign_remote_cm_au_table(dd, vcu);
3857
3858 /*
3859 * The LCB is reset on entry to handle_verify_cap(), so this must
3860 * be applied on every link up.
3861 *
3862 * Adjust LCB error kill enable to kill the link if
3863 * these RBUF errors are seen:
3864 * REPLAY_BUF_MBE_SMASK
3865 * FLIT_INPUT_BUF_MBE_SMASK
3866 */
3867 if (is_a0(dd)) { /* fixed in B0 */
3868 reg = read_csr(dd, DC_LCB_CFG_LINK_KILL_EN);
3869 reg |= DC_LCB_CFG_LINK_KILL_EN_REPLAY_BUF_MBE_SMASK
3870 | DC_LCB_CFG_LINK_KILL_EN_FLIT_INPUT_BUF_MBE_SMASK;
3871 write_csr(dd, DC_LCB_CFG_LINK_KILL_EN, reg);
3872 }
3873
3874 /* pull LCB fifos out of reset - all fifo clocks must be stable */
3875 write_csr(dd, DC_LCB_CFG_TX_FIFOS_RESET, 0);
3876
3877 /* give 8051 access to the LCB CSRs */
3878 write_csr(dd, DC_LCB_ERR_EN, 0); /* mask LCB errors */
3879 set_8051_lcb_access(dd);
3880
3881 ppd->neighbor_guid =
3882 read_csr(dd, DC_DC8051_STS_REMOTE_GUID);
3883 ppd->neighbor_port_number = read_csr(dd, DC_DC8051_STS_REMOTE_PORT_NO) &
3884 DC_DC8051_STS_REMOTE_PORT_NO_VAL_SMASK;
3885 ppd->neighbor_type =
3886 read_csr(dd, DC_DC8051_STS_REMOTE_NODE_TYPE) &
3887 DC_DC8051_STS_REMOTE_NODE_TYPE_VAL_MASK;
3888 ppd->neighbor_fm_security =
3889 read_csr(dd, DC_DC8051_STS_REMOTE_FM_SECURITY) &
3890 DC_DC8051_STS_LOCAL_FM_SECURITY_DISABLED_MASK;
3891 dd_dev_info(dd,
3892 "Neighbor Guid: %llx Neighbor type %d MgmtAllowed %d FM security bypass %d\n",
3893 ppd->neighbor_guid, ppd->neighbor_type,
3894 ppd->mgmt_allowed, ppd->neighbor_fm_security);
3895 if (ppd->mgmt_allowed)
3896 add_full_mgmt_pkey(ppd);
3897
3898 /* tell the 8051 to go to LinkUp */
3899 set_link_state(ppd, HLS_GOING_UP);
3900}
3901
3902/*
3903 * Apply the link width downgrade enabled policy against the current active
3904 * link widths.
3905 *
3906 * Called when the enabled policy changes or the active link widths change.
3907 */
3908void apply_link_downgrade_policy(struct hfi1_pportdata *ppd, int refresh_widths)
3909{
3910 int do_bounce = 0;
3911 int tries;
3912 u16 lwde;
3913 u16 tx, rx;
3914
3915 /* use the hls lock to avoid a race with actual link up */
3916 tries = 0;
3917retry:
3918 mutex_lock(&ppd->hls_lock);
3919 /* only apply if the link is up */
3920 if (!(ppd->host_link_state & HLS_UP)) {
3921 /* still going up..wait and retry */
3922 if (ppd->host_link_state & HLS_GOING_UP) {
3923 if (++tries < 1000) {
3924 mutex_unlock(&ppd->hls_lock);
3925 usleep_range(100, 120); /* arbitrary */
3926 goto retry;
3927 }
3928 dd_dev_err(ppd->dd,
3929 "%s: giving up waiting for link state change\n",
3930 __func__);
3931 }
3932 goto done;
3933 }
3934
3935 lwde = ppd->link_width_downgrade_enabled;
3936
3937 if (refresh_widths) {
3938 get_link_widths(ppd->dd, &tx, &rx);
3939 ppd->link_width_downgrade_tx_active = tx;
3940 ppd->link_width_downgrade_rx_active = rx;
3941 }
3942
3943 if (lwde == 0) {
3944 /* downgrade is disabled */
3945
3946 /* bounce if not at starting active width */
3947 if ((ppd->link_width_active !=
3948 ppd->link_width_downgrade_tx_active)
3949 || (ppd->link_width_active !=
3950 ppd->link_width_downgrade_rx_active)) {
3951 dd_dev_err(ppd->dd,
3952 "Link downgrade is disabled and link has downgraded, downing link\n");
3953 dd_dev_err(ppd->dd,
3954 " original 0x%x, tx active 0x%x, rx active 0x%x\n",
3955 ppd->link_width_active,
3956 ppd->link_width_downgrade_tx_active,
3957 ppd->link_width_downgrade_rx_active);
3958 do_bounce = 1;
3959 }
3960 } else if ((lwde & ppd->link_width_downgrade_tx_active) == 0
3961 || (lwde & ppd->link_width_downgrade_rx_active) == 0) {
3962 /* Tx or Rx is outside the enabled policy */
3963 dd_dev_err(ppd->dd,
3964 "Link is outside of downgrade allowed, downing link\n");
3965 dd_dev_err(ppd->dd,
3966 " enabled 0x%x, tx active 0x%x, rx active 0x%x\n",
3967 lwde,
3968 ppd->link_width_downgrade_tx_active,
3969 ppd->link_width_downgrade_rx_active);
3970 do_bounce = 1;
3971 }
3972
3973done:
3974 mutex_unlock(&ppd->hls_lock);
3975
3976 if (do_bounce) {
3977 set_link_down_reason(ppd, OPA_LINKDOWN_REASON_WIDTH_POLICY, 0,
3978 OPA_LINKDOWN_REASON_WIDTH_POLICY);
3979 set_link_state(ppd, HLS_DN_OFFLINE);
3980 start_link(ppd);
3981 }
3982}
3983
3984/*
3985 * Handle a link downgrade interrupt from the 8051.
3986 *
3987 * This is a work-queue function outside of the interrupt.
3988 */
3989void handle_link_downgrade(struct work_struct *work)
3990{
3991 struct hfi1_pportdata *ppd = container_of(work, struct hfi1_pportdata,
3992 link_downgrade_work);
3993
3994 dd_dev_info(ppd->dd, "8051: Link width downgrade\n");
3995 apply_link_downgrade_policy(ppd, 1);
3996}
3997
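/* Flag-to-string helpers used when reporting DC error interrupts. */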
3998static char *dcc_err_string(char *buf, int buf_len, u64 flags)
3999{
4000 return flag_string(buf, buf_len, flags, dcc_err_flags,
4001 ARRAY_SIZE(dcc_err_flags));
4002}
4003
4004static char *lcb_err_string(char *buf, int buf_len, u64 flags)
4005{
4006 return flag_string(buf, buf_len, flags, lcb_err_flags,
4007 ARRAY_SIZE(lcb_err_flags));
4008}
4009
4010static char *dc8051_err_string(char *buf, int buf_len, u64 flags)
4011{
4012 return flag_string(buf, buf_len, flags, dc8051_err_flags,
4013 ARRAY_SIZE(dc8051_err_flags));
4014}
4015
4016static char *dc8051_info_err_string(char *buf, int buf_len, u64 flags)
4017{
4018 return flag_string(buf, buf_len, flags, dc8051_info_err_flags,
4019 ARRAY_SIZE(dc8051_info_err_flags));
4020}
4021
4022static char *dc8051_info_host_msg_string(char *buf, int buf_len, u64 flags)
4023{
4024 return flag_string(buf, buf_len, flags, dc8051_info_host_msg_flags,
4025 ARRAY_SIZE(dc8051_info_host_msg_flags));
4026}
4027
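/*
 * DC 8051 error interrupt handler: decode the error and host message
 * flags reported by the 8051 firmware, queue the matching work items
 * (SMA message, link up, verify cap, link down, downgrade), and report
 * anything left over.
 */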
4028static void handle_8051_interrupt(struct hfi1_devdata *dd, u32 unused, u64 reg)
4029{
4030 struct hfi1_pportdata *ppd = dd->pport;
4031 u64 info, err, host_msg;
4032 int queue_link_down = 0;
4033 char buf[96];
4034
4035 /* look at the flags */
4036 if (reg & DC_DC8051_ERR_FLG_SET_BY_8051_SMASK) {
4037 /* 8051 information set by firmware */
4038 /* read DC8051_DBG_ERR_INFO_SET_BY_8051 for details */
4039 info = read_csr(dd, DC_DC8051_DBG_ERR_INFO_SET_BY_8051);
4040 err = (info >> DC_DC8051_DBG_ERR_INFO_SET_BY_8051_ERROR_SHIFT)
4041 & DC_DC8051_DBG_ERR_INFO_SET_BY_8051_ERROR_MASK;
4042 host_msg = (info >>
4043 DC_DC8051_DBG_ERR_INFO_SET_BY_8051_HOST_MSG_SHIFT)
4044 & DC_DC8051_DBG_ERR_INFO_SET_BY_8051_HOST_MSG_MASK;
4045
4046 /*
4047 * Handle error flags.
4048 */
4049 if (err & FAILED_LNI) {
4050 /*
4051 * LNI error indications are cleared by the 8051
4052 * only when starting polling. Only pay attention
4053 * to them when in the states that occur during
4054 * LNI.
4055 */
4056 if (ppd->host_link_state
4057 & (HLS_DN_POLL | HLS_VERIFY_CAP | HLS_GOING_UP)) {
4058 queue_link_down = 1;
4059 dd_dev_info(dd, "Link error: %s\n",
4060 dc8051_info_err_string(buf,
4061 sizeof(buf),
4062 err & FAILED_LNI));
4063 }
4064 err &= ~(u64)FAILED_LNI;
4065 }
4066 if (err) {
4067 /* report remaining errors, but do not do anything */
4068 dd_dev_err(dd, "8051 info error: %s\n",
4069 dc8051_info_err_string(buf, sizeof(buf), err));
4070 }
4071
4072 /*
4073 * Handle host message flags.
4074 */
4075 if (host_msg & HOST_REQ_DONE) {
4076 /*
4077 * Presently, the driver does a busy wait for
4078 * host requests to complete. This is only an
4079 * informational message.
4080 * NOTE: The 8051 clears the host message
4081 * information *on the next 8051 command*.
4082 * Therefore, when linkup is achieved,
4083 * this flag will still be set.
4084 */
4085 host_msg &= ~(u64)HOST_REQ_DONE;
4086 }
4087 if (host_msg & BC_SMA_MSG) {
4088 queue_work(ppd->hfi1_wq, &ppd->sma_message_work);
4089 host_msg &= ~(u64)BC_SMA_MSG;
4090 }
4091 if (host_msg & LINKUP_ACHIEVED) {
4092 dd_dev_info(dd, "8051: Link up\n");
4093 queue_work(ppd->hfi1_wq, &ppd->link_up_work);
4094 host_msg &= ~(u64)LINKUP_ACHIEVED;
4095 }
4096 if (host_msg & EXT_DEVICE_CFG_REQ) {
4097 handle_8051_request(dd);
4098 host_msg &= ~(u64)EXT_DEVICE_CFG_REQ;
4099 }
4100 if (host_msg & VERIFY_CAP_FRAME) {
4101 queue_work(ppd->hfi1_wq, &ppd->link_vc_work);
4102 host_msg &= ~(u64)VERIFY_CAP_FRAME;
4103 }
4104 if (host_msg & LINK_GOING_DOWN) {
4105 const char *extra = "";
4106 /* no downgrade action needed if going down */
4107 if (host_msg & LINK_WIDTH_DOWNGRADED) {
4108 host_msg &= ~(u64)LINK_WIDTH_DOWNGRADED;
4109 extra = " (ignoring downgrade)";
4110 }
4111 dd_dev_info(dd, "8051: Link down%s\n", extra);
4112 queue_link_down = 1;
4113 host_msg &= ~(u64)LINK_GOING_DOWN;
4114 }
4115 if (host_msg & LINK_WIDTH_DOWNGRADED) {
4116 queue_work(ppd->hfi1_wq, &ppd->link_downgrade_work);
4117 host_msg &= ~(u64)LINK_WIDTH_DOWNGRADED;
4118 }
4119 if (host_msg) {
4120 /* report remaining messages, but do not do anything */
4121 dd_dev_info(dd, "8051 info host message: %s\n",
4122 dc8051_info_host_msg_string(buf, sizeof(buf),
4123 host_msg));
4124 }
4125
4126 reg &= ~DC_DC8051_ERR_FLG_SET_BY_8051_SMASK;
4127 }
4128 if (reg & DC_DC8051_ERR_FLG_LOST_8051_HEART_BEAT_SMASK) {
4129 /*
4130 * Lost the 8051 heartbeat. If this happens, we
4131 * receive constant interrupts about it. Disable
4132 * the interrupt after the first.
4133 */
4134 dd_dev_err(dd, "Lost 8051 heartbeat\n");
4135 write_csr(dd, DC_DC8051_ERR_EN,
4136 read_csr(dd, DC_DC8051_ERR_EN)
4137 & ~DC_DC8051_ERR_EN_LOST_8051_HEART_BEAT_SMASK);
4138
4139 reg &= ~DC_DC8051_ERR_FLG_LOST_8051_HEART_BEAT_SMASK;
4140 }
4141 if (reg) {
4142 /* report the error, but do not do anything */
4143 dd_dev_err(dd, "8051 error: %s\n",
4144 dc8051_err_string(buf, sizeof(buf), reg));
4145 }
4146
4147 if (queue_link_down) {
4148 /* if the link is already going down or disabled, do not
4149 * queue another */
4150 if ((ppd->host_link_state
4151 & (HLS_GOING_OFFLINE|HLS_LINK_COOLDOWN))
4152 || ppd->link_enabled == 0) {
4153 dd_dev_info(dd, "%s: not queuing link down\n",
4154 __func__);
4155 } else {
4156 queue_work(ppd->hfi1_wq, &ppd->link_down_work);
4157 }
4158 }
4159}
4160
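/* FMConfig error info codes (DCC_ERR_INFO_FMCONFIG) and their descriptions */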
4161static const char * const fm_config_txt[] = {
4162[0] =
4163 "BadHeadDist: Distance violation between two head flits",
4164[1] =
4165 "BadTailDist: Distance violation between two tail flits",
4166[2] =
4167 "BadCtrlDist: Distance violation between two credit control flits",
4168[3] =
4169 "BadCrdAck: Credits return for unsupported VL",
4170[4] =
4171 "UnsupportedVLMarker: Received VL Marker",
4172[5] =
4173 "BadPreempt: Exceeded the preemption nesting level",
4174[6] =
4175 "BadControlFlit: Received unsupported control flit",
4176/* no 7 */
4177[8] =
4178 "UnsupportedVLMarker: Received VL Marker for unconfigured or disabled VL",
4179};
4180
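/* PortRcv error info codes (DCC_ERR_INFO_PORTRCV) and their descriptions */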
4181static const char * const port_rcv_txt[] = {
4182[1] =
4183 "BadPktLen: Illegal PktLen",
4184[2] =
4185 "PktLenTooLong: Packet longer than PktLen",
4186[3] =
4187 "PktLenTooShort: Packet shorter than PktLen",
4188[4] =
4189 "BadSLID: Illegal SLID (0, using multicast as SLID, does not include security validation of SLID)",
4190[5] =
4191 "BadDLID: Illegal DLID (0, doesn't match HFI)",
4192[6] =
4193 "BadL2: Illegal L2 opcode",
4194[7] =
4195 "BadSC: Unsupported SC",
4196[9] =
4197 "BadRC: Illegal RC",
4198[11] =
4199 "PreemptError: Preempting with same VL",
4200[12] =
4201 "PreemptVL15: Preempting a VL15 packet",
4202};
4203
4204#define OPA_LDR_FMCONFIG_OFFSET 16
4205#define OPA_LDR_PORTRCV_OFFSET 0
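/*
 * DCC error interrupt handler: latch error info for later queries,
 * report the details, and bounce the link if the FM's PortErrorAction
 * policy asks for it.
 */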
4206static void handle_dcc_err(struct hfi1_devdata *dd, u32 unused, u64 reg)
4207{
4208 u64 info, hdr0, hdr1;
4209 const char *extra;
4210 char buf[96];
4211 struct hfi1_pportdata *ppd = dd->pport;
4212 u8 lcl_reason = 0;
4213 int do_bounce = 0;
4214
4215 if (reg & DCC_ERR_FLG_UNCORRECTABLE_ERR_SMASK) {
4216 if (!(dd->err_info_uncorrectable & OPA_EI_STATUS_SMASK)) {
4217 info = read_csr(dd, DCC_ERR_INFO_UNCORRECTABLE);
4218 dd->err_info_uncorrectable = info & OPA_EI_CODE_SMASK;
4219 /* set status bit */
4220 dd->err_info_uncorrectable |= OPA_EI_STATUS_SMASK;
4221 }
4222 reg &= ~DCC_ERR_FLG_UNCORRECTABLE_ERR_SMASK;
4223 }
4224
4225 if (reg & DCC_ERR_FLG_LINK_ERR_SMASK) {
4226 struct hfi1_pportdata *ppd = dd->pport;
4227 /* this counter saturates at (2^32) - 1 */
4228 if (ppd->link_downed < (u32)UINT_MAX)
4229 ppd->link_downed++;
4230 reg &= ~DCC_ERR_FLG_LINK_ERR_SMASK;
4231 }
4232
4233 if (reg & DCC_ERR_FLG_FMCONFIG_ERR_SMASK) {
4234 u8 reason_valid = 1;
4235
4236 info = read_csr(dd, DCC_ERR_INFO_FMCONFIG);
4237 if (!(dd->err_info_fmconfig & OPA_EI_STATUS_SMASK)) {
4238 dd->err_info_fmconfig = info & OPA_EI_CODE_SMASK;
4239 /* set status bit */
4240 dd->err_info_fmconfig |= OPA_EI_STATUS_SMASK;
4241 }
4242 switch (info) {
4243 case 0:
4244 case 1:
4245 case 2:
4246 case 3:
4247 case 4:
4248 case 5:
4249 case 6:
4250 extra = fm_config_txt[info];
4251 break;
4252 case 8:
4253 extra = fm_config_txt[info];
4254 if (ppd->port_error_action &
4255 OPA_PI_MASK_FM_CFG_UNSUPPORTED_VL_MARKER) {
4256 do_bounce = 1;
4257 /*
4258 * lcl_reason cannot be derived from info
4259 * for this error
4260 */
4261 lcl_reason =
4262 OPA_LINKDOWN_REASON_UNSUPPORTED_VL_MARKER;
4263 }
4264 break;
4265 default:
4266 reason_valid = 0;
4267 snprintf(buf, sizeof(buf), "reserved%lld", info);
4268 extra = buf;
4269 break;
4270 }
4271
4272 if (reason_valid && !do_bounce) {
4273 do_bounce = ppd->port_error_action &
4274 (1 << (OPA_LDR_FMCONFIG_OFFSET + info));
4275 lcl_reason = info + OPA_LINKDOWN_REASON_BAD_HEAD_DIST;
4276 }
4277
4278 /* just report this */
4279 dd_dev_info(dd, "DCC Error: fmconfig error: %s\n", extra);
4280 reg &= ~DCC_ERR_FLG_FMCONFIG_ERR_SMASK;
4281 }
4282
4283 if (reg & DCC_ERR_FLG_RCVPORT_ERR_SMASK) {
4284 u8 reason_valid = 1;
4285
4286 info = read_csr(dd, DCC_ERR_INFO_PORTRCV);
4287 hdr0 = read_csr(dd, DCC_ERR_INFO_PORTRCV_HDR0);
4288 hdr1 = read_csr(dd, DCC_ERR_INFO_PORTRCV_HDR1);
4289 if (!(dd->err_info_rcvport.status_and_code &
4290 OPA_EI_STATUS_SMASK)) {
4291 dd->err_info_rcvport.status_and_code =
4292 info & OPA_EI_CODE_SMASK;
4293 /* set status bit */
4294 dd->err_info_rcvport.status_and_code |=
4295 OPA_EI_STATUS_SMASK;
4296 /* save first 2 flits in the packet that caused
4297 * the error */
4298 dd->err_info_rcvport.packet_flit1 = hdr0;
4299 dd->err_info_rcvport.packet_flit2 = hdr1;
4300 }
4301 switch (info) {
4302 case 1:
4303 case 2:
4304 case 3:
4305 case 4:
4306 case 5:
4307 case 6:
4308 case 7:
4309 case 9:
4310 case 11:
4311 case 12:
4312 extra = port_rcv_txt[info];
4313 break;
4314 default:
4315 reason_valid = 0;
4316 snprintf(buf, sizeof(buf), "reserved%lld", info);
4317 extra = buf;
4318 break;
4319 }
4320
4321 if (reason_valid && !do_bounce) {
4322 do_bounce = ppd->port_error_action &
4323 (1 << (OPA_LDR_PORTRCV_OFFSET + info));
4324 lcl_reason = info + OPA_LINKDOWN_REASON_RCV_ERROR_0;
4325 }
4326
4327 /* just report this */
4328 dd_dev_info(dd, "DCC Error: PortRcv error: %s\n", extra);
4329 dd_dev_info(dd, " hdr0 0x%llx, hdr1 0x%llx\n",
4330 hdr0, hdr1);
4331
4332 reg &= ~DCC_ERR_FLG_RCVPORT_ERR_SMASK;
4333 }
4334
4335 if (reg & DCC_ERR_FLG_EN_CSR_ACCESS_BLOCKED_UC_SMASK) {
4336 /* informative only */
4337 dd_dev_info(dd, "8051 access to LCB blocked\n");
4338 reg &= ~DCC_ERR_FLG_EN_CSR_ACCESS_BLOCKED_UC_SMASK;
4339 }
4340 if (reg & DCC_ERR_FLG_EN_CSR_ACCESS_BLOCKED_HOST_SMASK) {
4341 /* informative only */
4342 dd_dev_info(dd, "host access to LCB blocked\n");
4343 reg &= ~DCC_ERR_FLG_EN_CSR_ACCESS_BLOCKED_HOST_SMASK;
4344 }
4345
4346 /* report any remaining errors */
4347 if (reg)
4348 dd_dev_info(dd, "DCC Error: %s\n",
4349 dcc_err_string(buf, sizeof(buf), reg));
4350
4351 if (lcl_reason == 0)
4352 lcl_reason = OPA_LINKDOWN_REASON_UNKNOWN;
4353
4354 if (do_bounce) {
4355 dd_dev_info(dd, "%s: PortErrorAction bounce\n", __func__);
4356 set_link_down_reason(ppd, lcl_reason, 0, lcl_reason);
4357 queue_work(ppd->hfi1_wq, &ppd->link_bounce_work);
4358 }
4359}
4360
4361static void handle_lcb_err(struct hfi1_devdata *dd, u32 unused, u64 reg)
4362{
4363 char buf[96];
4364
4365 dd_dev_info(dd, "LCB Error: %s\n",
4366 lcb_err_string(buf, sizeof(buf), reg));
4367}
4368
4369/*
4370 * CCE block DC interrupt. Source is < 8.
4371 */
4372static void is_dc_int(struct hfi1_devdata *dd, unsigned int source)
4373{
4374 const struct err_reg_info *eri = &dc_errs[source];
4375
4376 if (eri->handler) {
4377 interrupt_clear_down(dd, 0, eri);
4378 } else if (source == 3 /* dc_lbm_int */) {
4379 /*
4380 * This indicates that a parity error has occurred on the
4381 * address/control lines presented to the LBM. The error
4382 * is a single pulse, there is no associated error flag,
4383 * and it is non-maskable. This is because if a parity
4384 * error occurs on the request the request is dropped.
4385 * This should never occur, but it is nice to know if it
4386 * ever does.
4387 */
4388 dd_dev_err(dd, "Parity error in DC LBM block\n");
4389 } else {
4390 dd_dev_err(dd, "Invalid DC interrupt %u\n", source);
4391 }
4392}
4393
4394/*
4395 * TX block send credit interrupt. Source is < 160.
4396 */
4397static void is_send_credit_int(struct hfi1_devdata *dd, unsigned int source)
4398{
4399 sc_group_release_update(dd, source);
4400}
4401
4402/*
4403 * TX block SDMA interrupt. Source is < 48.
4404 *
4405 * SDMA interrupts are grouped by type:
4406 *
4407 * 0 - N-1 = SDma
4408 * N - 2N-1 = SDmaProgress
4409 * 2N - 3N-1 = SDmaIdle
4410 */
4411static void is_sdma_eng_int(struct hfi1_devdata *dd, unsigned int source)
4412{
4413 /* what interrupt */
4414 unsigned int what = source / TXE_NUM_SDMA_ENGINES;
4415 /* which engine */
4416 unsigned int which = source % TXE_NUM_SDMA_ENGINES;
4417
4418#ifdef CONFIG_SDMA_VERBOSITY
4419 dd_dev_err(dd, "CONFIG SDMA(%u) %s:%d %s()\n", which,
4420 slashstrip(__FILE__), __LINE__, __func__);
4421 sdma_dumpstate(&dd->per_sdma[which]);
4422#endif
4423
4424 if (likely(what < 3 && which < dd->num_sdma)) {
4425 sdma_engine_interrupt(&dd->per_sdma[which], 1ull << source);
4426 } else {
4427 /* should not happen */
4428 dd_dev_err(dd, "Invalid SDMA interrupt 0x%x\n", source);
4429 }
4430}
4431
4432/*
4433 * RX block receive available interrupt. Source is < 160.
4434 */
4435static void is_rcv_avail_int(struct hfi1_devdata *dd, unsigned int source)
4436{
4437 struct hfi1_ctxtdata *rcd;
4438 char *err_detail;
4439
4440 if (likely(source < dd->num_rcv_contexts)) {
4441 rcd = dd->rcd[source];
4442 if (rcd) {
4443 if (source < dd->first_user_ctxt)
4444 rcd->do_interrupt(rcd, 0);
4445 else
4446 handle_user_interrupt(rcd);
4447 return; /* OK */
4448 }
4449 /* received an interrupt, but no rcd */
4450 err_detail = "dataless";
4451 } else {
4452 /* received an interrupt, but are not using that context */
4453 err_detail = "out of range";
4454 }
4455 dd_dev_err(dd, "unexpected %s receive available context interrupt %u\n",
4456 err_detail, source);
4457}
4458
4459/*
4460 * RX block receive urgent interrupt. Source is < 160.
4461 */
4462static void is_rcv_urgent_int(struct hfi1_devdata *dd, unsigned int source)
4463{
4464 struct hfi1_ctxtdata *rcd;
4465 char *err_detail;
4466
4467 if (likely(source < dd->num_rcv_contexts)) {
4468 rcd = dd->rcd[source];
4469 if (rcd) {
4470 /* only pay attention to user urgent interrupts */
4471 if (source >= dd->first_user_ctxt)
4472 handle_user_interrupt(rcd);
4473 return; /* OK */
4474 }
4475 /* received an interrupt, but no rcd */
4476 err_detail = "dataless";
4477 } else {
4478 /* received an interrupt, but are not using that context */
4479 err_detail = "out of range";
4480 }
4481 dd_dev_err(dd, "unexpected %s receive urgent context interrupt %u\n",
4482 err_detail, source);
4483}
4484
4485/*
4486 * Reserved range interrupt. Should not be called in normal operation.
4487 */
4488static void is_reserved_int(struct hfi1_devdata *dd, unsigned int source)
4489{
4490 char name[64];
4491
4492 dd_dev_err(dd, "unexpected %s interrupt\n",
4493 is_reserved_name(name, sizeof(name), source));
4494}
4495
4496static const struct is_table is_table[] = {
4497/* start end
4498 name func interrupt func */
4499{ IS_GENERAL_ERR_START, IS_GENERAL_ERR_END,
4500 is_misc_err_name, is_misc_err_int },
4501{ IS_SDMAENG_ERR_START, IS_SDMAENG_ERR_END,
4502 is_sdma_eng_err_name, is_sdma_eng_err_int },
4503{ IS_SENDCTXT_ERR_START, IS_SENDCTXT_ERR_END,
4504 is_sendctxt_err_name, is_sendctxt_err_int },
4505{ IS_SDMA_START, IS_SDMA_END,
4506 is_sdma_eng_name, is_sdma_eng_int },
4507{ IS_VARIOUS_START, IS_VARIOUS_END,
4508 is_various_name, is_various_int },
4509{ IS_DC_START, IS_DC_END,
4510 is_dc_name, is_dc_int },
4511{ IS_RCVAVAIL_START, IS_RCVAVAIL_END,
4512 is_rcv_avail_name, is_rcv_avail_int },
4513{ IS_RCVURGENT_START, IS_RCVURGENT_END,
4514 is_rcv_urgent_name, is_rcv_urgent_int },
4515{ IS_SENDCREDIT_START, IS_SENDCREDIT_END,
4516 is_send_credit_name, is_send_credit_int},
4517{ IS_RESERVED_START, IS_RESERVED_END,
4518 is_reserved_name, is_reserved_int},
4519};
4520
4521/*
4522 * Interrupt source interrupt - called when the given source has an interrupt.
4523 * Source is a bit index into an array of 64-bit integers.
4524 */
4525static void is_interrupt(struct hfi1_devdata *dd, unsigned int source)
4526{
4527 const struct is_table *entry;
4528
4529 /* avoids a double compare by walking the table in-order */
4530 for (entry = &is_table[0]; entry->is_name; entry++) {
4531 if (source < entry->end) {
4532 trace_hfi1_interrupt(dd, entry, source);
4533 entry->is_int(dd, source - entry->start);
4534 return;
4535 }
4536 }
4537 /* fell off the end */
4538 dd_dev_err(dd, "invalid interrupt source %u\n", source);
4539}
4540
4541/*
4542 * General interrupt handler. This is able to correctly handle
4543 * all interrupts in case INTx is used.
4544 */
4545static irqreturn_t general_interrupt(int irq, void *data)
4546{
4547 struct hfi1_devdata *dd = data;
4548 u64 regs[CCE_NUM_INT_CSRS];
4549 u32 bit;
4550 int i;
4551
4552 this_cpu_inc(*dd->int_counter);
4553
4554 /* phase 1: scan and clear all handled interrupts */
4555 for (i = 0; i < CCE_NUM_INT_CSRS; i++) {
4556 if (dd->gi_mask[i] == 0) {
4557 regs[i] = 0; /* used later */
4558 continue;
4559 }
4560 regs[i] = read_csr(dd, CCE_INT_STATUS + (8 * i)) &
4561 dd->gi_mask[i];
4562 /* only clear if anything is set */
4563 if (regs[i])
4564 write_csr(dd, CCE_INT_CLEAR + (8 * i), regs[i]);
4565 }
4566
4567 /* phase 2: call the appropriate handler */
4568 for_each_set_bit(bit, (unsigned long *)&regs[0],
4569 CCE_NUM_INT_CSRS*64) {
4570 is_interrupt(dd, bit);
4571 }
4572
4573 return IRQ_HANDLED;
4574}
4575
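/*
 * Per-engine SDMA interrupt handler. Read and clear this engine's
 * pending status bits, then hand them to the engine for processing.
 */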
4576static irqreturn_t sdma_interrupt(int irq, void *data)
4577{
4578 struct sdma_engine *sde = data;
4579 struct hfi1_devdata *dd = sde->dd;
4580 u64 status;
4581
4582#ifdef CONFIG_SDMA_VERBOSITY
4583 dd_dev_err(dd, "CONFIG SDMA(%u) %s:%d %s()\n", sde->this_idx,
4584 slashstrip(__FILE__), __LINE__, __func__);
4585 sdma_dumpstate(sde);
4586#endif
4587
4588 this_cpu_inc(*dd->int_counter);
4589
4590 /* This read_csr is really bad in the hot path */
4591 status = read_csr(dd,
4592 CCE_INT_STATUS + (8*(IS_SDMA_START/64)))
4593 & sde->imask;
4594 if (likely(status)) {
4595 /* clear the interrupt(s) */
4596 write_csr(dd,
4597 CCE_INT_CLEAR + (8*(IS_SDMA_START/64)),
4598 status);
4599
4600 /* handle the interrupt(s) */
4601 sdma_engine_interrupt(sde, status);
4602 } else
4603 dd_dev_err(dd, "SDMA engine %u interrupt, but no status bits set\n",
4604 sde->this_idx);
4605
4606 return IRQ_HANDLED;
4607}
4608
4609/*
4610 * Clear the receive interrupt, forcing the write and making sure
4611 * we have data from the chip, pushing everything in front of it
4612 * back to the host.
4613 */
4614static inline void clear_recv_intr(struct hfi1_ctxtdata *rcd)
4615{
4616 struct hfi1_devdata *dd = rcd->dd;
4617 u32 addr = CCE_INT_CLEAR + (8 * rcd->ireg);
4618
4619 mmiowb(); /* make sure everything before is written */
4620 write_csr(dd, addr, rcd->imask);
4621 /* force the above write on the chip and get a value back */
4622 (void)read_csr(dd, addr);
4623}
4624
4625/* force the receive interrupt */
4626static inline void force_recv_intr(struct hfi1_ctxtdata *rcd)
4627{
4628 write_csr(rcd->dd, CCE_INT_FORCE + (8 * rcd->ireg), rcd->imask);
4629}
4630
4631/* return non-zero if a packet is present */
4632static inline int check_packet_present(struct hfi1_ctxtdata *rcd)
4633{
4634 if (!HFI1_CAP_IS_KSET(DMA_RTAIL))
4635 return (rcd->seq_cnt ==
4636 rhf_rcv_seq(rhf_to_cpu(get_rhf_addr(rcd))));
4637
4638 /* else is RDMA rtail */
4639 return (rcd->head != get_rcvhdrtail(rcd));
4640}
4641
4642/*
4643 * Receive packet IRQ handler. This routine expects to be on its own IRQ.
4644 * This routine will try to handle packets immediately (latency), but if
4645 * it finds too many, it will invoke the thread handler (bandwidth). The
4646 * chip receive interrupt is *not* cleared down until this or the thread (if
4647 * invoked) is finished. The intent is to avoid extra interrupts while we
4648 * are processing packets anyway.
4649 */
4650static irqreturn_t receive_context_interrupt(int irq, void *data)
4651{
4652 struct hfi1_ctxtdata *rcd = data;
4653 struct hfi1_devdata *dd = rcd->dd;
4654 int disposition;
4655 int present;
4656
4657 trace_hfi1_receive_interrupt(dd, rcd->ctxt);
4658 this_cpu_inc(*dd->int_counter);
4659
4660 /* receive interrupt remains blocked while processing packets */
4661 disposition = rcd->do_interrupt(rcd, 0);
4662
4663 /*
4664 * Too many packets were seen while processing packets in this
4665 * IRQ handler. Invoke the handler thread. The receive interrupt
4666 * remains blocked.
4667 */
4668 if (disposition == RCV_PKT_LIMIT)
4669 return IRQ_WAKE_THREAD;
4670
4671 /*
4672 * The packet processor detected no more packets. Clear the receive
4673 * interrupt and recheck for a packet that may have arrived
4674 * after the previous check and interrupt clear. If a packet arrived,
4675 * force another interrupt.
4676 */
4677 clear_recv_intr(rcd);
4678 present = check_packet_present(rcd);
4679 if (present)
4680 force_recv_intr(rcd);
4681
4682 return IRQ_HANDLED;
4683}
4684
4685/*
4686 * Receive packet thread handler. This expects to be invoked with the
4687 * receive interrupt still blocked.
4688 */
4689static irqreturn_t receive_context_thread(int irq, void *data)
4690{
4691 struct hfi1_ctxtdata *rcd = data;
4692 int present;
4693
4694 /* receive interrupt is still blocked from the IRQ handler */
4695 (void)rcd->do_interrupt(rcd, 1);
4696
4697 /*
4698 * The packet processor will only return if it detected no more
4699 * packets. Hold IRQs here so we can safely clear the interrupt and
4700 * recheck for a packet that may have arrived after the previous
4701 * check and the interrupt clear. If a packet arrived, force another
4702 * interrupt.
4703 */
4704 local_irq_disable();
4705 clear_recv_intr(rcd);
4706 present = check_packet_present(rcd);
4707 if (present)
4708 force_recv_intr(rcd);
4709 local_irq_enable();
4710
4711 return IRQ_HANDLED;
4712}
4713
4714/* ========================================================================= */
4715
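/* Read the 8051's current physical link state. */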
4716u32 read_physical_state(struct hfi1_devdata *dd)
4717{
4718 u64 reg;
4719
4720 reg = read_csr(dd, DC_DC8051_STS_CUR_STATE);
4721 return (reg >> DC_DC8051_STS_CUR_STATE_PORT_SHIFT)
4722 & DC_DC8051_STS_CUR_STATE_PORT_MASK;
4723}
4724
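/* Read the current logical link state from DCC_CFG_PORT_CONFIG. */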
4725static u32 read_logical_state(struct hfi1_devdata *dd)
4726{
4727 u64 reg;
4728
4729 reg = read_csr(dd, DCC_CFG_PORT_CONFIG);
4730 return (reg >> DCC_CFG_PORT_CONFIG_LINK_STATE_SHIFT)
4731 & DCC_CFG_PORT_CONFIG_LINK_STATE_MASK;
4732}
4733
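/* Set the logical link state field in DCC_CFG_PORT_CONFIG. */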
4734static void set_logical_state(struct hfi1_devdata *dd, u32 chip_lstate)
4735{
4736 u64 reg;
4737
4738 reg = read_csr(dd, DCC_CFG_PORT_CONFIG);
4739 /* clear current state, set new state */
4740 reg &= ~DCC_CFG_PORT_CONFIG_LINK_STATE_SMASK;
4741 reg |= (u64)chip_lstate << DCC_CFG_PORT_CONFIG_LINK_STATE_SHIFT;
4742 write_csr(dd, DCC_CFG_PORT_CONFIG, reg);
4743}
4744
4745/*
4746 * Use the 8051 to read a LCB CSR.
4747 */
4748static int read_lcb_via_8051(struct hfi1_devdata *dd, u32 addr, u64 *data)
4749{
4750 u32 regno;
4751 int ret;
4752
4753 if (dd->icode == ICODE_FUNCTIONAL_SIMULATOR) {
4754 if (acquire_lcb_access(dd, 0) == 0) {
4755 *data = read_csr(dd, addr);
4756 release_lcb_access(dd, 0);
4757 return 0;
4758 }
4759 return -EBUSY;
4760 }
4761
4762 /* register is an index of LCB registers: (offset - base) / 8 */
4763 regno = (addr - DC_LCB_CFG_RUN) >> 3;
4764 ret = do_8051_command(dd, HCMD_READ_LCB_CSR, regno, data);
4765 if (ret != HCMD_SUCCESS)
4766 return -EBUSY;
4767 return 0;
4768}
4769
4770/*
4771 * Read an LCB CSR. Access may not be in host control, so check.
4772 * Return 0 on success, -EBUSY on failure.
4773 */
4774int read_lcb_csr(struct hfi1_devdata *dd, u32 addr, u64 *data)
4775{
4776 struct hfi1_pportdata *ppd = dd->pport;
4777
4778 /* if up, go through the 8051 for the value */
4779 if (ppd->host_link_state & HLS_UP)
4780 return read_lcb_via_8051(dd, addr, data);
4781 /* if going up or down, no access */
4782 if (ppd->host_link_state & (HLS_GOING_UP | HLS_GOING_OFFLINE))
4783 return -EBUSY;
4784 /* otherwise, host has access */
4785 *data = read_csr(dd, addr);
4786 return 0;
4787}
4788
4789/*
4790 * Use the 8051 to write a LCB CSR.
4791 * Use the 8051 to write an LCB CSR.
4792static int write_lcb_via_8051(struct hfi1_devdata *dd, u32 addr, u64 data)
4793{
4794	u32 regno;
4795	int ret;
4796
4797	if (dd->icode == ICODE_FUNCTIONAL_SIMULATOR ||
4798 (dd->dc8051_ver < dc8051_ver(0, 20))) {
4799 if (acquire_lcb_access(dd, 0) == 0) {
4800 write_csr(dd, addr, data);
4801 release_lcb_access(dd, 0);
4802 return 0;
4803 }
4804 return -EBUSY;
4805	}
4806
4807 /* register is an index of LCB registers: (offset - base) / 8 */
4808 regno = (addr - DC_LCB_CFG_RUN) >> 3;
4809 ret = do_8051_command(dd, HCMD_WRITE_LCB_CSR, regno, &data);
4810 if (ret != HCMD_SUCCESS)
4811 return -EBUSY;
4812 return 0;
4813}
4814
4815/*
4816 * Write an LCB CSR. Access may not be in host control, so check.
4817 * Return 0 on success, -EBUSY on failure.
4818 */
4819int write_lcb_csr(struct hfi1_devdata *dd, u32 addr, u64 data)
4820{
4821 struct hfi1_pportdata *ppd = dd->pport;
4822
4823 /* if up, go through the 8051 for the value */
4824 if (ppd->host_link_state & HLS_UP)
4825 return write_lcb_via_8051(dd, addr, data);
4826 /* if going up or down, no access */
4827 if (ppd->host_link_state & (HLS_GOING_UP | HLS_GOING_OFFLINE))
4828 return -EBUSY;
4829 /* otherwise, host has access */
4830 write_csr(dd, addr, data);
4831 return 0;
4832}
4833
4834/*
4835 * Returns:
4836 * < 0 = Linux error, not able to get access
4837 * > 0 = 8051 command RETURN_CODE
4838 */
4839static int do_8051_command(
4840 struct hfi1_devdata *dd,
4841 u32 type,
4842 u64 in_data,
4843 u64 *out_data)
4844{
4845 u64 reg, completed;
4846 int return_code;
4847 unsigned long flags;
4848 unsigned long timeout;
4849
4850 hfi1_cdbg(DC8051, "type %d, data 0x%012llx", type, in_data);
4851
4852 /*
4853 * Alternative to holding the lock for a long time:
4854 * - keep busy wait - have other users bounce off
4855 */
4856 spin_lock_irqsave(&dd->dc8051_lock, flags);
4857
4858 /* We can't send any commands to the 8051 if it's in reset */
4859 if (dd->dc_shutdown) {
4860 return_code = -ENODEV;
4861 goto fail;
4862 }
4863
4864 /*
4865 * If an 8051 host command timed out previously, then the 8051 is
4866 * stuck.
4867 *
4868 * On first timeout, attempt to reset and restart the entire DC
4869 * block (including 8051). (Is this too big of a hammer?)
4870 *
4871 * If the 8051 times out a second time, the reset did not bring it
4872 * back to healthy life. In that case, fail any subsequent commands.
4873 */
4874 if (dd->dc8051_timed_out) {
4875 if (dd->dc8051_timed_out > 1) {
4876 dd_dev_err(dd,
4877 "Previous 8051 host command timed out, skipping command %u\n",
4878 type);
4879 return_code = -ENXIO;
4880 goto fail;
4881 }
4882 spin_unlock_irqrestore(&dd->dc8051_lock, flags);
4883 dc_shutdown(dd);
4884 dc_start(dd);
4885 spin_lock_irqsave(&dd->dc8051_lock, flags);
4886 }
4887
4888 /*
4889 * If there is no timeout, then the 8051 command interface is
4890 * waiting for a command.
4891 */
4892
4893 /*
4894	 * When writing an LCB CSR, out_data contains the full value to
4895	 * be written, while in_data contains the relative LCB
4896	 * address in 7:0. Do the work here, rather than in the caller,
4897	 * of distributing the write data to where it needs to go:
4898 *
4899 * Write data
4900 * 39:00 -> in_data[47:8]
4901 * 47:40 -> DC8051_CFG_EXT_DEV_0.RETURN_CODE
4902 * 63:48 -> DC8051_CFG_EXT_DEV_0.RSP_DATA
4903 */
4904 if (type == HCMD_WRITE_LCB_CSR) {
4905 in_data |= ((*out_data) & 0xffffffffffull) << 8;
4906 reg = ((((*out_data) >> 40) & 0xff) <<
4907 DC_DC8051_CFG_EXT_DEV_0_RETURN_CODE_SHIFT)
4908 | ((((*out_data) >> 48) & 0xffff) <<
4909 DC_DC8051_CFG_EXT_DEV_0_RSP_DATA_SHIFT);
4910 write_csr(dd, DC_DC8051_CFG_EXT_DEV_0, reg);
4911 }
4912
4913 /*
4914	 * Do two writes: the first to stabilize the type and req_data, the
4915 * second to activate.
4916 */
4917 reg = ((u64)type & DC_DC8051_CFG_HOST_CMD_0_REQ_TYPE_MASK)
4918 << DC_DC8051_CFG_HOST_CMD_0_REQ_TYPE_SHIFT
4919 | (in_data & DC_DC8051_CFG_HOST_CMD_0_REQ_DATA_MASK)
4920 << DC_DC8051_CFG_HOST_CMD_0_REQ_DATA_SHIFT;
4921 write_csr(dd, DC_DC8051_CFG_HOST_CMD_0, reg);
4922 reg |= DC_DC8051_CFG_HOST_CMD_0_REQ_NEW_SMASK;
4923 write_csr(dd, DC_DC8051_CFG_HOST_CMD_0, reg);
4924
4925 /* wait for completion, alternate: interrupt */
4926 timeout = jiffies + msecs_to_jiffies(DC8051_COMMAND_TIMEOUT);
4927 while (1) {
4928 reg = read_csr(dd, DC_DC8051_CFG_HOST_CMD_1);
4929 completed = reg & DC_DC8051_CFG_HOST_CMD_1_COMPLETED_SMASK;
4930 if (completed)
4931 break;
4932 if (time_after(jiffies, timeout)) {
4933 dd->dc8051_timed_out++;
4934 dd_dev_err(dd, "8051 host command %u timeout\n", type);
4935 if (out_data)
4936 *out_data = 0;
4937 return_code = -ETIMEDOUT;
4938 goto fail;
4939 }
4940 udelay(2);
4941 }
4942
4943 if (out_data) {
4944 *out_data = (reg >> DC_DC8051_CFG_HOST_CMD_1_RSP_DATA_SHIFT)
4945 & DC_DC8051_CFG_HOST_CMD_1_RSP_DATA_MASK;
4946 if (type == HCMD_READ_LCB_CSR) {
4947 /* top 16 bits are in a different register */
4948 *out_data |= (read_csr(dd, DC_DC8051_CFG_EXT_DEV_1)
4949 & DC_DC8051_CFG_EXT_DEV_1_REQ_DATA_SMASK)
4950 << (48
4951 - DC_DC8051_CFG_EXT_DEV_1_REQ_DATA_SHIFT);
4952 }
4953 }
4954 return_code = (reg >> DC_DC8051_CFG_HOST_CMD_1_RETURN_CODE_SHIFT)
4955 & DC_DC8051_CFG_HOST_CMD_1_RETURN_CODE_MASK;
4956 dd->dc8051_timed_out = 0;
4957 /*
4958 * Clear command for next user.
4959 */
4960 write_csr(dd, DC_DC8051_CFG_HOST_CMD_0, 0);
4961
4962fail:
4963 spin_unlock_irqrestore(&dd->dc8051_lock, flags);
4964
4965 return return_code;
4966}
4967
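/*
 * Illustrative sketch (not driver code) of the HCMD_WRITE_LCB_CSR data
 * distribution performed in do_8051_command(): value bits 39:0 ride in
 * req_data bits 47:8 (above the 8-bit LCB index), while bits 47:40 and
 * 63:48 are parked in the two DC8051_CFG_EXT_DEV_0 fields. The EXT_DEV_0
 * shift values below are hypothetical placeholders.
 */
#define EXAMPLE_EXT_DEV_0_RETURN_CODE_SHIFT 8
#define EXAMPLE_EXT_DEV_0_RSP_DATA_SHIFT 16

static void example_split_lcb_write(u64 value, u32 regno,
				    u64 *req_data, u64 *ext_dev_0)
{
	*req_data = regno;				/* LCB index in 7:0 */
	*req_data |= (value & 0xffffffffffull) << 8;	/* value[39:0] -> 47:8 */
	*ext_dev_0 = (((value >> 40) & 0xff)
			<< EXAMPLE_EXT_DEV_0_RETURN_CODE_SHIFT)
		   | (((value >> 48) & 0xffff)
			<< EXAMPLE_EXT_DEV_0_RSP_DATA_SHIFT);
}
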
4968static int set_physical_link_state(struct hfi1_devdata *dd, u64 state)
4969{
4970 return do_8051_command(dd, HCMD_CHANGE_PHY_STATE, state, NULL);
4971}
4972
4973static int load_8051_config(struct hfi1_devdata *dd, u8 field_id,
4974 u8 lane_id, u32 config_data)
4975{
4976 u64 data;
4977 int ret;
4978
4979 data = (u64)field_id << LOAD_DATA_FIELD_ID_SHIFT
4980 | (u64)lane_id << LOAD_DATA_LANE_ID_SHIFT
4981 | (u64)config_data << LOAD_DATA_DATA_SHIFT;
4982 ret = do_8051_command(dd, HCMD_LOAD_CONFIG_DATA, data, NULL);
4983 if (ret != HCMD_SUCCESS) {
4984 dd_dev_err(dd,
4985 "load 8051 config: field id %d, lane %d, err %d\n",
4986 (int)field_id, (int)lane_id, ret);
4987 }
4988 return ret;
4989}
4990
4991/*
4992 * Read the 8051 firmware "registers". Use the RAM directly. Always
4993 * set the result, even on error.
4994 * Return 0 on success, -errno on failure
4995 */
4996static int read_8051_config(struct hfi1_devdata *dd, u8 field_id, u8 lane_id,
4997 u32 *result)
4998{
4999 u64 big_data;
5000 u32 addr;
5001 int ret;
5002
5003 /* address start depends on the lane_id */
5004 if (lane_id < 4)
5005 addr = (4 * NUM_GENERAL_FIELDS)
5006 + (lane_id * 4 * NUM_LANE_FIELDS);
5007 else
5008 addr = 0;
5009 addr += field_id * 4;
5010
5011 /* read is in 8-byte chunks, hardware will truncate the address down */
5012 ret = read_8051_data(dd, addr, 8, &big_data);
5013
5014 if (ret == 0) {
5015 /* extract the 4 bytes we want */
5016 if (addr & 0x4)
5017 *result = (u32)(big_data >> 32);
5018 else
5019 *result = (u32)big_data;
5020 } else {
5021 *result = 0;
5022 dd_dev_err(dd, "%s: direct read failed, lane %d, field %d!\n",
5023 __func__, lane_id, field_id);
5024 }
5025
5026 return ret;
5027}
5028
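/*
 * Illustrative sketch (not driver code) of the 8051 "register" layout
 * used by read_8051_config(): each field is a 4-byte slot, the general
 * fields come first, then NUM_LANE_FIELDS slots per lane, and an 8-byte
 * read returns two adjacent fields with bit 2 of the address selecting
 * the upper or lower half. The field counts below are hypothetical.
 */
enum {
	EXAMPLE_NUM_GENERAL_FIELDS = 16,
	EXAMPLE_NUM_LANE_FIELDS = 8,
};

static u32 example_extract_field(u64 big_data, u8 field_id, u8 lane_id)
{
	/* assumes lane_id < 4; the real code uses addr 0 otherwise */
	u32 addr = 4 * EXAMPLE_NUM_GENERAL_FIELDS
		+ lane_id * 4 * EXAMPLE_NUM_LANE_FIELDS
		+ field_id * 4;

	/* hardware truncates the read address to an 8-byte boundary */
	return (addr & 0x4) ? (u32)(big_data >> 32) : (u32)big_data;
}
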
5029static int write_vc_local_phy(struct hfi1_devdata *dd, u8 power_management,
5030 u8 continuous)
5031{
5032 u32 frame;
5033
5034 frame = continuous << CONTINIOUS_REMOTE_UPDATE_SUPPORT_SHIFT
5035 | power_management << POWER_MANAGEMENT_SHIFT;
5036 return load_8051_config(dd, VERIFY_CAP_LOCAL_PHY,
5037 GENERAL_CONFIG, frame);
5038}
5039
5040static int write_vc_local_fabric(struct hfi1_devdata *dd, u8 vau, u8 z, u8 vcu,
5041 u16 vl15buf, u8 crc_sizes)
5042{
5043 u32 frame;
5044
5045 frame = (u32)vau << VAU_SHIFT
5046 | (u32)z << Z_SHIFT
5047 | (u32)vcu << VCU_SHIFT
5048 | (u32)vl15buf << VL15BUF_SHIFT
5049 | (u32)crc_sizes << CRC_SIZES_SHIFT;
5050 return load_8051_config(dd, VERIFY_CAP_LOCAL_FABRIC,
5051 GENERAL_CONFIG, frame);
5052}
5053
5054static void read_vc_local_link_width(struct hfi1_devdata *dd, u8 *misc_bits,
5055 u8 *flag_bits, u16 *link_widths)
5056{
5057 u32 frame;
5058
5059 read_8051_config(dd, VERIFY_CAP_LOCAL_LINK_WIDTH, GENERAL_CONFIG,
5060 &frame);
5061 *misc_bits = (frame >> MISC_CONFIG_BITS_SHIFT) & MISC_CONFIG_BITS_MASK;
5062 *flag_bits = (frame >> LOCAL_FLAG_BITS_SHIFT) & LOCAL_FLAG_BITS_MASK;
5063 *link_widths = (frame >> LINK_WIDTH_SHIFT) & LINK_WIDTH_MASK;
5064}
5065
5066static int write_vc_local_link_width(struct hfi1_devdata *dd,
5067 u8 misc_bits,
5068 u8 flag_bits,
5069 u16 link_widths)
5070{
5071 u32 frame;
5072
5073 frame = (u32)misc_bits << MISC_CONFIG_BITS_SHIFT
5074 | (u32)flag_bits << LOCAL_FLAG_BITS_SHIFT
5075 | (u32)link_widths << LINK_WIDTH_SHIFT;
5076 return load_8051_config(dd, VERIFY_CAP_LOCAL_LINK_WIDTH, GENERAL_CONFIG,
5077 frame);
5078}
5079
5080static int write_local_device_id(struct hfi1_devdata *dd, u16 device_id,
5081 u8 device_rev)
5082{
5083 u32 frame;
5084
5085 frame = ((u32)device_id << LOCAL_DEVICE_ID_SHIFT)
5086 | ((u32)device_rev << LOCAL_DEVICE_REV_SHIFT);
5087 return load_8051_config(dd, LOCAL_DEVICE_ID, GENERAL_CONFIG, frame);
5088}
5089
5090static void read_remote_device_id(struct hfi1_devdata *dd, u16 *device_id,
5091 u8 *device_rev)
5092{
5093 u32 frame;
5094
5095 read_8051_config(dd, REMOTE_DEVICE_ID, GENERAL_CONFIG, &frame);
5096 *device_id = (frame >> REMOTE_DEVICE_ID_SHIFT) & REMOTE_DEVICE_ID_MASK;
5097 *device_rev = (frame >> REMOTE_DEVICE_REV_SHIFT)
5098 & REMOTE_DEVICE_REV_MASK;
5099}
5100
5101void read_misc_status(struct hfi1_devdata *dd, u8 *ver_a, u8 *ver_b)
5102{
5103 u32 frame;
5104
5105 read_8051_config(dd, MISC_STATUS, GENERAL_CONFIG, &frame);
5106 *ver_a = (frame >> STS_FM_VERSION_A_SHIFT) & STS_FM_VERSION_A_MASK;
5107 *ver_b = (frame >> STS_FM_VERSION_B_SHIFT) & STS_FM_VERSION_B_MASK;
5108}
5109
5110static void read_vc_remote_phy(struct hfi1_devdata *dd, u8 *power_management,
5111 u8 *continuous)
5112{
5113 u32 frame;
5114
5115 read_8051_config(dd, VERIFY_CAP_REMOTE_PHY, GENERAL_CONFIG, &frame);
5116 *power_management = (frame >> POWER_MANAGEMENT_SHIFT)
5117 & POWER_MANAGEMENT_MASK;
5118 *continuous = (frame >> CONTINIOUS_REMOTE_UPDATE_SUPPORT_SHIFT)
5119 & CONTINIOUS_REMOTE_UPDATE_SUPPORT_MASK;
5120}
5121
5122static void read_vc_remote_fabric(struct hfi1_devdata *dd, u8 *vau, u8 *z,
5123 u8 *vcu, u16 *vl15buf, u8 *crc_sizes)
5124{
5125 u32 frame;
5126
5127 read_8051_config(dd, VERIFY_CAP_REMOTE_FABRIC, GENERAL_CONFIG, &frame);
5128 *vau = (frame >> VAU_SHIFT) & VAU_MASK;
5129 *z = (frame >> Z_SHIFT) & Z_MASK;
5130 *vcu = (frame >> VCU_SHIFT) & VCU_MASK;
5131 *vl15buf = (frame >> VL15BUF_SHIFT) & VL15BUF_MASK;
5132 *crc_sizes = (frame >> CRC_SIZES_SHIFT) & CRC_SIZES_MASK;
5133}
5134
5135static void read_vc_remote_link_width(struct hfi1_devdata *dd,
5136 u8 *remote_tx_rate,
5137 u16 *link_widths)
5138{
5139 u32 frame;
5140
5141 read_8051_config(dd, VERIFY_CAP_REMOTE_LINK_WIDTH, GENERAL_CONFIG,
5142 &frame);
5143 *remote_tx_rate = (frame >> REMOTE_TX_RATE_SHIFT)
5144 & REMOTE_TX_RATE_MASK;
5145 *link_widths = (frame >> LINK_WIDTH_SHIFT) & LINK_WIDTH_MASK;
5146}
5147
5148static void read_local_lni(struct hfi1_devdata *dd, u8 *enable_lane_rx)
5149{
5150 u32 frame;
5151
5152 read_8051_config(dd, LOCAL_LNI_INFO, GENERAL_CONFIG, &frame);
5153 *enable_lane_rx = (frame >> ENABLE_LANE_RX_SHIFT) & ENABLE_LANE_RX_MASK;
5154}
5155
5156static void read_mgmt_allowed(struct hfi1_devdata *dd, u8 *mgmt_allowed)
5157{
5158 u32 frame;
5159
5160 read_8051_config(dd, REMOTE_LNI_INFO, GENERAL_CONFIG, &frame);
5161 *mgmt_allowed = (frame >> MGMT_ALLOWED_SHIFT) & MGMT_ALLOWED_MASK;
5162}
5163
5164static void read_last_local_state(struct hfi1_devdata *dd, u32 *lls)
5165{
5166 read_8051_config(dd, LAST_LOCAL_STATE_COMPLETE, GENERAL_CONFIG, lls);
5167}
5168
5169static void read_last_remote_state(struct hfi1_devdata *dd, u32 *lrs)
5170{
5171 read_8051_config(dd, LAST_REMOTE_STATE_COMPLETE, GENERAL_CONFIG, lrs);
5172}
5173
5174void hfi1_read_link_quality(struct hfi1_devdata *dd, u8 *link_quality)
5175{
5176 u32 frame;
5177 int ret;
5178
5179 *link_quality = 0;
5180 if (dd->pport->host_link_state & HLS_UP) {
5181 ret = read_8051_config(dd, LINK_QUALITY_INFO, GENERAL_CONFIG,
5182 &frame);
5183 if (ret == 0)
5184 *link_quality = (frame >> LINK_QUALITY_SHIFT)
5185 & LINK_QUALITY_MASK;
5186 }
5187}
5188
5189static void read_planned_down_reason_code(struct hfi1_devdata *dd, u8 *pdrrc)
5190{
5191 u32 frame;
5192
5193 read_8051_config(dd, LINK_QUALITY_INFO, GENERAL_CONFIG, &frame);
5194 *pdrrc = (frame >> DOWN_REMOTE_REASON_SHIFT) & DOWN_REMOTE_REASON_MASK;
5195}
5196
5197static int read_tx_settings(struct hfi1_devdata *dd,
5198 u8 *enable_lane_tx,
5199 u8 *tx_polarity_inversion,
5200 u8 *rx_polarity_inversion,
5201 u8 *max_rate)
5202{
5203 u32 frame;
5204 int ret;
5205
5206 ret = read_8051_config(dd, TX_SETTINGS, GENERAL_CONFIG, &frame);
5207 *enable_lane_tx = (frame >> ENABLE_LANE_TX_SHIFT)
5208 & ENABLE_LANE_TX_MASK;
5209 *tx_polarity_inversion = (frame >> TX_POLARITY_INVERSION_SHIFT)
5210 & TX_POLARITY_INVERSION_MASK;
5211 *rx_polarity_inversion = (frame >> RX_POLARITY_INVERSION_SHIFT)
5212 & RX_POLARITY_INVERSION_MASK;
5213 *max_rate = (frame >> MAX_RATE_SHIFT) & MAX_RATE_MASK;
5214 return ret;
5215}
5216
5217static int write_tx_settings(struct hfi1_devdata *dd,
5218 u8 enable_lane_tx,
5219 u8 tx_polarity_inversion,
5220 u8 rx_polarity_inversion,
5221 u8 max_rate)
5222{
5223 u32 frame;
5224
5225 /* no need to mask, all variable sizes match field widths */
5226 frame = enable_lane_tx << ENABLE_LANE_TX_SHIFT
5227 | tx_polarity_inversion << TX_POLARITY_INVERSION_SHIFT
5228 | rx_polarity_inversion << RX_POLARITY_INVERSION_SHIFT
5229 | max_rate << MAX_RATE_SHIFT;
5230 return load_8051_config(dd, TX_SETTINGS, GENERAL_CONFIG, frame);
5231}
5232
5233static void check_fabric_firmware_versions(struct hfi1_devdata *dd)
5234{
5235 u32 frame, version, prod_id;
5236 int ret, lane;
5237
5238 /* 4 lanes */
5239 for (lane = 0; lane < 4; lane++) {
5240 ret = read_8051_config(dd, SPICO_FW_VERSION, lane, &frame);
5241 if (ret) {
5242 dd_dev_err(
5243 dd,
5244 "Unable to read lane %d firmware details\n",
5245 lane);
5246 continue;
5247 }
5248 version = (frame >> SPICO_ROM_VERSION_SHIFT)
5249 & SPICO_ROM_VERSION_MASK;
5250 prod_id = (frame >> SPICO_ROM_PROD_ID_SHIFT)
5251 & SPICO_ROM_PROD_ID_MASK;
5252 dd_dev_info(dd,
5253 "Lane %d firmware: version 0x%04x, prod_id 0x%04x\n",
5254 lane, version, prod_id);
5255 }
5256}
5257
5258/*
5259 * Read an idle LCB message.
5260 *
5261 * Returns 0 on success, -EINVAL on error
5262 */
5263static int read_idle_message(struct hfi1_devdata *dd, u64 type, u64 *data_out)
5264{
5265 int ret;
5266
5267 ret = do_8051_command(dd, HCMD_READ_LCB_IDLE_MSG,
5268 type, data_out);
5269 if (ret != HCMD_SUCCESS) {
5270 dd_dev_err(dd, "read idle message: type %d, err %d\n",
5271 (u32)type, ret);
5272 return -EINVAL;
5273 }
5274 dd_dev_info(dd, "%s: read idle message 0x%llx\n", __func__, *data_out);
5275 /* return only the payload as we already know the type */
5276 *data_out >>= IDLE_PAYLOAD_SHIFT;
5277 return 0;
5278}
5279
5280/*
5281 * Read an idle SMA message. To be done in response to a notification from
5282 * the 8051.
5283 *
5284 * Returns 0 on success, -EINVAL on error
5285 */
5286static int read_idle_sma(struct hfi1_devdata *dd, u64 *data)
5287{
5288 return read_idle_message(dd,
5289 (u64)IDLE_SMA << IDLE_MSG_TYPE_SHIFT, data);
5290}
5291
5292/*
5293 * Send an idle LCB message.
5294 *
5295 * Returns 0 on success, -EINVAL on error
5296 */
5297static int send_idle_message(struct hfi1_devdata *dd, u64 data)
5298{
5299 int ret;
5300
5301 dd_dev_info(dd, "%s: sending idle message 0x%llx\n", __func__, data);
5302 ret = do_8051_command(dd, HCMD_SEND_LCB_IDLE_MSG, data, NULL);
5303 if (ret != HCMD_SUCCESS) {
5304 dd_dev_err(dd, "send idle message: data 0x%llx, err %d\n",
5305 data, ret);
5306 return -EINVAL;
5307 }
5308 return 0;
5309}
5310
5311/*
5312 * Send an idle SMA message.
5313 *
5314 * Returns 0 on success, -EINVAL on error
5315 */
5316int send_idle_sma(struct hfi1_devdata *dd, u64 message)
5317{
5318 u64 data;
5319
5320 data = ((message & IDLE_PAYLOAD_MASK) << IDLE_PAYLOAD_SHIFT)
5321 | ((u64)IDLE_SMA << IDLE_MSG_TYPE_SHIFT);
5322 return send_idle_message(dd, data);
5323}
5324
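/*
 * Illustrative sketch (not driver code) of the idle message layout used
 * by send_idle_sma() and read_idle_sma(): the message type sits at
 * IDLE_MSG_TYPE_SHIFT, the payload at IDLE_PAYLOAD_SHIFT, and the reader
 * strips the type by shifting the payload back down. The shift and mask
 * values below are hypothetical placeholders.
 */
#define EXAMPLE_IDLE_MSG_TYPE_SHIFT 0
#define EXAMPLE_IDLE_PAYLOAD_SHIFT 8
#define EXAMPLE_IDLE_PAYLOAD_MASK 0xffffffffffffffull

static u64 example_build_idle_msg(u64 type, u64 payload)
{
	return ((payload & EXAMPLE_IDLE_PAYLOAD_MASK)
			<< EXAMPLE_IDLE_PAYLOAD_SHIFT)
		| (type << EXAMPLE_IDLE_MSG_TYPE_SHIFT);
}

static u64 example_idle_msg_payload(u64 msg)
{
	return msg >> EXAMPLE_IDLE_PAYLOAD_SHIFT;	/* drop the type bits */
}
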
5325/*
5326 * Initialize the LCB then do a quick link up. This may or may not be
5327 * in loopback.
5328 *
5329 * return 0 on success, -errno on error
5330 */
5331static int do_quick_linkup(struct hfi1_devdata *dd)
5332{
5333 u64 reg;
5334 unsigned long timeout;
5335 int ret;
5336
5337 lcb_shutdown(dd, 0);
5338
5339 if (loopback) {
5340 /* LCB_CFG_LOOPBACK.VAL = 2 */
5341 /* LCB_CFG_LANE_WIDTH.VAL = 0 */
5342 write_csr(dd, DC_LCB_CFG_LOOPBACK,
5343 IB_PACKET_TYPE << DC_LCB_CFG_LOOPBACK_VAL_SHIFT);
5344 write_csr(dd, DC_LCB_CFG_LANE_WIDTH, 0);
5345 }
5346
5347 /* start the LCBs */
5348 /* LCB_CFG_TX_FIFOS_RESET.VAL = 0 */
5349 write_csr(dd, DC_LCB_CFG_TX_FIFOS_RESET, 0);
5350
5351 /* simulator only loopback steps */
5352 if (loopback && dd->icode == ICODE_FUNCTIONAL_SIMULATOR) {
5353 /* LCB_CFG_RUN.EN = 1 */
5354 write_csr(dd, DC_LCB_CFG_RUN,
5355 1ull << DC_LCB_CFG_RUN_EN_SHIFT);
5356
5357 /* watch LCB_STS_LINK_TRANSFER_ACTIVE */
5358 timeout = jiffies + msecs_to_jiffies(10);
5359 while (1) {
5360 reg = read_csr(dd,
5361 DC_LCB_STS_LINK_TRANSFER_ACTIVE);
5362 if (reg)
5363 break;
5364 if (time_after(jiffies, timeout)) {
5365 dd_dev_err(dd,
5366 "timeout waiting for LINK_TRANSFER_ACTIVE\n");
5367 return -ETIMEDOUT;
5368 }
5369 udelay(2);
5370 }
5371
5372 write_csr(dd, DC_LCB_CFG_ALLOW_LINK_UP,
5373 1ull << DC_LCB_CFG_ALLOW_LINK_UP_VAL_SHIFT);
5374 }
5375
5376 if (!loopback) {
5377 /*
5378 * When doing quick linkup and not in loopback, both
5379 * sides must be done with LCB set-up before either
5380 * starts the quick linkup. Put a delay here so that
5381 * both sides can be started and have a chance to be
5382 * done with LCB set up before resuming.
5383 */
5384 dd_dev_err(dd,
5385 "Pausing for peer to be finished with LCB set up\n");
5386 msleep(5000);
5387 dd_dev_err(dd,
5388 "Continuing with quick linkup\n");
5389 }
5390
5391 write_csr(dd, DC_LCB_ERR_EN, 0); /* mask LCB errors */
5392 set_8051_lcb_access(dd);
5393
5394 /*
5395 * State "quick" LinkUp request sets the physical link state to
5396 * LinkUp without a verify capability sequence.
5397 * This state is in simulator v37 and later.
5398 */
5399 ret = set_physical_link_state(dd, PLS_QUICK_LINKUP);
5400 if (ret != HCMD_SUCCESS) {
5401 dd_dev_err(dd,
5402 "%s: set physical link state to quick LinkUp failed with return %d\n",
5403 __func__, ret);
5404
5405 set_host_lcb_access(dd);
5406 write_csr(dd, DC_LCB_ERR_EN, ~0ull); /* watch LCB errors */
5407
5408 if (ret >= 0)
5409 ret = -EINVAL;
5410 return ret;
5411 }
5412
5413 return 0; /* success */
5414}
5415
5416/*
5417 * Set the SerDes to internal loopback mode.
5418 * Returns 0 on success, -errno on error.
5419 */
5420static int set_serdes_loopback_mode(struct hfi1_devdata *dd)
5421{
5422 int ret;
5423
5424 ret = set_physical_link_state(dd, PLS_INTERNAL_SERDES_LOOPBACK);
5425 if (ret == HCMD_SUCCESS)
5426 return 0;
5427 dd_dev_err(dd,
5428 "Set physical link state to SerDes Loopback failed with return %d\n",
5429 ret);
5430 if (ret >= 0)
5431 ret = -EINVAL;
5432 return ret;
5433}
5434
5435/*
5436 * Do all special steps to set up loopback.
5437 */
5438static int init_loopback(struct hfi1_devdata *dd)
5439{
5440 dd_dev_info(dd, "Entering loopback mode\n");
5441
5442 /* all loopbacks should disable self GUID check */
5443 write_csr(dd, DC_DC8051_CFG_MODE,
5444 (read_csr(dd, DC_DC8051_CFG_MODE) | DISABLE_SELF_GUID_CHECK));
5445
5446 /*
5447 * The simulator has only one loopback option - LCB. Switch
5448 * to that option, which includes quick link up.
5449 *
5450 * Accept all valid loopback values.
5451 */
5452 if ((dd->icode == ICODE_FUNCTIONAL_SIMULATOR)
5453 && (loopback == LOOPBACK_SERDES
5454 || loopback == LOOPBACK_LCB
5455 || loopback == LOOPBACK_CABLE)) {
5456 loopback = LOOPBACK_LCB;
5457 quick_linkup = 1;
5458 return 0;
5459 }
5460
5461 /* handle serdes loopback */
5462 if (loopback == LOOPBACK_SERDES) {
5463		/* internal serdes loopback needs quick linkup on RTL */
5464 if (dd->icode == ICODE_RTL_SILICON)
5465 quick_linkup = 1;
5466 return set_serdes_loopback_mode(dd);
5467 }
5468
5469 /* LCB loopback - handled at poll time */
5470 if (loopback == LOOPBACK_LCB) {
5471 quick_linkup = 1; /* LCB is always quick linkup */
5472
5473 /* not supported in emulation due to emulation RTL changes */
5474 if (dd->icode == ICODE_FPGA_EMULATION) {
5475 dd_dev_err(dd,
5476 "LCB loopback not supported in emulation\n");
5477 return -EINVAL;
5478 }
5479 return 0;
5480 }
5481
5482 /* external cable loopback requires no extra steps */
5483 if (loopback == LOOPBACK_CABLE)
5484 return 0;
5485
5486 dd_dev_err(dd, "Invalid loopback mode %d\n", loopback);
5487 return -EINVAL;
5488}
5489
5490/*
5491 * Translate from the OPA_LINK_WIDTH handed to us by the FM to bits
5492 * used in the Verify Capability link width attribute.
5493 */
5494static u16 opa_to_vc_link_widths(u16 opa_widths)
5495{
5496 int i;
5497 u16 result = 0;
5498
5499 static const struct link_bits {
5500 u16 from;
5501 u16 to;
5502 } opa_link_xlate[] = {
5503 { OPA_LINK_WIDTH_1X, 1 << (1-1) },
5504 { OPA_LINK_WIDTH_2X, 1 << (2-1) },
5505 { OPA_LINK_WIDTH_3X, 1 << (3-1) },
5506 { OPA_LINK_WIDTH_4X, 1 << (4-1) },
5507 };
5508
5509 for (i = 0; i < ARRAY_SIZE(opa_link_xlate); i++) {
5510 if (opa_widths & opa_link_xlate[i].from)
5511 result |= opa_link_xlate[i].to;
5512 }
5513 return result;
5514}
5515
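/*
 * Usage sketch (not driver code) for opa_to_vc_link_widths(): each
 * OPA_LINK_WIDTH_nX flag maps to bit (n - 1) of the VC attribute, so a
 * 1X + 4X enable mask translates to 0b1001.
 */
static void example_link_width_xlate(void)
{
	u16 vc = opa_to_vc_link_widths(OPA_LINK_WIDTH_1X | OPA_LINK_WIDTH_4X);

	WARN_ON(vc != ((1 << 0) | (1 << 3)));	/* 0b1001 */
}
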
5516/*
5517 * Set link attributes before moving to polling.
5518 */
5519static int set_local_link_attributes(struct hfi1_pportdata *ppd)
5520{
5521 struct hfi1_devdata *dd = ppd->dd;
5522 u8 enable_lane_tx;
5523 u8 tx_polarity_inversion;
5524 u8 rx_polarity_inversion;
5525 int ret;
5526
5527 /* reset our fabric serdes to clear any lingering problems */
5528 fabric_serdes_reset(dd);
5529
5530 /* set the local tx rate - need to read-modify-write */
5531 ret = read_tx_settings(dd, &enable_lane_tx, &tx_polarity_inversion,
5532 &rx_polarity_inversion, &ppd->local_tx_rate);
5533 if (ret)
5534 goto set_local_link_attributes_fail;
5535
5536 if (dd->dc8051_ver < dc8051_ver(0, 20)) {
5537 /* set the tx rate to the fastest enabled */
5538 if (ppd->link_speed_enabled & OPA_LINK_SPEED_25G)
5539 ppd->local_tx_rate = 1;
5540 else
5541 ppd->local_tx_rate = 0;
5542 } else {
5543 /* set the tx rate to all enabled */
5544 ppd->local_tx_rate = 0;
5545 if (ppd->link_speed_enabled & OPA_LINK_SPEED_25G)
5546 ppd->local_tx_rate |= 2;
5547 if (ppd->link_speed_enabled & OPA_LINK_SPEED_12_5G)
5548 ppd->local_tx_rate |= 1;
5549 }
5550
5551	enable_lane_tx = 0xF; /* enable all four lanes */
5552	ret = write_tx_settings(dd, enable_lane_tx, tx_polarity_inversion,
5553 rx_polarity_inversion, ppd->local_tx_rate);
5554 if (ret != HCMD_SUCCESS)
5555 goto set_local_link_attributes_fail;
5556
5557 /*
5558 * DC supports continuous updates.
5559 */
5560 ret = write_vc_local_phy(dd, 0 /* no power management */,
5561 1 /* continuous updates */);
5562 if (ret != HCMD_SUCCESS)
5563 goto set_local_link_attributes_fail;
5564
5565 /* z=1 in the next call: AU of 0 is not supported by the hardware */
5566 ret = write_vc_local_fabric(dd, dd->vau, 1, dd->vcu, dd->vl15_init,
5567 ppd->port_crc_mode_enabled);
5568 if (ret != HCMD_SUCCESS)
5569 goto set_local_link_attributes_fail;
5570
5571 ret = write_vc_local_link_width(dd, 0, 0,
5572 opa_to_vc_link_widths(ppd->link_width_enabled));
5573 if (ret != HCMD_SUCCESS)
5574 goto set_local_link_attributes_fail;
5575
5576 /* let peer know who we are */
5577 ret = write_local_device_id(dd, dd->pcidev->device, dd->minrev);
5578 if (ret == HCMD_SUCCESS)
5579 return 0;
5580
5581set_local_link_attributes_fail:
5582 dd_dev_err(dd,
5583 "Failed to set local link attributes, return 0x%x\n",
5584 ret);
5585 return ret;
5586}
5587
5588/*
5589 * Call this to start the link. Schedule a retry if the cable is not
5590 * present or if unable to start polling. Do not do anything if the
5591 * link is disabled. Returns 0 if link is disabled or moved to polling
5592 */
5593int start_link(struct hfi1_pportdata *ppd)
5594{
5595 if (!ppd->link_enabled) {
5596 dd_dev_info(ppd->dd,
5597 "%s: stopping link start because link is disabled\n",
5598 __func__);
5599 return 0;
5600 }
5601 if (!ppd->driver_link_ready) {
5602 dd_dev_info(ppd->dd,
5603 "%s: stopping link start because driver is not ready\n",
5604 __func__);
5605 return 0;
5606 }
5607
5608 if (qsfp_mod_present(ppd) || loopback == LOOPBACK_SERDES ||
5609 loopback == LOOPBACK_LCB ||
5610 ppd->dd->icode == ICODE_FUNCTIONAL_SIMULATOR)
5611 return set_link_state(ppd, HLS_DN_POLL);
5612
5613 dd_dev_info(ppd->dd,
5614 "%s: stopping link start because no cable is present\n",
5615 __func__);
5616 return -EAGAIN;
5617}
5618
5619static void reset_qsfp(struct hfi1_pportdata *ppd)
5620{
5621 struct hfi1_devdata *dd = ppd->dd;
5622 u64 mask, qsfp_mask;
5623
5624 mask = (u64)QSFP_HFI0_RESET_N;
5625 qsfp_mask = read_csr(dd,
5626 dd->hfi1_id ? ASIC_QSFP2_OE : ASIC_QSFP1_OE);
5627 qsfp_mask |= mask;
5628 write_csr(dd,
5629 dd->hfi1_id ? ASIC_QSFP2_OE : ASIC_QSFP1_OE,
5630 qsfp_mask);
5631
5632 qsfp_mask = read_csr(dd,
5633 dd->hfi1_id ? ASIC_QSFP2_OUT : ASIC_QSFP1_OUT);
5634 qsfp_mask &= ~mask;
5635 write_csr(dd,
5636 dd->hfi1_id ? ASIC_QSFP2_OUT : ASIC_QSFP1_OUT,
5637 qsfp_mask);
5638
5639 udelay(10);
5640
5641 qsfp_mask |= mask;
5642 write_csr(dd,
5643 dd->hfi1_id ? ASIC_QSFP2_OUT : ASIC_QSFP1_OUT,
5644 qsfp_mask);
5645}
5646
5647static int handle_qsfp_error_conditions(struct hfi1_pportdata *ppd,
5648 u8 *qsfp_interrupt_status)
5649{
5650 struct hfi1_devdata *dd = ppd->dd;
5651
5652 if ((qsfp_interrupt_status[0] & QSFP_HIGH_TEMP_ALARM) ||
5653 (qsfp_interrupt_status[0] & QSFP_HIGH_TEMP_WARNING))
5654 dd_dev_info(dd,
5655			"%s: QSFP cable temperature too high\n",
5656 __func__);
5657
5658 if ((qsfp_interrupt_status[0] & QSFP_LOW_TEMP_ALARM) ||
5659 (qsfp_interrupt_status[0] & QSFP_LOW_TEMP_WARNING))
5660 dd_dev_info(dd,
5661 "%s: QSFP cable temperature too low\n",
5662 __func__);
5663
5664 if ((qsfp_interrupt_status[1] & QSFP_HIGH_VCC_ALARM) ||
5665 (qsfp_interrupt_status[1] & QSFP_HIGH_VCC_WARNING))
5666 dd_dev_info(dd,
5667 "%s: QSFP supply voltage too high\n",
5668 __func__);
5669
5670 if ((qsfp_interrupt_status[1] & QSFP_LOW_VCC_ALARM) ||
5671 (qsfp_interrupt_status[1] & QSFP_LOW_VCC_WARNING))
5672 dd_dev_info(dd,
5673 "%s: QSFP supply voltage too low\n",
5674 __func__);
5675
5676 /* Byte 2 is vendor specific */
5677
5678 if ((qsfp_interrupt_status[3] & QSFP_HIGH_POWER_ALARM) ||
5679 (qsfp_interrupt_status[3] & QSFP_HIGH_POWER_WARNING))
5680 dd_dev_info(dd,
5681 "%s: Cable RX channel 1/2 power too high\n",
5682 __func__);
5683
5684 if ((qsfp_interrupt_status[3] & QSFP_LOW_POWER_ALARM) ||
5685 (qsfp_interrupt_status[3] & QSFP_LOW_POWER_WARNING))
5686 dd_dev_info(dd,
5687 "%s: Cable RX channel 1/2 power too low\n",
5688 __func__);
5689
5690 if ((qsfp_interrupt_status[4] & QSFP_HIGH_POWER_ALARM) ||
5691 (qsfp_interrupt_status[4] & QSFP_HIGH_POWER_WARNING))
5692 dd_dev_info(dd,
5693 "%s: Cable RX channel 3/4 power too high\n",
5694 __func__);
5695
5696 if ((qsfp_interrupt_status[4] & QSFP_LOW_POWER_ALARM) ||
5697 (qsfp_interrupt_status[4] & QSFP_LOW_POWER_WARNING))
5698 dd_dev_info(dd,
5699 "%s: Cable RX channel 3/4 power too low\n",
5700 __func__);
5701
5702 if ((qsfp_interrupt_status[5] & QSFP_HIGH_BIAS_ALARM) ||
5703 (qsfp_interrupt_status[5] & QSFP_HIGH_BIAS_WARNING))
5704 dd_dev_info(dd,
5705 "%s: Cable TX channel 1/2 bias too high\n",
5706 __func__);
5707
5708 if ((qsfp_interrupt_status[5] & QSFP_LOW_BIAS_ALARM) ||
5709 (qsfp_interrupt_status[5] & QSFP_LOW_BIAS_WARNING))
5710 dd_dev_info(dd,
5711 "%s: Cable TX channel 1/2 bias too low\n",
5712 __func__);
5713
5714 if ((qsfp_interrupt_status[6] & QSFP_HIGH_BIAS_ALARM) ||
5715 (qsfp_interrupt_status[6] & QSFP_HIGH_BIAS_WARNING))
5716 dd_dev_info(dd,
5717 "%s: Cable TX channel 3/4 bias too high\n",
5718 __func__);
5719
5720 if ((qsfp_interrupt_status[6] & QSFP_LOW_BIAS_ALARM) ||
5721 (qsfp_interrupt_status[6] & QSFP_LOW_BIAS_WARNING))
5722 dd_dev_info(dd,
5723 "%s: Cable TX channel 3/4 bias too low\n",
5724 __func__);
5725
5726 if ((qsfp_interrupt_status[7] & QSFP_HIGH_POWER_ALARM) ||
5727 (qsfp_interrupt_status[7] & QSFP_HIGH_POWER_WARNING))
5728 dd_dev_info(dd,
5729 "%s: Cable TX channel 1/2 power too high\n",
5730 __func__);
5731
5732 if ((qsfp_interrupt_status[7] & QSFP_LOW_POWER_ALARM) ||
5733 (qsfp_interrupt_status[7] & QSFP_LOW_POWER_WARNING))
5734 dd_dev_info(dd,
5735 "%s: Cable TX channel 1/2 power too low\n",
5736 __func__);
5737
5738 if ((qsfp_interrupt_status[8] & QSFP_HIGH_POWER_ALARM) ||
5739 (qsfp_interrupt_status[8] & QSFP_HIGH_POWER_WARNING))
5740 dd_dev_info(dd,
5741 "%s: Cable TX channel 3/4 power too high\n",
5742 __func__);
5743
5744 if ((qsfp_interrupt_status[8] & QSFP_LOW_POWER_ALARM) ||
5745 (qsfp_interrupt_status[8] & QSFP_LOW_POWER_WARNING))
5746 dd_dev_info(dd,
5747 "%s: Cable TX channel 3/4 power too low\n",
5748 __func__);
5749
5750 /* Bytes 9-10 and 11-12 are reserved */
5751 /* Bytes 13-15 are vendor specific */
5752
5753 return 0;
5754}
5755
5756static int do_pre_lni_host_behaviors(struct hfi1_pportdata *ppd)
5757{
5758 refresh_qsfp_cache(ppd, &ppd->qsfp_info);
5759
5760 return 0;
5761}
5762
5763static int do_qsfp_intr_fallback(struct hfi1_pportdata *ppd)
5764{
5765 struct hfi1_devdata *dd = ppd->dd;
5766 u8 qsfp_interrupt_status = 0;
5767
5768 if (qsfp_read(ppd, dd->hfi1_id, 2, &qsfp_interrupt_status, 1)
5769 != 1) {
5770 dd_dev_info(dd,
5771 "%s: Failed to read status of QSFP module\n",
5772 __func__);
5773 return -EIO;
5774 }
5775
5776 /* We don't care about alarms & warnings with a non-functional INT_N */
5777 if (!(qsfp_interrupt_status & QSFP_DATA_NOT_READY))
5778 do_pre_lni_host_behaviors(ppd);
5779
5780 return 0;
5781}
5782
5783/* This routine will only be scheduled if the QSFP module is present */
5784static void qsfp_event(struct work_struct *work)
5785{
5786 struct qsfp_data *qd;
5787 struct hfi1_pportdata *ppd;
5788 struct hfi1_devdata *dd;
5789
5790 qd = container_of(work, struct qsfp_data, qsfp_work);
5791 ppd = qd->ppd;
5792 dd = ppd->dd;
5793
5794 /* Sanity check */
5795 if (!qsfp_mod_present(ppd))
5796 return;
5797
5798 /*
5799	 * Turn the DC back on after the cable has been
5800 * re-inserted. Up until now, the DC has been in
5801 * reset to save power.
5802 */
5803 dc_start(dd);
5804
5805 if (qd->cache_refresh_required) {
5806 msleep(3000);
5807 reset_qsfp(ppd);
5808
5809 /* Check for QSFP interrupt after t_init (SFF 8679)
5810 * + extra
5811 */
5812 msleep(3000);
5813 if (!qd->qsfp_interrupt_functional) {
5814 if (do_qsfp_intr_fallback(ppd) < 0)
5815 dd_dev_info(dd, "%s: QSFP fallback failed\n",
5816 __func__);
5817 ppd->driver_link_ready = 1;
5818 start_link(ppd);
5819 }
5820 }
5821
5822 if (qd->check_interrupt_flags) {
5823 u8 qsfp_interrupt_status[16] = {0,};
5824
5825 if (qsfp_read(ppd, dd->hfi1_id, 6,
5826 &qsfp_interrupt_status[0], 16) != 16) {
5827 dd_dev_info(dd,
5828 "%s: Failed to read status of QSFP module\n",
5829 __func__);
5830 } else {
5831 unsigned long flags;
5832 u8 data_status;
5833
5834 spin_lock_irqsave(&ppd->qsfp_info.qsfp_lock, flags);
5835 ppd->qsfp_info.check_interrupt_flags = 0;
5836 spin_unlock_irqrestore(&ppd->qsfp_info.qsfp_lock,
5837 flags);
5838
5839 if (qsfp_read(ppd, dd->hfi1_id, 2, &data_status, 1)
5840 != 1) {
5841 dd_dev_info(dd,
5842 "%s: Failed to read status of QSFP module\n",
5843 __func__);
5844 }
5845 if (!(data_status & QSFP_DATA_NOT_READY)) {
5846 do_pre_lni_host_behaviors(ppd);
5847 start_link(ppd);
5848 } else
5849 handle_qsfp_error_conditions(ppd,
5850 qsfp_interrupt_status);
5851 }
5852 }
5853}
5854
5855void init_qsfp(struct hfi1_pportdata *ppd)
5856{
5857 struct hfi1_devdata *dd = ppd->dd;
5858 u64 qsfp_mask;
5859
5860 if (loopback == LOOPBACK_SERDES || loopback == LOOPBACK_LCB ||
5861	    ppd->dd->icode == ICODE_FUNCTIONAL_SIMULATOR) {
5862		ppd->driver_link_ready = 1;
5863 return;
5864 }
5865
5866 ppd->qsfp_info.ppd = ppd;
5867 INIT_WORK(&ppd->qsfp_info.qsfp_work, qsfp_event);
5868
5869 qsfp_mask = (u64)(QSFP_HFI0_INT_N | QSFP_HFI0_MODPRST_N);
5870 /* Clear current status to avoid spurious interrupts */
5871 write_csr(dd,
5872 dd->hfi1_id ?
5873 ASIC_QSFP2_CLEAR :
5874 ASIC_QSFP1_CLEAR,
5875 qsfp_mask);
5876
5877 /* Handle active low nature of INT_N and MODPRST_N pins */
5878 if (qsfp_mod_present(ppd))
5879 qsfp_mask &= ~(u64)QSFP_HFI0_MODPRST_N;
5880 write_csr(dd,
5881 dd->hfi1_id ? ASIC_QSFP2_INVERT : ASIC_QSFP1_INVERT,
5882 qsfp_mask);
5883
5884 /* Allow only INT_N and MODPRST_N to trigger QSFP interrupts */
5885 qsfp_mask |= (u64)QSFP_HFI0_MODPRST_N;
5886 write_csr(dd,
5887 dd->hfi1_id ? ASIC_QSFP2_MASK : ASIC_QSFP1_MASK,
5888 qsfp_mask);
5889
5890 if (qsfp_mod_present(ppd)) {
5891 msleep(3000);
5892 reset_qsfp(ppd);
5893
5894 /* Check for QSFP interrupt after t_init (SFF 8679)
5895 * + extra
5896 */
5897 msleep(3000);
5898 if (!ppd->qsfp_info.qsfp_interrupt_functional) {
5899 if (do_qsfp_intr_fallback(ppd) < 0)
5900 dd_dev_info(dd,
5901 "%s: QSFP fallback failed\n",
5902 __func__);
5903 ppd->driver_link_ready = 1;
5904 }
5905 }
5906}
5907
5908int bringup_serdes(struct hfi1_pportdata *ppd)
5909{
5910 struct hfi1_devdata *dd = ppd->dd;
5911 u64 guid;
5912 int ret;
5913
5914 if (HFI1_CAP_IS_KSET(EXTENDED_PSN))
5915 add_rcvctrl(dd, RCV_CTRL_RCV_EXTENDED_PSN_ENABLE_SMASK);
5916
5917 guid = ppd->guid;
5918 if (!guid) {
5919 if (dd->base_guid)
5920 guid = dd->base_guid + ppd->port - 1;
5921 ppd->guid = guid;
5922 }
5923
5924 /* the link defaults to enabled */
5925 ppd->link_enabled = 1;
5926 /* Set linkinit_reason on power up per OPA spec */
5927 ppd->linkinit_reason = OPA_LINKINIT_REASON_LINKUP;
5928
5929 if (loopback) {
5930 ret = init_loopback(dd);
5931 if (ret < 0)
5932 return ret;
5933 }
5934
5935 return start_link(ppd);
5936}
5937
5938void hfi1_quiet_serdes(struct hfi1_pportdata *ppd)
5939{
5940 struct hfi1_devdata *dd = ppd->dd;
5941
5942 /*
5943	 * Shut down the link and keep it down. First clear the flag that
5944	 * says the driver wants to allow the link to be up (driver_link_ready).
5945 * Then make sure the link is not automatically restarted
5946 * (link_enabled). Cancel any pending restart. And finally
5947 * go offline.
5948 */
5949 ppd->driver_link_ready = 0;
5950 ppd->link_enabled = 0;
5951
5952 set_link_down_reason(ppd, OPA_LINKDOWN_REASON_SMA_DISABLED, 0,
5953 OPA_LINKDOWN_REASON_SMA_DISABLED);
5954 set_link_state(ppd, HLS_DN_OFFLINE);
5955
5956 /* disable the port */
5957 clear_rcvctrl(dd, RCV_CTRL_RCV_PORT_ENABLE_SMASK);
5958}
5959
5960static inline int init_cpu_counters(struct hfi1_devdata *dd)
5961{
5962 struct hfi1_pportdata *ppd;
5963 int i;
5964
5965 ppd = (struct hfi1_pportdata *)(dd + 1);
5966 for (i = 0; i < dd->num_pports; i++, ppd++) {
5967 ppd->ibport_data.rc_acks = NULL;
5968 ppd->ibport_data.rc_qacks = NULL;
5969 ppd->ibport_data.rc_acks = alloc_percpu(u64);
5970 ppd->ibport_data.rc_qacks = alloc_percpu(u64);
5971 ppd->ibport_data.rc_delayed_comp = alloc_percpu(u64);
5972 if ((ppd->ibport_data.rc_acks == NULL) ||
5973 (ppd->ibport_data.rc_delayed_comp == NULL) ||
5974 (ppd->ibport_data.rc_qacks == NULL))
5975 return -ENOMEM;
5976 }
5977
5978 return 0;
5979}
5980
5981static const char * const pt_names[] = {
5982 "expected",
5983 "eager",
5984 "invalid"
5985};
5986
5987static const char *pt_name(u32 type)
5988{
5989 return type >= ARRAY_SIZE(pt_names) ? "unknown" : pt_names[type];
5990}
5991
5992/*
5993 * index is the index into the receive array
5994 */
5995void hfi1_put_tid(struct hfi1_devdata *dd, u32 index,
5996 u32 type, unsigned long pa, u16 order)
5997{
5998 u64 reg;
5999 void __iomem *base = (dd->rcvarray_wc ? dd->rcvarray_wc :
6000 (dd->kregbase + RCV_ARRAY));
6001
6002 if (!(dd->flags & HFI1_PRESENT))
6003 goto done;
6004
6005 if (type == PT_INVALID) {
6006 pa = 0;
6007 } else if (type > PT_INVALID) {
6008 dd_dev_err(dd,
6009 "unexpected receive array type %u for index %u, not handled\n",
6010 type, index);
6011 goto done;
6012 }
6013
6014 hfi1_cdbg(TID, "type %s, index 0x%x, pa 0x%lx, bsize 0x%lx",
6015 pt_name(type), index, pa, (unsigned long)order);
6016
6017#define RT_ADDR_SHIFT 12 /* 4KB kernel address boundary */
6018 reg = RCV_ARRAY_RT_WRITE_ENABLE_SMASK
6019 | (u64)order << RCV_ARRAY_RT_BUF_SIZE_SHIFT
6020 | ((pa >> RT_ADDR_SHIFT) & RCV_ARRAY_RT_ADDR_MASK)
6021 << RCV_ARRAY_RT_ADDR_SHIFT;
6022 writeq(reg, base + (index * 8));
6023
6024 if (type == PT_EAGER)
6025 /*
6026 * Eager entries are written one-by-one so we have to push them
6027 * after we write the entry.
6028 */
6029 flush_wc();
6030done:
6031 return;
6032}
6033
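/*
 * Illustrative sketch (not driver code) of the RcvArray entry built by
 * hfi1_put_tid(): a write-enable bit, the buffer-size order, and the
 * physical address reduced to 4 KB granularity. The bit positions below
 * are hypothetical stand-ins for the RCV_ARRAY_RT_* definitions.
 */
#define EXAMPLE_RT_WRITE_ENABLE (1ull << 63)
#define EXAMPLE_RT_BUF_SIZE_SHIFT 48
#define EXAMPLE_RT_ADDR_MASK 0xffffffffffull

static u64 example_rcvarray_entry(unsigned long pa, u16 order)
{
	return EXAMPLE_RT_WRITE_ENABLE
		| (u64)order << EXAMPLE_RT_BUF_SIZE_SHIFT
		| ((pa >> 12) & EXAMPLE_RT_ADDR_MASK);	/* 4 KB address units */
}
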
6034void hfi1_clear_tids(struct hfi1_ctxtdata *rcd)
6035{
6036 struct hfi1_devdata *dd = rcd->dd;
6037 u32 i;
6038
6039 /* this could be optimized */
6040 for (i = rcd->eager_base; i < rcd->eager_base +
6041 rcd->egrbufs.alloced; i++)
6042 hfi1_put_tid(dd, i, PT_INVALID, 0, 0);
6043
6044 for (i = rcd->expected_base;
6045 i < rcd->expected_base + rcd->expected_count; i++)
6046 hfi1_put_tid(dd, i, PT_INVALID, 0, 0);
6047}
6048
6049int hfi1_get_base_kinfo(struct hfi1_ctxtdata *rcd,
6050 struct hfi1_ctxt_info *kinfo)
6051{
6052 kinfo->runtime_flags = (HFI1_MISC_GET() << HFI1_CAP_USER_SHIFT) |
6053 HFI1_CAP_UGET(MASK) | HFI1_CAP_KGET(K2U);
6054 return 0;
6055}
6056
6057struct hfi1_message_header *hfi1_get_msgheader(
6058 struct hfi1_devdata *dd, __le32 *rhf_addr)
6059{
6060 u32 offset = rhf_hdrq_offset(rhf_to_cpu(rhf_addr));
6061
6062 return (struct hfi1_message_header *)
6063 (rhf_addr - dd->rhf_offset + offset);
6064}
6065
6066static const char * const ib_cfg_name_strings[] = {
6067 "HFI1_IB_CFG_LIDLMC",
6068 "HFI1_IB_CFG_LWID_DG_ENB",
6069 "HFI1_IB_CFG_LWID_ENB",
6070 "HFI1_IB_CFG_LWID",
6071 "HFI1_IB_CFG_SPD_ENB",
6072 "HFI1_IB_CFG_SPD",
6073 "HFI1_IB_CFG_RXPOL_ENB",
6074 "HFI1_IB_CFG_LREV_ENB",
6075 "HFI1_IB_CFG_LINKLATENCY",
6076 "HFI1_IB_CFG_HRTBT",
6077 "HFI1_IB_CFG_OP_VLS",
6078 "HFI1_IB_CFG_VL_HIGH_CAP",
6079 "HFI1_IB_CFG_VL_LOW_CAP",
6080 "HFI1_IB_CFG_OVERRUN_THRESH",
6081 "HFI1_IB_CFG_PHYERR_THRESH",
6082 "HFI1_IB_CFG_LINKDEFAULT",
6083 "HFI1_IB_CFG_PKEYS",
6084 "HFI1_IB_CFG_MTU",
6085 "HFI1_IB_CFG_LSTATE",
6086 "HFI1_IB_CFG_VL_HIGH_LIMIT",
6087 "HFI1_IB_CFG_PMA_TICKS",
6088 "HFI1_IB_CFG_PORT"
6089};
6090
6091static const char *ib_cfg_name(int which)
6092{
6093 if (which < 0 || which >= ARRAY_SIZE(ib_cfg_name_strings))
6094 return "invalid";
6095 return ib_cfg_name_strings[which];
6096}
6097
6098int hfi1_get_ib_cfg(struct hfi1_pportdata *ppd, int which)
6099{
6100 struct hfi1_devdata *dd = ppd->dd;
6101 int val = 0;
6102
6103 switch (which) {
6104 case HFI1_IB_CFG_LWID_ENB: /* allowed Link-width */
6105 val = ppd->link_width_enabled;
6106 break;
6107 case HFI1_IB_CFG_LWID: /* currently active Link-width */
6108 val = ppd->link_width_active;
6109 break;
6110 case HFI1_IB_CFG_SPD_ENB: /* allowed Link speeds */
6111 val = ppd->link_speed_enabled;
6112 break;
6113 case HFI1_IB_CFG_SPD: /* current Link speed */
6114 val = ppd->link_speed_active;
6115 break;
6116
6117 case HFI1_IB_CFG_RXPOL_ENB: /* Auto-RX-polarity enable */
6118 case HFI1_IB_CFG_LREV_ENB: /* Auto-Lane-reversal enable */
6119 case HFI1_IB_CFG_LINKLATENCY:
6120 goto unimplemented;
6121
6122 case HFI1_IB_CFG_OP_VLS:
6123 val = ppd->vls_operational;
6124 break;
6125 case HFI1_IB_CFG_VL_HIGH_CAP: /* VL arb high priority table size */
6126 val = VL_ARB_HIGH_PRIO_TABLE_SIZE;
6127 break;
6128 case HFI1_IB_CFG_VL_LOW_CAP: /* VL arb low priority table size */
6129 val = VL_ARB_LOW_PRIO_TABLE_SIZE;
6130 break;
6131 case HFI1_IB_CFG_OVERRUN_THRESH: /* IB overrun threshold */
6132 val = ppd->overrun_threshold;
6133 break;
6134 case HFI1_IB_CFG_PHYERR_THRESH: /* IB PHY error threshold */
6135 val = ppd->phy_error_threshold;
6136 break;
6137 case HFI1_IB_CFG_LINKDEFAULT: /* IB link default (sleep/poll) */
6138 val = dd->link_default;
6139 break;
6140
6141 case HFI1_IB_CFG_HRTBT: /* Heartbeat off/enable/auto */
6142 case HFI1_IB_CFG_PMA_TICKS:
6143 default:
6144unimplemented:
6145 if (HFI1_CAP_IS_KSET(PRINT_UNIMPL))
6146 dd_dev_info(
6147 dd,
6148 "%s: which %s: not implemented\n",
6149 __func__,
6150 ib_cfg_name(which));
6151 break;
6152 }
6153
6154 return val;
6155}
6156
6157/*
6158 * The largest MAD packet size.
6159 */
6160#define MAX_MAD_PACKET 2048
6161
6162/*
6163 * Return the maximum header bytes that can go on the _wire_
6164 * for this device. This count includes the ICRC which is
6165 * not part of the packet held in memory but it is appended
6166 * by the HW.
6167 * This is dependent on the device's receive header entry size.
6168 * HFI allows this to be set per-receive context, but the
6169 * driver presently enforces a global value.
6170 */
6171u32 lrh_max_header_bytes(struct hfi1_devdata *dd)
6172{
6173 /*
6174 * The maximum non-payload (MTU) bytes in LRH.PktLen are
6175 * the Receive Header Entry Size minus the PBC (or RHF) size
6176 * plus one DW for the ICRC appended by HW.
6177 *
6178 * dd->rcd[0].rcvhdrqentsize is in DW.
6179	 * We use rcd[0] as all contexts will have the same value. Also,
6180 * the first kernel context would have been allocated by now so
6181 * we are guaranteed a valid value.
6182 */
6183 return (dd->rcd[0]->rcvhdrqentsize - 2/*PBC/RHF*/ + 1/*ICRC*/) << 2;
6184}
6185
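/*
 * Worked example (sketch only) for lrh_max_header_bytes(): with a
 * hypothetical receive header entry size of 32 DW, the wire header
 * budget is (32 - 2 + 1) << 2 = 124 bytes (header plus the HW-appended
 * ICRC, minus the PBC/RHF that never hits the wire).
 */
static u32 example_lrh_max_header_bytes(u32 rcvhdrqentsize_dw)
{
	return (rcvhdrqentsize_dw - 2 /* PBC/RHF */ + 1 /* ICRC */) << 2;
}
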
6186/*
6187 * Set Send Length
6188 * @ppd - per port data
6189 *
6190 * Set the MTU by limiting how many DWs may be sent. The SendLenCheck*
6191 * registers compare against LRH.PktLen, so use the max bytes included
6192 * in the LRH.
6193 *
6194 * This routine changes all VL values except VL15, which it maintains at
6195 * the same value.
6196 */
6197static void set_send_length(struct hfi1_pportdata *ppd)
6198{
6199 struct hfi1_devdata *dd = ppd->dd;
6200 u32 max_hb = lrh_max_header_bytes(dd), maxvlmtu = 0, dcmtu;
6201 u64 len1 = 0, len2 = (((dd->vld[15].mtu + max_hb) >> 2)
6202 & SEND_LEN_CHECK1_LEN_VL15_MASK) <<
6203 SEND_LEN_CHECK1_LEN_VL15_SHIFT;
6204 int i;
6205
6206 for (i = 0; i < ppd->vls_supported; i++) {
6207 if (dd->vld[i].mtu > maxvlmtu)
6208 maxvlmtu = dd->vld[i].mtu;
6209 if (i <= 3)
6210 len1 |= (((dd->vld[i].mtu + max_hb) >> 2)
6211 & SEND_LEN_CHECK0_LEN_VL0_MASK) <<
6212 ((i % 4) * SEND_LEN_CHECK0_LEN_VL1_SHIFT);
6213 else
6214 len2 |= (((dd->vld[i].mtu + max_hb) >> 2)
6215 & SEND_LEN_CHECK1_LEN_VL4_MASK) <<
6216 ((i % 4) * SEND_LEN_CHECK1_LEN_VL5_SHIFT);
6217 }
6218 write_csr(dd, SEND_LEN_CHECK0, len1);
6219 write_csr(dd, SEND_LEN_CHECK1, len2);
6220 /* adjust kernel credit return thresholds based on new MTUs */
6221 /* all kernel receive contexts have the same hdrqentsize */
6222 for (i = 0; i < ppd->vls_supported; i++) {
6223 sc_set_cr_threshold(dd->vld[i].sc,
6224 sc_mtu_to_threshold(dd->vld[i].sc, dd->vld[i].mtu,
6225 dd->rcd[0]->rcvhdrqentsize));
6226 }
6227 sc_set_cr_threshold(dd->vld[15].sc,
6228 sc_mtu_to_threshold(dd->vld[15].sc, dd->vld[15].mtu,
6229 dd->rcd[0]->rcvhdrqentsize));
6230
6231 /* Adjust maximum MTU for the port in DC */
6232 dcmtu = maxvlmtu == 10240 ? DCC_CFG_PORT_MTU_CAP_10240 :
6233 (ilog2(maxvlmtu >> 8) + 1);
6234 len1 = read_csr(ppd->dd, DCC_CFG_PORT_CONFIG);
6235 len1 &= ~DCC_CFG_PORT_CONFIG_MTU_CAP_SMASK;
6236 len1 |= ((u64)dcmtu & DCC_CFG_PORT_CONFIG_MTU_CAP_MASK) <<
6237 DCC_CFG_PORT_CONFIG_MTU_CAP_SHIFT;
6238 write_csr(ppd->dd, DCC_CFG_PORT_CONFIG, len1);
6239}
6240
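/*
 * Illustrative sketch (not driver code) of the DC MTU capability
 * encoding at the end of set_send_length(): 10240 bytes gets the
 * dedicated 10 KB code, anything smaller is ilog2(mtu >> 8) + 1, e.g.
 * 2048 -> ilog2(8) + 1 = 4 and 8192 -> ilog2(32) + 1 = 6. The 10 KB
 * code below is a hypothetical placeholder for
 * DCC_CFG_PORT_MTU_CAP_10240.
 */
#define EXAMPLE_MTU_CAP_10240 7

static u32 example_dc_mtu_cap(u32 maxvlmtu)
{
	return maxvlmtu == 10240 ? EXAMPLE_MTU_CAP_10240
				 : (u32)(ilog2(maxvlmtu >> 8) + 1);
}
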
6241static void set_lidlmc(struct hfi1_pportdata *ppd)
6242{
6243 int i;
6244 u64 sreg = 0;
6245 struct hfi1_devdata *dd = ppd->dd;
6246 u32 mask = ~((1U << ppd->lmc) - 1);
6247 u64 c1 = read_csr(ppd->dd, DCC_CFG_PORT_CONFIG1);
6248
6249 if (dd->hfi1_snoop.mode_flag)
6250 dd_dev_info(dd, "Set lid/lmc while snooping");
6251
6252 c1 &= ~(DCC_CFG_PORT_CONFIG1_TARGET_DLID_SMASK
6253 | DCC_CFG_PORT_CONFIG1_DLID_MASK_SMASK);
6254 c1 |= ((ppd->lid & DCC_CFG_PORT_CONFIG1_TARGET_DLID_MASK)
6255 << DCC_CFG_PORT_CONFIG1_TARGET_DLID_SHIFT)|
6256 ((mask & DCC_CFG_PORT_CONFIG1_DLID_MASK_MASK)
6257 << DCC_CFG_PORT_CONFIG1_DLID_MASK_SHIFT);
6258 write_csr(ppd->dd, DCC_CFG_PORT_CONFIG1, c1);
6259
6260 /*
6261 * Iterate over all the send contexts and set their SLID check
6262 */
6263 sreg = ((mask & SEND_CTXT_CHECK_SLID_MASK_MASK) <<
6264 SEND_CTXT_CHECK_SLID_MASK_SHIFT) |
6265 (((ppd->lid & mask) & SEND_CTXT_CHECK_SLID_VALUE_MASK) <<
6266 SEND_CTXT_CHECK_SLID_VALUE_SHIFT);
6267
6268 for (i = 0; i < dd->chip_send_contexts; i++) {
6269 hfi1_cdbg(LINKVERB, "SendContext[%d].SLID_CHECK = 0x%x",
6270 i, (u32)sreg);
6271 write_kctxt_csr(dd, i, SEND_CTXT_CHECK_SLID, sreg);
6272 }
6273
6274 /* Now we have to do the same thing for the sdma engines */
6275 sdma_update_lmc(dd, mask, ppd->lid);
6276}
6277
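/*
 * Worked example (sketch only) for the LMC masking in set_lidlmc(): with
 * lmc = 2 the mask is ~((1 << 2) - 1) = 0xfffffffc, so the low two LID
 * bits are ignored by the DLID/SLID checks and a base LID of 0x10
 * matches 0x10 through 0x13.
 */
static u32 example_lmc_mask(u8 lmc)
{
	return ~((1U << lmc) - 1);	/* lmc = 2 -> 0xfffffffc */
}
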
6278static int wait_phy_linkstate(struct hfi1_devdata *dd, u32 state, u32 msecs)
6279{
6280 unsigned long timeout;
6281 u32 curr_state;
6282
6283 timeout = jiffies + msecs_to_jiffies(msecs);
6284 while (1) {
6285 curr_state = read_physical_state(dd);
6286 if (curr_state == state)
6287 break;
6288 if (time_after(jiffies, timeout)) {
6289 dd_dev_err(dd,
6290 "timeout waiting for phy link state 0x%x, current state is 0x%x\n",
6291 state, curr_state);
6292 return -ETIMEDOUT;
6293 }
6294 usleep_range(1950, 2050); /* sleep 2ms-ish */
6295 }
6296
6297 return 0;
6298}
6299
6300/*
6301 * Helper for set_link_state(). Do not call except from that routine.
6302 * Expects ppd->hls_mutex to be held.
6303 *
6304 * @rem_reason value to be sent to the neighbor
6305 *
6306 * LinkDownReasons only set if transition succeeds.
6307 */
6308static int goto_offline(struct hfi1_pportdata *ppd, u8 rem_reason)
6309{
6310 struct hfi1_devdata *dd = ppd->dd;
6311 u32 pstate, previous_state;
6312 u32 last_local_state;
6313 u32 last_remote_state;
6314 int ret;
6315 int do_transition;
6316 int do_wait;
6317
6318 previous_state = ppd->host_link_state;
6319 ppd->host_link_state = HLS_GOING_OFFLINE;
6320 pstate = read_physical_state(dd);
6321 if (pstate == PLS_OFFLINE) {
6322 do_transition = 0; /* in right state */
6323 do_wait = 0; /* ...no need to wait */
6324 } else if ((pstate & 0xff) == PLS_OFFLINE) {
6325 do_transition = 0; /* in an offline transient state */
6326 do_wait = 1; /* ...wait for it to settle */
6327 } else {
6328 do_transition = 1; /* need to move to offline */
6329 do_wait = 1; /* ...will need to wait */
6330 }
6331
6332 if (do_transition) {
6333 ret = set_physical_link_state(dd,
6334 PLS_OFFLINE | (rem_reason << 8));
6335
6336 if (ret != HCMD_SUCCESS) {
6337 dd_dev_err(dd,
6338 "Failed to transition to Offline link state, return %d\n",
6339 ret);
6340 return -EINVAL;
6341 }
6342 if (ppd->offline_disabled_reason == OPA_LINKDOWN_REASON_NONE)
6343 ppd->offline_disabled_reason =
6344 OPA_LINKDOWN_REASON_TRANSIENT;
6345 }
6346
6347 if (do_wait) {
6348 /* it can take a while for the link to go down */
6349		ret = wait_phy_linkstate(dd, PLS_OFFLINE, 10000);
6350		if (ret < 0)
6351 return ret;
6352 }
6353
6354 /* make sure the logical state is also down */
6355 wait_logical_linkstate(ppd, IB_PORT_DOWN, 1000);
6356
6357 /*
6358 * Now in charge of LCB - must be after the physical state is
6359 * offline.quiet and before host_link_state is changed.
6360 */
6361 set_host_lcb_access(dd);
6362 write_csr(dd, DC_LCB_ERR_EN, ~0ull); /* watch LCB errors */
6363 ppd->host_link_state = HLS_LINK_COOLDOWN; /* LCB access allowed */
6364
6365 /*
6366 * The LNI has a mandatory wait time after the physical state
6367 * moves to Offline.Quiet. The wait time may be different
6368 * depending on how the link went down. The 8051 firmware
6369 * will observe the needed wait time and only move to ready
6370 * when that is completed. The largest of the quiet timeouts
6371 * is 2.5s, so wait that long and then a bit more.
6372 */
6373 ret = wait_fm_ready(dd, 3000);
6374 if (ret) {
6375 dd_dev_err(dd,
6376 "After going offline, timed out waiting for the 8051 to become ready to accept host requests\n");
6377 /* state is really offline, so make it so */
6378 ppd->host_link_state = HLS_DN_OFFLINE;
6379 return ret;
6380 }
6381
6382 /*
6383 * The state is now offline and the 8051 is ready to accept host
6384 * requests.
6385 * - change our state
6386 * - notify others if we were previously in a linkup state
6387 */
6388 ppd->host_link_state = HLS_DN_OFFLINE;
6389 if (previous_state & HLS_UP) {
6390 /* went down while link was up */
6391 handle_linkup_change(dd, 0);
6392 } else if (previous_state
6393 & (HLS_DN_POLL | HLS_VERIFY_CAP | HLS_GOING_UP)) {
6394 /* went down while attempting link up */
6395 /* byte 1 of last_*_state is the failure reason */
6396 read_last_local_state(dd, &last_local_state);
6397 read_last_remote_state(dd, &last_remote_state);
6398 dd_dev_err(dd,
6399 "LNI failure last states: local 0x%08x, remote 0x%08x\n",
6400 last_local_state, last_remote_state);
6401 }
6402
6403 /* the active link width (downgrade) is 0 on link down */
6404 ppd->link_width_active = 0;
6405 ppd->link_width_downgrade_tx_active = 0;
6406 ppd->link_width_downgrade_rx_active = 0;
6407 ppd->current_egress_rate = 0;
6408 return 0;
6409}
6410
6411/* return the link state name */
6412static const char *link_state_name(u32 state)
6413{
6414 const char *name;
6415 int n = ilog2(state);
6416 static const char * const names[] = {
6417 [__HLS_UP_INIT_BP] = "INIT",
6418 [__HLS_UP_ARMED_BP] = "ARMED",
6419 [__HLS_UP_ACTIVE_BP] = "ACTIVE",
6420 [__HLS_DN_DOWNDEF_BP] = "DOWNDEF",
6421 [__HLS_DN_POLL_BP] = "POLL",
6422 [__HLS_DN_DISABLE_BP] = "DISABLE",
6423 [__HLS_DN_OFFLINE_BP] = "OFFLINE",
6424 [__HLS_VERIFY_CAP_BP] = "VERIFY_CAP",
6425 [__HLS_GOING_UP_BP] = "GOING_UP",
6426 [__HLS_GOING_OFFLINE_BP] = "GOING_OFFLINE",
6427 [__HLS_LINK_COOLDOWN_BP] = "LINK_COOLDOWN"
6428 };
6429
6430 name = n < ARRAY_SIZE(names) ? names[n] : NULL;
6431 return name ? name : "unknown";
6432}
6433
6434/* return the link state reason name */
6435static const char *link_state_reason_name(struct hfi1_pportdata *ppd, u32 state)
6436{
6437 if (state == HLS_UP_INIT) {
6438 switch (ppd->linkinit_reason) {
6439 case OPA_LINKINIT_REASON_LINKUP:
6440 return "(LINKUP)";
6441 case OPA_LINKINIT_REASON_FLAPPING:
6442 return "(FLAPPING)";
6443 case OPA_LINKINIT_OUTSIDE_POLICY:
6444 return "(OUTSIDE_POLICY)";
6445 case OPA_LINKINIT_QUARANTINED:
6446 return "(QUARANTINED)";
6447 case OPA_LINKINIT_INSUFIC_CAPABILITY:
6448 return "(INSUFIC_CAPABILITY)";
6449 default:
6450 break;
6451 }
6452 }
6453 return "";
6454}
6455
6456/*
6457 * driver_physical_state - convert the driver's notion of a port's
6458 * state (an HLS_*) into a physical state (a {IB,OPA}_PORTPHYSSTATE_*).
6459 * Return -1 (converted to a u32) to indicate error.
6460 */
6461u32 driver_physical_state(struct hfi1_pportdata *ppd)
6462{
6463 switch (ppd->host_link_state) {
6464 case HLS_UP_INIT:
6465 case HLS_UP_ARMED:
6466 case HLS_UP_ACTIVE:
6467 return IB_PORTPHYSSTATE_LINKUP;
6468 case HLS_DN_POLL:
6469 return IB_PORTPHYSSTATE_POLLING;
6470 case HLS_DN_DISABLE:
6471 return IB_PORTPHYSSTATE_DISABLED;
6472 case HLS_DN_OFFLINE:
6473 return OPA_PORTPHYSSTATE_OFFLINE;
6474 case HLS_VERIFY_CAP:
6475 return IB_PORTPHYSSTATE_POLLING;
6476 case HLS_GOING_UP:
6477 return IB_PORTPHYSSTATE_POLLING;
6478 case HLS_GOING_OFFLINE:
6479 return OPA_PORTPHYSSTATE_OFFLINE;
6480 case HLS_LINK_COOLDOWN:
6481 return OPA_PORTPHYSSTATE_OFFLINE;
6482 case HLS_DN_DOWNDEF:
6483 default:
6484 dd_dev_err(ppd->dd, "invalid host_link_state 0x%x\n",
6485 ppd->host_link_state);
6486 return -1;
6487 }
6488}
6489
6490/*
6491 * driver_logical_state - convert the driver's notion of a port's
6492 * state (an HLS_*) into a logical state (a IB_PORT_*). Return -1
6493 * (converted to a u32) to indicate error.
6494 */
6495u32 driver_logical_state(struct hfi1_pportdata *ppd)
6496{
6497 if (ppd->host_link_state && !(ppd->host_link_state & HLS_UP))
6498 return IB_PORT_DOWN;
6499
6500 switch (ppd->host_link_state & HLS_UP) {
6501 case HLS_UP_INIT:
6502 return IB_PORT_INIT;
6503 case HLS_UP_ARMED:
6504 return IB_PORT_ARMED;
6505 case HLS_UP_ACTIVE:
6506 return IB_PORT_ACTIVE;
6507 default:
6508 dd_dev_err(ppd->dd, "invalid host_link_state 0x%x\n",
6509 ppd->host_link_state);
6510 return -1;
6511 }
6512}
6513
6514void set_link_down_reason(struct hfi1_pportdata *ppd, u8 lcl_reason,
6515 u8 neigh_reason, u8 rem_reason)
6516{
6517 if (ppd->local_link_down_reason.latest == 0 &&
6518 ppd->neigh_link_down_reason.latest == 0) {
6519 ppd->local_link_down_reason.latest = lcl_reason;
6520 ppd->neigh_link_down_reason.latest = neigh_reason;
6521 ppd->remote_link_down_reason = rem_reason;
6522 }
6523}
6524
6525/*
6526 * Change the physical and/or logical link state.
6527 *
6528 * Do not call this routine while inside an interrupt. It contains
6529 * calls to routines that can take multiple seconds to finish.
6530 *
6531 * Returns 0 on success, -errno on failure.
6532 */
6533int set_link_state(struct hfi1_pportdata *ppd, u32 state)
6534{
6535 struct hfi1_devdata *dd = ppd->dd;
6536 struct ib_event event = {.device = NULL};
6537 int ret1, ret = 0;
6538 int was_up, is_down;
6539 int orig_new_state, poll_bounce;
6540
6541 mutex_lock(&ppd->hls_lock);
6542
6543 orig_new_state = state;
6544 if (state == HLS_DN_DOWNDEF)
6545 state = dd->link_default;
6546
6547 /* interpret poll -> poll as a link bounce */
6548 poll_bounce = ppd->host_link_state == HLS_DN_POLL
6549 && state == HLS_DN_POLL;
6550
6551 dd_dev_info(dd, "%s: current %s, new %s %s%s\n", __func__,
6552 link_state_name(ppd->host_link_state),
6553 link_state_name(orig_new_state),
6554 poll_bounce ? "(bounce) " : "",
6555 link_state_reason_name(ppd, state));
6556
6557 was_up = !!(ppd->host_link_state & HLS_UP);
6558
6559 /*
6560 * If we're going to a (HLS_*) link state that implies the logical
6561 * link state is neither of (IB_PORT_ARMED, IB_PORT_ACTIVE), then
6562 * reset is_sm_config_started to 0.
6563 */
6564 if (!(state & (HLS_UP_ARMED | HLS_UP_ACTIVE)))
6565 ppd->is_sm_config_started = 0;
6566
6567 /*
6568 * Do nothing if the states match. Let a poll to poll link bounce
6569 * go through.
6570 */
6571 if (ppd->host_link_state == state && !poll_bounce)
6572 goto done;
6573
6574 switch (state) {
6575 case HLS_UP_INIT:
6576 if (ppd->host_link_state == HLS_DN_POLL && (quick_linkup
6577 || dd->icode == ICODE_FUNCTIONAL_SIMULATOR)) {
6578 /*
6579 * Quick link up jumps from polling to here.
6580 *
6581 * Whether in normal or loopback mode, the
6582 * simulator jumps from polling to link up.
6583 * Accept that here.
6584 */
6585 /* OK */;
6586 } else if (ppd->host_link_state != HLS_GOING_UP) {
6587 goto unexpected;
6588 }
6589
6590 ppd->host_link_state = HLS_UP_INIT;
6591 ret = wait_logical_linkstate(ppd, IB_PORT_INIT, 1000);
6592 if (ret) {
6593 /* logical state didn't change, stay at going_up */
6594 ppd->host_link_state = HLS_GOING_UP;
6595 dd_dev_err(dd,
6596 "%s: logical state did not change to INIT\n",
6597 __func__);
6598 } else {
6599 /* clear old transient LINKINIT_REASON code */
6600 if (ppd->linkinit_reason >= OPA_LINKINIT_REASON_CLEAR)
6601 ppd->linkinit_reason =
6602 OPA_LINKINIT_REASON_LINKUP;
6603
6604 /* enable the port */
6605 add_rcvctrl(dd, RCV_CTRL_RCV_PORT_ENABLE_SMASK);
6606
6607 handle_linkup_change(dd, 1);
6608 }
6609 break;
6610 case HLS_UP_ARMED:
6611 if (ppd->host_link_state != HLS_UP_INIT)
6612 goto unexpected;
6613
6614 ppd->host_link_state = HLS_UP_ARMED;
6615 set_logical_state(dd, LSTATE_ARMED);
6616 ret = wait_logical_linkstate(ppd, IB_PORT_ARMED, 1000);
6617 if (ret) {
6618 /* logical state didn't change, stay at init */
6619 ppd->host_link_state = HLS_UP_INIT;
6620 dd_dev_err(dd,
6621 "%s: logical state did not change to ARMED\n",
6622 __func__);
6623 }
6624 /*
6625 * The simulator does not currently implement SMA messages,
6626 * so neighbor_normal is not set. Set it here when we first
6627 * move to Armed.
6628 */
6629 if (dd->icode == ICODE_FUNCTIONAL_SIMULATOR)
6630 ppd->neighbor_normal = 1;
6631 break;
6632 case HLS_UP_ACTIVE:
6633 if (ppd->host_link_state != HLS_UP_ARMED)
6634 goto unexpected;
6635
6636 ppd->host_link_state = HLS_UP_ACTIVE;
6637 set_logical_state(dd, LSTATE_ACTIVE);
6638 ret = wait_logical_linkstate(ppd, IB_PORT_ACTIVE, 1000);
6639 if (ret) {
6640 /* logical state didn't change, stay at armed */
6641 ppd->host_link_state = HLS_UP_ARMED;
6642 dd_dev_err(dd,
6643 "%s: logical state did not change to ACTIVE\n",
6644 __func__);
6645 } else {
6647 /* tell all engines to go running */
6648 sdma_all_running(dd);
6649
6650			/* Signal the IB layer that the port has gone active */
6651 event.device = &dd->verbs_dev.ibdev;
6652 event.element.port_num = ppd->port;
6653 event.event = IB_EVENT_PORT_ACTIVE;
6654 }
6655 break;
6656 case HLS_DN_POLL:
6657 if ((ppd->host_link_state == HLS_DN_DISABLE ||
6658 ppd->host_link_state == HLS_DN_OFFLINE) &&
6659 dd->dc_shutdown)
6660 dc_start(dd);
6661 /* Hand LED control to the DC */
6662 write_csr(dd, DCC_CFG_LED_CNTRL, 0);
6663
6664 if (ppd->host_link_state != HLS_DN_OFFLINE) {
6665 u8 tmp = ppd->link_enabled;
6666
6667 ret = goto_offline(ppd, ppd->remote_link_down_reason);
6668 if (ret) {
6669 ppd->link_enabled = tmp;
6670 break;
6671 }
6672 ppd->remote_link_down_reason = 0;
6673
6674 if (ppd->driver_link_ready)
6675 ppd->link_enabled = 1;
6676 }
6677
6678 ret = set_local_link_attributes(ppd);
6679 if (ret)
6680 break;
6681
6682 ppd->port_error_action = 0;
6683 ppd->host_link_state = HLS_DN_POLL;
6684
6685 if (quick_linkup) {
6686 /* quick linkup does not go into polling */
6687 ret = do_quick_linkup(dd);
6688 } else {
6689 ret1 = set_physical_link_state(dd, PLS_POLLING);
6690 if (ret1 != HCMD_SUCCESS) {
6691 dd_dev_err(dd,
6692 "Failed to transition to Polling link state, return 0x%x\n",
6693 ret1);
6694 ret = -EINVAL;
6695 }
6696 }
6697 ppd->offline_disabled_reason = OPA_LINKDOWN_REASON_NONE;
6698 /*
6699 * If an error occurred above, go back to offline. The
6700 * caller may reschedule another attempt.
6701 */
6702 if (ret)
6703 goto_offline(ppd, 0);
6704 break;
6705 case HLS_DN_DISABLE:
6706 /* link is disabled */
6707 ppd->link_enabled = 0;
6708
6709 /* allow any state to transition to disabled */
6710
6711 /* must transition to offline first */
6712 if (ppd->host_link_state != HLS_DN_OFFLINE) {
6713 ret = goto_offline(ppd, ppd->remote_link_down_reason);
6714 if (ret)
6715 break;
6716 ppd->remote_link_down_reason = 0;
6717 }
6718
6719 ret1 = set_physical_link_state(dd, PLS_DISABLED);
6720 if (ret1 != HCMD_SUCCESS) {
6721 dd_dev_err(dd,
6722 "Failed to transition to Disabled link state, return 0x%x\n",
6723 ret1);
6724 ret = -EINVAL;
6725 break;
6726 }
6727 ppd->host_link_state = HLS_DN_DISABLE;
6728 dc_shutdown(dd);
6729 break;
6730 case HLS_DN_OFFLINE:
6731 if (ppd->host_link_state == HLS_DN_DISABLE)
6732 dc_start(dd);
6733
6734 /* allow any state to transition to offline */
6735 ret = goto_offline(ppd, ppd->remote_link_down_reason);
6736 if (!ret)
6737 ppd->remote_link_down_reason = 0;
6738 break;
6739 case HLS_VERIFY_CAP:
6740 if (ppd->host_link_state != HLS_DN_POLL)
6741 goto unexpected;
6742 ppd->host_link_state = HLS_VERIFY_CAP;
6743 break;
6744 case HLS_GOING_UP:
6745 if (ppd->host_link_state != HLS_VERIFY_CAP)
6746 goto unexpected;
6747
6748 ret1 = set_physical_link_state(dd, PLS_LINKUP);
6749 if (ret1 != HCMD_SUCCESS) {
6750 dd_dev_err(dd,
6751 "Failed to transition to link up state, return 0x%x\n",
6752 ret1);
6753 ret = -EINVAL;
6754 break;
6755 }
6756 ppd->host_link_state = HLS_GOING_UP;
6757 break;
6758
6759 case HLS_GOING_OFFLINE: /* transient within goto_offline() */
6760 case HLS_LINK_COOLDOWN: /* transient within goto_offline() */
6761 default:
6762 dd_dev_info(dd, "%s: state 0x%x: not supported\n",
6763 __func__, state);
6764 ret = -EINVAL;
6765 break;
6766 }
6767
6768 is_down = !!(ppd->host_link_state & (HLS_DN_POLL |
6769 HLS_DN_DISABLE | HLS_DN_OFFLINE));
6770
6771 if (was_up && is_down && ppd->local_link_down_reason.sma == 0 &&
6772 ppd->neigh_link_down_reason.sma == 0) {
6773 ppd->local_link_down_reason.sma =
6774 ppd->local_link_down_reason.latest;
6775 ppd->neigh_link_down_reason.sma =
6776 ppd->neigh_link_down_reason.latest;
6777 }
6778
6779 goto done;
6780
6781unexpected:
6782 dd_dev_err(dd, "%s: unexpected state transition from %s to %s\n",
6783 __func__, link_state_name(ppd->host_link_state),
6784 link_state_name(state));
6785 ret = -EINVAL;
6786
6787done:
6788 mutex_unlock(&ppd->hls_lock);
6789
6790 if (event.device)
6791 ib_dispatch_event(&event);
6792
6793 return ret;
6794}
6795
6796int hfi1_set_ib_cfg(struct hfi1_pportdata *ppd, int which, u32 val)
6797{
6798 u64 reg;
6799 int ret = 0;
6800
6801 switch (which) {
6802 case HFI1_IB_CFG_LIDLMC:
6803 set_lidlmc(ppd);
6804 break;
6805 case HFI1_IB_CFG_VL_HIGH_LIMIT:
6806 /*
6807 * The VL Arbitrator high limit is sent in units of 4k
6808 * bytes, while HFI stores it in units of 64 bytes.
6809 */
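		/*
		 * Worked example (illustrative values only): an FM value of
		 * 2 means 2 * 4096 = 8192 bytes, which is stored below as
		 * 2 * (4096/64) = 128 units of 64 bytes.
		 */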
6810 val *= 4096/64;
6811 reg = ((u64)val & SEND_HIGH_PRIORITY_LIMIT_LIMIT_MASK)
6812 << SEND_HIGH_PRIORITY_LIMIT_LIMIT_SHIFT;
6813 write_csr(ppd->dd, SEND_HIGH_PRIORITY_LIMIT, reg);
6814 break;
6815 case HFI1_IB_CFG_LINKDEFAULT: /* IB link default (sleep/poll) */
6816 /* HFI only supports POLL as the default link down state */
6817 if (val != HLS_DN_POLL)
6818 ret = -EINVAL;
6819 break;
6820 case HFI1_IB_CFG_OP_VLS:
6821 if (ppd->vls_operational != val) {
6822 ppd->vls_operational = val;
6823 if (!ppd->port)
6824 ret = -EINVAL;
6825 else
6826 ret = sdma_map_init(
6827 ppd->dd,
6828 ppd->port - 1,
6829 val,
6830 NULL);
6831 }
6832 break;
6833 /*
6834 * For link width, link width downgrade, and speed enable, always AND
6835 * the setting with what is actually supported. This has two benefits.
6836 * First, enabled can't have unsupported values, no matter what the
6837 * SM or FM might want. Second, the ALL_SUPPORTED wildcards that mean
6838 * "fill in with your supported value" have all the bits in the
6839 * field set, so simply ANDing with supported has the desired result.
6840 */
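	/*
	 * Illustration with made-up bit masks: if link_width_supported is
	 * 0x3 and the SM requests 0x7, link_width_enabled below becomes
	 * 0x3; the all-ones ALL_SUPPORTED wildcard likewise reduces to 0x3.
	 */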
6841 case HFI1_IB_CFG_LWID_ENB: /* set allowed Link-width */
6842 ppd->link_width_enabled = val & ppd->link_width_supported;
6843 break;
6844 case HFI1_IB_CFG_LWID_DG_ENB: /* set allowed link width downgrade */
6845 ppd->link_width_downgrade_enabled =
6846 val & ppd->link_width_downgrade_supported;
6847 break;
6848 case HFI1_IB_CFG_SPD_ENB: /* allowed Link speeds */
6849 ppd->link_speed_enabled = val & ppd->link_speed_supported;
6850 break;
6851 case HFI1_IB_CFG_OVERRUN_THRESH: /* IB overrun threshold */
6852 /*
6853 * HFI does not follow IB specs, save this value
6854 * so we can report it, if asked.
6855 */
6856 ppd->overrun_threshold = val;
6857 break;
6858 case HFI1_IB_CFG_PHYERR_THRESH: /* IB PHY error threshold */
6859 /*
6860 * HFI does not follow IB specs, save this value
6861 * so we can report it, if asked.
6862 */
6863 ppd->phy_error_threshold = val;
6864 break;
6865
6866 case HFI1_IB_CFG_MTU:
6867 set_send_length(ppd);
6868 break;
6869
6870 case HFI1_IB_CFG_PKEYS:
6871 if (HFI1_CAP_IS_KSET(PKEY_CHECK))
6872 set_partition_keys(ppd);
6873 break;
6874
6875 default:
6876 if (HFI1_CAP_IS_KSET(PRINT_UNIMPL))
6877 dd_dev_info(ppd->dd,
6878 "%s: which %s, val 0x%x: not implemented\n",
6879 __func__, ib_cfg_name(which), val);
6880 break;
6881 }
6882 return ret;
6883}
6884
6885/* begin functions related to vl arbitration table caching */
6886static void init_vl_arb_caches(struct hfi1_pportdata *ppd)
6887{
6888 int i;
6889
6890 BUILD_BUG_ON(VL_ARB_TABLE_SIZE !=
6891 VL_ARB_LOW_PRIO_TABLE_SIZE);
6892 BUILD_BUG_ON(VL_ARB_TABLE_SIZE !=
6893 VL_ARB_HIGH_PRIO_TABLE_SIZE);
6894
6895 /*
6896 * Note that we always return values directly from the
6897 * 'vl_arb_cache' (and do no CSR reads) in response to a
6898 * 'Get(VLArbTable)'. This is obviously correct after a
6899 * 'Set(VLArbTable)', since the cache will then be up to
6900 * date. But it's also correct prior to any 'Set(VLArbTable)'
6901 * since then both the cache, and the relevant h/w registers
6902 * will be zeroed.
6903 */
6904
6905 for (i = 0; i < MAX_PRIO_TABLE; i++)
6906 spin_lock_init(&ppd->vl_arb_cache[i].lock);
6907}
6908
6909/*
6910 * vl_arb_lock_cache
6911 *
6912 * All other vl_arb_* functions should be called only after locking
6913 * the cache.
6914 */
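/*
 * Illustrative usage pattern (this mirrors fm_get_table() below):
 *
 *	vlc = vl_arb_lock_cache(ppd, LO_PRIO_TABLE);
 *	vl_arb_get_cache(vlc, t);
 *	vl_arb_unlock_cache(ppd, LO_PRIO_TABLE);
 */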
6915static inline struct vl_arb_cache *
6916vl_arb_lock_cache(struct hfi1_pportdata *ppd, int idx)
6917{
6918 if (idx != LO_PRIO_TABLE && idx != HI_PRIO_TABLE)
6919 return NULL;
6920 spin_lock(&ppd->vl_arb_cache[idx].lock);
6921 return &ppd->vl_arb_cache[idx];
6922}
6923
6924static inline void vl_arb_unlock_cache(struct hfi1_pportdata *ppd, int idx)
6925{
6926 spin_unlock(&ppd->vl_arb_cache[idx].lock);
6927}
6928
6929static void vl_arb_get_cache(struct vl_arb_cache *cache,
6930 struct ib_vl_weight_elem *vl)
6931{
6932 memcpy(vl, cache->table, VL_ARB_TABLE_SIZE * sizeof(*vl));
6933}
6934
6935static void vl_arb_set_cache(struct vl_arb_cache *cache,
6936 struct ib_vl_weight_elem *vl)
6937{
6938 memcpy(cache->table, vl, VL_ARB_TABLE_SIZE * sizeof(*vl));
6939}
6940
6941static int vl_arb_match_cache(struct vl_arb_cache *cache,
6942 struct ib_vl_weight_elem *vl)
6943{
6944 return !memcmp(cache->table, vl, VL_ARB_TABLE_SIZE * sizeof(*vl));
6945}
6946/* end functions related to vl arbitration table caching */
6947
6948static int set_vl_weights(struct hfi1_pportdata *ppd, u32 target,
6949 u32 size, struct ib_vl_weight_elem *vl)
6950{
6951 struct hfi1_devdata *dd = ppd->dd;
6952 u64 reg;
6953 unsigned int i, is_up = 0;
6954 int drain, ret = 0;
6955
6956 mutex_lock(&ppd->hls_lock);
6957
6958 if (ppd->host_link_state & HLS_UP)
6959 is_up = 1;
6960
6961 drain = !is_ax(dd) && is_up;
6962
6963 if (drain)
6964 /*
6965 * Before adjusting VL arbitration weights, empty per-VL
6966 * FIFOs, otherwise a packet whose VL weight is being
6967 * set to 0 could get stuck in a FIFO with no chance to
6968 * egress.
6969 */
6970 ret = stop_drain_data_vls(dd);
6971
6972 if (ret) {
6973 dd_dev_err(
6974 dd,
6975 "%s: cannot stop/drain VLs - refusing to change VL arbitration weights\n",
6976 __func__);
6977 goto err;
6978 }
6979
6980 for (i = 0; i < size; i++, vl++) {
6981 /*
6982 * NOTE: The low priority shift and mask are used here, but
6983 * they are the same for both the low and high registers.
6984 */
6985 reg = (((u64)vl->vl & SEND_LOW_PRIORITY_LIST_VL_MASK)
6986 << SEND_LOW_PRIORITY_LIST_VL_SHIFT)
6987 | (((u64)vl->weight
6988 & SEND_LOW_PRIORITY_LIST_WEIGHT_MASK)
6989 << SEND_LOW_PRIORITY_LIST_WEIGHT_SHIFT);
6990 write_csr(dd, target + (i * 8), reg);
6991 }
6992 pio_send_control(dd, PSC_GLOBAL_VLARB_ENABLE);
6993
6994 if (drain)
6995 open_fill_data_vls(dd); /* reopen all VLs */
6996
6997err:
6998 mutex_unlock(&ppd->hls_lock);
6999
7000 return ret;
7001}
7002
7003/*
7004 * Read one credit merge VL register.
7005 */
7006static void read_one_cm_vl(struct hfi1_devdata *dd, u32 csr,
7007 struct vl_limit *vll)
7008{
7009 u64 reg = read_csr(dd, csr);
7010
7011 vll->dedicated = cpu_to_be16(
7012 (reg >> SEND_CM_CREDIT_VL_DEDICATED_LIMIT_VL_SHIFT)
7013 & SEND_CM_CREDIT_VL_DEDICATED_LIMIT_VL_MASK);
7014 vll->shared = cpu_to_be16(
7015 (reg >> SEND_CM_CREDIT_VL_SHARED_LIMIT_VL_SHIFT)
7016 & SEND_CM_CREDIT_VL_SHARED_LIMIT_VL_MASK);
7017}
7018
7019/*
7020 * Read the current credit merge limits.
7021 */
7022static int get_buffer_control(struct hfi1_devdata *dd,
7023 struct buffer_control *bc, u16 *overall_limit)
7024{
7025 u64 reg;
7026 int i;
7027
7028 /* not all entries are filled in */
7029 memset(bc, 0, sizeof(*bc));
7030
7031 /* OPA and HFI have a 1-1 mapping */
7032 for (i = 0; i < TXE_NUM_DATA_VL; i++)
7033 read_one_cm_vl(dd, SEND_CM_CREDIT_VL + (8*i), &bc->vl[i]);
7034
7035 /* NOTE: assumes that VL* and VL15 CSRs are bit-wise identical */
7036 read_one_cm_vl(dd, SEND_CM_CREDIT_VL15, &bc->vl[15]);
7037
7038 reg = read_csr(dd, SEND_CM_GLOBAL_CREDIT);
7039 bc->overall_shared_limit = cpu_to_be16(
7040 (reg >> SEND_CM_GLOBAL_CREDIT_SHARED_LIMIT_SHIFT)
7041 & SEND_CM_GLOBAL_CREDIT_SHARED_LIMIT_MASK);
7042 if (overall_limit)
7043 *overall_limit = (reg
7044 >> SEND_CM_GLOBAL_CREDIT_TOTAL_CREDIT_LIMIT_SHIFT)
7045 & SEND_CM_GLOBAL_CREDIT_TOTAL_CREDIT_LIMIT_MASK;
7046 return sizeof(struct buffer_control);
7047}
7048
7049static int get_sc2vlnt(struct hfi1_devdata *dd, struct sc2vlnt *dp)
7050{
7051 u64 reg;
7052 int i;
7053
7054 /* each register contains 16 SC->VLnt mappings, 4 bits each */
7055 reg = read_csr(dd, DCC_CFG_SC_VL_TABLE_15_0);
7056 for (i = 0; i < sizeof(u64); i++) {
7057 u8 byte = *(((u8 *)&reg) + i);
7058
7059 dp->vlnt[2 * i] = byte & 0xf;
7060 dp->vlnt[(2 * i) + 1] = (byte & 0xf0) >> 4;
7061 }
7062
7063 reg = read_csr(dd, DCC_CFG_SC_VL_TABLE_31_16);
7064 for (i = 0; i < sizeof(u64); i++) {
7065 u8 byte = *(((u8 *)&reg) + i);
7066
7067 dp->vlnt[16 + (2 * i)] = byte & 0xf;
7068 dp->vlnt[16 + (2 * i) + 1] = (byte & 0xf0) >> 4;
7069 }
7070 return sizeof(struct sc2vlnt);
7071}
7072
7073static void get_vlarb_preempt(struct hfi1_devdata *dd, u32 nelems,
7074 struct ib_vl_weight_elem *vl)
7075{
7076 unsigned int i;
7077
7078 for (i = 0; i < nelems; i++, vl++) {
7079 vl->vl = 0xf;
7080 vl->weight = 0;
7081 }
7082}
7083
7084static void set_sc2vlnt(struct hfi1_devdata *dd, struct sc2vlnt *dp)
7085{
7086 write_csr(dd, DCC_CFG_SC_VL_TABLE_15_0,
7087 DC_SC_VL_VAL(15_0,
7088 0, dp->vlnt[0] & 0xf,
7089 1, dp->vlnt[1] & 0xf,
7090 2, dp->vlnt[2] & 0xf,
7091 3, dp->vlnt[3] & 0xf,
7092 4, dp->vlnt[4] & 0xf,
7093 5, dp->vlnt[5] & 0xf,
7094 6, dp->vlnt[6] & 0xf,
7095 7, dp->vlnt[7] & 0xf,
7096 8, dp->vlnt[8] & 0xf,
7097 9, dp->vlnt[9] & 0xf,
7098 10, dp->vlnt[10] & 0xf,
7099 11, dp->vlnt[11] & 0xf,
7100 12, dp->vlnt[12] & 0xf,
7101 13, dp->vlnt[13] & 0xf,
7102 14, dp->vlnt[14] & 0xf,
7103 15, dp->vlnt[15] & 0xf));
7104 write_csr(dd, DCC_CFG_SC_VL_TABLE_31_16,
7105 DC_SC_VL_VAL(31_16,
7106 16, dp->vlnt[16] & 0xf,
7107 17, dp->vlnt[17] & 0xf,
7108 18, dp->vlnt[18] & 0xf,
7109 19, dp->vlnt[19] & 0xf,
7110 20, dp->vlnt[20] & 0xf,
7111 21, dp->vlnt[21] & 0xf,
7112 22, dp->vlnt[22] & 0xf,
7113 23, dp->vlnt[23] & 0xf,
7114 24, dp->vlnt[24] & 0xf,
7115 25, dp->vlnt[25] & 0xf,
7116 26, dp->vlnt[26] & 0xf,
7117 27, dp->vlnt[27] & 0xf,
7118 28, dp->vlnt[28] & 0xf,
7119 29, dp->vlnt[29] & 0xf,
7120 30, dp->vlnt[30] & 0xf,
7121 31, dp->vlnt[31] & 0xf));
7122}
7123
7124static void nonzero_msg(struct hfi1_devdata *dd, int idx, const char *what,
7125 u16 limit)
7126{
7127 if (limit != 0)
7128 dd_dev_info(dd, "Invalid %s limit %d on VL %d, ignoring\n",
7129 what, (int)limit, idx);
7130}
7131
7132/* change only the shared limit portion of SendCmGlobalCredit */
7133static void set_global_shared(struct hfi1_devdata *dd, u16 limit)
7134{
7135 u64 reg;
7136
7137 reg = read_csr(dd, SEND_CM_GLOBAL_CREDIT);
7138 reg &= ~SEND_CM_GLOBAL_CREDIT_SHARED_LIMIT_SMASK;
7139 reg |= (u64)limit << SEND_CM_GLOBAL_CREDIT_SHARED_LIMIT_SHIFT;
7140 write_csr(dd, SEND_CM_GLOBAL_CREDIT, reg);
7141}
7142
7143/* change only the total credit limit portion of SendCmGlobalCredit */
7144static void set_global_limit(struct hfi1_devdata *dd, u16 limit)
7145{
7146 u64 reg;
7147
7148 reg = read_csr(dd, SEND_CM_GLOBAL_CREDIT);
7149 reg &= ~SEND_CM_GLOBAL_CREDIT_TOTAL_CREDIT_LIMIT_SMASK;
7150 reg |= (u64)limit << SEND_CM_GLOBAL_CREDIT_TOTAL_CREDIT_LIMIT_SHIFT;
7151 write_csr(dd, SEND_CM_GLOBAL_CREDIT, reg);
7152}
7153
7154/* set the given per-VL shared limit */
7155static void set_vl_shared(struct hfi1_devdata *dd, int vl, u16 limit)
7156{
7157 u64 reg;
7158 u32 addr;
7159
7160 if (vl < TXE_NUM_DATA_VL)
7161 addr = SEND_CM_CREDIT_VL + (8 * vl);
7162 else
7163 addr = SEND_CM_CREDIT_VL15;
7164
7165 reg = read_csr(dd, addr);
7166 reg &= ~SEND_CM_CREDIT_VL_SHARED_LIMIT_VL_SMASK;
7167 reg |= (u64)limit << SEND_CM_CREDIT_VL_SHARED_LIMIT_VL_SHIFT;
7168 write_csr(dd, addr, reg);
7169}
7170
7171/* set the given per-VL dedicated limit */
7172static void set_vl_dedicated(struct hfi1_devdata *dd, int vl, u16 limit)
7173{
7174 u64 reg;
7175 u32 addr;
7176
7177 if (vl < TXE_NUM_DATA_VL)
7178 addr = SEND_CM_CREDIT_VL + (8 * vl);
7179 else
7180 addr = SEND_CM_CREDIT_VL15;
7181
7182 reg = read_csr(dd, addr);
7183 reg &= ~SEND_CM_CREDIT_VL_DEDICATED_LIMIT_VL_SMASK;
7184 reg |= (u64)limit << SEND_CM_CREDIT_VL_DEDICATED_LIMIT_VL_SHIFT;
7185 write_csr(dd, addr, reg);
7186}
7187
7188/* spin until the given per-VL status mask bits clear */
7189static void wait_for_vl_status_clear(struct hfi1_devdata *dd, u64 mask,
7190 const char *which)
7191{
7192 unsigned long timeout;
7193 u64 reg;
7194
7195 timeout = jiffies + msecs_to_jiffies(VL_STATUS_CLEAR_TIMEOUT);
7196 while (1) {
7197 reg = read_csr(dd, SEND_CM_CREDIT_USED_STATUS) & mask;
7198
7199 if (reg == 0)
7200 return; /* success */
7201 if (time_after(jiffies, timeout))
7202 break; /* timed out */
7203 udelay(1);
7204 }
7205
7206 dd_dev_err(dd,
7207 "%s credit change status not clearing after %dms, mask 0x%llx, not clear 0x%llx\n",
7208 which, VL_STATUS_CLEAR_TIMEOUT, mask, reg);
7209 /*
7210 * If this occurs, it is likely there was a credit loss on the link.
7211 * The only recovery from that is a link bounce.
7212 */
7213 dd_dev_err(dd,
7214 "Continuing anyway. A credit loss may occur. Suggest a link bounce\n");
7215}
7216
7217/*
7218 * The number of credits on the VLs may be changed while everything
7219 * is "live", but the following algorithm must be followed due to
7220 * how the hardware is actually implemented. In particular,
7221 * Return_Credit_Status[] is the only correct status check.
7222 *
7223 * if (reducing Global_Shared_Credit_Limit or any shared limit changing)
7224 * set Global_Shared_Credit_Limit = 0
7225 * use_all_vl = 1
7226 * mask0 = all VLs that are changing either dedicated or shared limits
7227 * set Shared_Limit[mask0] = 0
7228 * spin until Return_Credit_Status[use_all_vl ? all VL : mask0] == 0
7229 * if (changing any dedicated limit)
7230 * mask1 = all VLs that are lowering dedicated limits
7231 * lower Dedicated_Limit[mask1]
7232 * spin until Return_Credit_Status[mask1] == 0
7233 * raise Dedicated_Limits
7234 * raise Shared_Limits
7235 * raise Global_Shared_Credit_Limit
7236 *
7237 * lower = if the new limit is lower, set the limit to the new value
7238 * raise = if the new limit is higher than the current value (may be changed
7239 * earlier in the algorithm), set the new limit to the new value
7240 */
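/*
 * Reading aid (restating the algorithm above, not additional behavior):
 * set_buffer_control() zeroes the shared limits of all changing VLs and
 * waits on Return_Credit_Status, lowers any shrinking dedicated limits and
 * waits again, then raises dedicated, shared, and global limits in that
 * order, bracketing the whole change with the total credit limit.
 */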
7241static int set_buffer_control(struct hfi1_devdata *dd,
7242 struct buffer_control *new_bc)
7243{
7244 u64 changing_mask, ld_mask, stat_mask;
7245 int change_count;
7246 int i, use_all_mask;
7247 int this_shared_changing;
7248 /*
7249 * A0: add the variable any_shared_limit_changing below and in the
7250 * algorithm above. If removing A0 support, it can be removed.
7251 */
7252 int any_shared_limit_changing;
7253 struct buffer_control cur_bc;
7254 u8 changing[OPA_MAX_VLS];
7255 u8 lowering_dedicated[OPA_MAX_VLS];
7256 u16 cur_total;
7257 u32 new_total = 0;
7258 const u64 all_mask =
7259 SEND_CM_CREDIT_USED_STATUS_VL0_RETURN_CREDIT_STATUS_SMASK
7260 | SEND_CM_CREDIT_USED_STATUS_VL1_RETURN_CREDIT_STATUS_SMASK
7261 | SEND_CM_CREDIT_USED_STATUS_VL2_RETURN_CREDIT_STATUS_SMASK
7262 | SEND_CM_CREDIT_USED_STATUS_VL3_RETURN_CREDIT_STATUS_SMASK
7263 | SEND_CM_CREDIT_USED_STATUS_VL4_RETURN_CREDIT_STATUS_SMASK
7264 | SEND_CM_CREDIT_USED_STATUS_VL5_RETURN_CREDIT_STATUS_SMASK
7265 | SEND_CM_CREDIT_USED_STATUS_VL6_RETURN_CREDIT_STATUS_SMASK
7266 | SEND_CM_CREDIT_USED_STATUS_VL7_RETURN_CREDIT_STATUS_SMASK
7267 | SEND_CM_CREDIT_USED_STATUS_VL15_RETURN_CREDIT_STATUS_SMASK;
7268
7269#define valid_vl(idx) ((idx) < TXE_NUM_DATA_VL || (idx) == 15)
7270#define NUM_USABLE_VLS 16 /* look at VL15 and less */
7271
7272
7273 /* find the new total credits, do sanity check on unused VLs */
7274 for (i = 0; i < OPA_MAX_VLS; i++) {
7275 if (valid_vl(i)) {
7276 new_total += be16_to_cpu(new_bc->vl[i].dedicated);
7277 continue;
7278 }
7279 nonzero_msg(dd, i, "dedicated",
7280 be16_to_cpu(new_bc->vl[i].dedicated));
7281 nonzero_msg(dd, i, "shared",
7282 be16_to_cpu(new_bc->vl[i].shared));
7283 new_bc->vl[i].dedicated = 0;
7284 new_bc->vl[i].shared = 0;
7285 }
7286 new_total += be16_to_cpu(new_bc->overall_shared_limit);
7287 if (new_total > (u32)dd->link_credits)
7288 return -EINVAL;
7289 /* fetch the current values */
7290 get_buffer_control(dd, &cur_bc, &cur_total);
7291
7292 /*
7293 * Create the masks we will use.
7294 */
7295 memset(changing, 0, sizeof(changing));
7296 memset(lowering_dedicated, 0, sizeof(lowering_dedicated));
7297 /* NOTE: Assumes that the individual VL bits are adjacent and in
7298 increasing order */
7299 stat_mask =
7300 SEND_CM_CREDIT_USED_STATUS_VL0_RETURN_CREDIT_STATUS_SMASK;
7301 changing_mask = 0;
7302 ld_mask = 0;
7303 change_count = 0;
7304 any_shared_limit_changing = 0;
7305 for (i = 0; i < NUM_USABLE_VLS; i++, stat_mask <<= 1) {
7306 if (!valid_vl(i))
7307 continue;
7308 this_shared_changing = new_bc->vl[i].shared
7309 != cur_bc.vl[i].shared;
7310 if (this_shared_changing)
7311 any_shared_limit_changing = 1;
7312 if (new_bc->vl[i].dedicated != cur_bc.vl[i].dedicated
7313 || this_shared_changing) {
7314 changing[i] = 1;
7315 changing_mask |= stat_mask;
7316 change_count++;
7317 }
7318 if (be16_to_cpu(new_bc->vl[i].dedicated) <
7319 be16_to_cpu(cur_bc.vl[i].dedicated)) {
7320 lowering_dedicated[i] = 1;
7321 ld_mask |= stat_mask;
7322 }
7323 }
7324
7325 /* bracket the credit change with a total adjustment */
7326 if (new_total > cur_total)
7327 set_global_limit(dd, new_total);
7328
7329 /*
7330 * Start the credit change algorithm.
7331 */
7332 use_all_mask = 0;
7333 if ((be16_to_cpu(new_bc->overall_shared_limit) <
7334 be16_to_cpu(cur_bc.overall_shared_limit))
7335 || (is_a0(dd) && any_shared_limit_changing)) {
7336 set_global_shared(dd, 0);
7337 cur_bc.overall_shared_limit = 0;
7338 use_all_mask = 1;
7339 }
7340
7341 for (i = 0; i < NUM_USABLE_VLS; i++) {
7342 if (!valid_vl(i))
7343 continue;
7344
7345 if (changing[i]) {
7346 set_vl_shared(dd, i, 0);
7347 cur_bc.vl[i].shared = 0;
7348 }
7349 }
7350
7351 wait_for_vl_status_clear(dd, use_all_mask ? all_mask : changing_mask,
7352 "shared");
7353
7354 if (change_count > 0) {
7355 for (i = 0; i < NUM_USABLE_VLS; i++) {
7356 if (!valid_vl(i))
7357 continue;
7358
7359 if (lowering_dedicated[i]) {
7360 set_vl_dedicated(dd, i,
7361 be16_to_cpu(new_bc->vl[i].dedicated));
7362 cur_bc.vl[i].dedicated =
7363 new_bc->vl[i].dedicated;
7364 }
7365 }
7366
7367 wait_for_vl_status_clear(dd, ld_mask, "dedicated");
7368
7369 /* now raise all dedicated that are going up */
7370 for (i = 0; i < NUM_USABLE_VLS; i++) {
7371 if (!valid_vl(i))
7372 continue;
7373
7374 if (be16_to_cpu(new_bc->vl[i].dedicated) >
7375 be16_to_cpu(cur_bc.vl[i].dedicated))
7376 set_vl_dedicated(dd, i,
7377 be16_to_cpu(new_bc->vl[i].dedicated));
7378 }
7379 }
7380
7381 /* next raise all shared that are going up */
7382 for (i = 0; i < NUM_USABLE_VLS; i++) {
7383 if (!valid_vl(i))
7384 continue;
7385
7386 if (be16_to_cpu(new_bc->vl[i].shared) >
7387 be16_to_cpu(cur_bc.vl[i].shared))
7388 set_vl_shared(dd, i, be16_to_cpu(new_bc->vl[i].shared));
7389 }
7390
7391 /* finally raise the global shared */
7392 if (be16_to_cpu(new_bc->overall_shared_limit) >
7393 be16_to_cpu(cur_bc.overall_shared_limit))
7394 set_global_shared(dd,
7395 be16_to_cpu(new_bc->overall_shared_limit));
7396
7397 /* bracket the credit change with a total adjustment */
7398 if (new_total < cur_total)
7399 set_global_limit(dd, new_total);
7400 return 0;
7401}
7402
7403/*
7404 * Read the given fabric manager table. Return the size of the
7405 * table (in bytes) on success, and a negative error code on
7406 * failure.
7407 */
7408int fm_get_table(struct hfi1_pportdata *ppd, int which, void *t)
7410{
7411 int size;
7412 struct vl_arb_cache *vlc;
7413
7414 switch (which) {
7415 case FM_TBL_VL_HIGH_ARB:
7416 size = 256;
7417 /*
7418 * OPA specifies 128 elements (of 2 bytes each), though
7419 * HFI supports only 16 elements in h/w.
7420 */
7421 vlc = vl_arb_lock_cache(ppd, HI_PRIO_TABLE);
7422 vl_arb_get_cache(vlc, t);
7423 vl_arb_unlock_cache(ppd, HI_PRIO_TABLE);
7424 break;
7425 case FM_TBL_VL_LOW_ARB:
7426 size = 256;
7427 /*
7428 * OPA specifies 128 elements (of 2 bytes each), though
7429 * HFI supports only 16 elements in h/w.
7430 */
7431 vlc = vl_arb_lock_cache(ppd, LO_PRIO_TABLE);
7432 vl_arb_get_cache(vlc, t);
7433 vl_arb_unlock_cache(ppd, LO_PRIO_TABLE);
7434 break;
7435 case FM_TBL_BUFFER_CONTROL:
7436 size = get_buffer_control(ppd->dd, t, NULL);
7437 break;
7438 case FM_TBL_SC2VLNT:
7439 size = get_sc2vlnt(ppd->dd, t);
7440 break;
7441 case FM_TBL_VL_PREEMPT_ELEMS:
7442 size = 256;
7443 /* OPA specifies 128 elements, of 2 bytes each */
7444 get_vlarb_preempt(ppd->dd, OPA_MAX_VLS, t);
7445 break;
7446 case FM_TBL_VL_PREEMPT_MATRIX:
7447 size = 256;
7448 /*
7449 * OPA specifies that this is the same size as the VL
7450 * arbitration tables (i.e., 256 bytes).
7451 */
7452 break;
7453 default:
7454 return -EINVAL;
7455 }
7456 return size;
7457}
7458
7459/*
7460 * Write the given fabric manager table.
7461 */
7462int fm_set_table(struct hfi1_pportdata *ppd, int which, void *t)
7463{
7464 int ret = 0;
7465 struct vl_arb_cache *vlc;
7466
7467 switch (which) {
7468 case FM_TBL_VL_HIGH_ARB:
7469 vlc = vl_arb_lock_cache(ppd, HI_PRIO_TABLE);
7470 if (vl_arb_match_cache(vlc, t)) {
7471 vl_arb_unlock_cache(ppd, HI_PRIO_TABLE);
7472 break;
7473 }
7474 vl_arb_set_cache(vlc, t);
7475 vl_arb_unlock_cache(ppd, HI_PRIO_TABLE);
7476 ret = set_vl_weights(ppd, SEND_HIGH_PRIORITY_LIST,
7477 VL_ARB_HIGH_PRIO_TABLE_SIZE, t);
7478 break;
7479 case FM_TBL_VL_LOW_ARB:
7480 vlc = vl_arb_lock_cache(ppd, LO_PRIO_TABLE);
7481 if (vl_arb_match_cache(vlc, t)) {
7482 vl_arb_unlock_cache(ppd, LO_PRIO_TABLE);
7483 break;
7484 }
7485 vl_arb_set_cache(vlc, t);
7486 vl_arb_unlock_cache(ppd, LO_PRIO_TABLE);
7487 ret = set_vl_weights(ppd, SEND_LOW_PRIORITY_LIST,
7488 VL_ARB_LOW_PRIO_TABLE_SIZE, t);
7489 break;
7490 case FM_TBL_BUFFER_CONTROL:
7491 ret = set_buffer_control(ppd->dd, t);
7492 break;
7493 case FM_TBL_SC2VLNT:
7494 set_sc2vlnt(ppd->dd, t);
7495 break;
7496 default:
7497 ret = -EINVAL;
7498 }
7499 return ret;
7500}
7501
7502/*
7503 * Disable all data VLs.
7504 *
7505 * Return 0 if disabled, non-zero if the VLs cannot be disabled.
7506 */
7507static int disable_data_vls(struct hfi1_devdata *dd)
7508{
7509 if (is_a0(dd))
7510 return 1;
7511
7512 pio_send_control(dd, PSC_DATA_VL_DISABLE);
7513
7514 return 0;
7515}
7516
7517/*
7518 * open_fill_data_vls() - the counterpart to stop_drain_data_vls().
7519 * Just re-enables all data VLs (the "fill" part happens
7520 * automatically - the name was chosen for symmetry with
7521 * stop_drain_data_vls()).
7522 *
7523 * Return 0 if successful, non-zero if the VLs cannot be enabled.
7524 */
7525int open_fill_data_vls(struct hfi1_devdata *dd)
7526{
7527 if (is_a0(dd))
7528 return 1;
7529
7530 pio_send_control(dd, PSC_DATA_VL_ENABLE);
7531
7532 return 0;
7533}
7534
7535/*
7536 * drain_data_vls() - assumes that disable_data_vls() has been called;
7537 * waits for the occupancy of the per-VL FIFOs (for all contexts) and the
7538 * SDMA engines to drop to 0.
7539 */
7540static void drain_data_vls(struct hfi1_devdata *dd)
7541{
7542 sc_wait(dd);
7543 sdma_wait(dd);
7544 pause_for_credit_return(dd);
7545}
7546
7547/*
7548 * stop_drain_data_vls() - disable, then drain all per-VL fifos.
7549 *
7550 * Use open_fill_data_vls() to resume using data VLs. This pair is
7551 * meant to be used like this:
7552 *
7553 * stop_drain_data_vls(dd);
7554 * // do things with per-VL resources
7555 * open_fill_data_vls(dd);
7556 */
7557int stop_drain_data_vls(struct hfi1_devdata *dd)
7558{
7559 int ret;
7560
7561 ret = disable_data_vls(dd);
7562 if (ret == 0)
7563 drain_data_vls(dd);
7564
7565 return ret;
7566}
7567
7568/*
7569 * Convert a nanosecond time to a cclock count. No matter how slow
7570 * the cclock, a non-zero ns will always have a non-zero result.
7571 */
7572u32 ns_to_cclock(struct hfi1_devdata *dd, u32 ns)
7573{
7574 u32 cclocks;
7575
7576 if (dd->icode == ICODE_FPGA_EMULATION)
7577 cclocks = (ns * 1000) / FPGA_CCLOCK_PS;
7578 else /* simulation pretends to be ASIC */
7579 cclocks = (ns * 1000) / ASIC_CCLOCK_PS;
7580 if (ns && !cclocks) /* if ns nonzero, must be at least 1 */
7581 cclocks = 1;
7582 return cclocks;
7583}
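/*
 * Worked example with a hypothetical cclock period of 1000 ps (the real
 * period comes from ASIC_CCLOCK_PS or FPGA_CCLOCK_PS used above):
 * ns_to_cclock(dd, 824) would return (824 * 1000) / 1000 = 824 cclocks.
 * The final check guarantees that any non-zero ns yields at least 1 cclock,
 * no matter how long the period.
 */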
7584
7585/*
7586 * Convert a cclock count to nanoseconds. No matter how slow
7587 * the cclock, a non-zero cclocks will always have a non-zero result.
7588 */
7589u32 cclock_to_ns(struct hfi1_devdata *dd, u32 cclocks)
7590{
7591 u32 ns;
7592
7593 if (dd->icode == ICODE_FPGA_EMULATION)
7594 ns = (cclocks * FPGA_CCLOCK_PS) / 1000;
7595 else /* simulation pretends to be ASIC */
7596 ns = (cclocks * ASIC_CCLOCK_PS) / 1000;
7597 if (cclocks && !ns)
7598 ns = 1;
7599 return ns;
7600}
7601
7602/*
7603 * Dynamically adjust the receive interrupt timeout for a context based on
7604 * incoming packet rate.
7605 *
7606 * NOTE: Dynamic adjustment does not allow rcv_intr_count to be zero.
7607 */
7608static void adjust_rcv_timeout(struct hfi1_ctxtdata *rcd, u32 npkts)
7609{
7610 struct hfi1_devdata *dd = rcd->dd;
7611 u32 timeout = rcd->rcvavail_timeout;
7612
7613 /*
7614 * This algorithm doubles or halves the timeout depending on whether
7615	 * the number of packets received in this interrupt was less than or
7616	 * greater than or equal to the interrupt count.
7617	 *
7618	 * The calculations below do not allow a steady state to be achieved.
7619	 * Only at the endpoints is it possible to have an unchanging
7620 * timeout.
7621 */
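	/*
	 * Illustration (not a spec requirement): with rcv_intr_count = 16,
	 * an interrupt that saw 10 packets halves the timeout, while one
	 * that saw 16 or more doubles it, clamped to
	 * [1, dd->rcv_intr_timeout_csr] by the checks below.
	 */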
7622 if (npkts < rcv_intr_count) {
7623 /*
7624 * Not enough packets arrived before the timeout, adjust
7625 * timeout downward.
7626 */
7627 if (timeout < 2) /* already at minimum? */
7628 return;
7629 timeout >>= 1;
7630 } else {
7631 /*
7632 * More than enough packets arrived before the timeout, adjust
7633 * timeout upward.
7634 */
7635 if (timeout >= dd->rcv_intr_timeout_csr) /* already at max? */
7636 return;
7637 timeout = min(timeout << 1, dd->rcv_intr_timeout_csr);
7638 }
7639
7640 rcd->rcvavail_timeout = timeout;
7641 /* timeout cannot be larger than rcv_intr_timeout_csr which has already
7642 been verified to be in range */
7643 write_kctxt_csr(dd, rcd->ctxt, RCV_AVAIL_TIME_OUT,
7644 (u64)timeout << RCV_AVAIL_TIME_OUT_TIME_OUT_RELOAD_SHIFT);
7645}
7646
7647void update_usrhead(struct hfi1_ctxtdata *rcd, u32 hd, u32 updegr, u32 egrhd,
7648 u32 intr_adjust, u32 npkts)
7649{
7650 struct hfi1_devdata *dd = rcd->dd;
7651 u64 reg;
7652 u32 ctxt = rcd->ctxt;
7653
7654 /*
7655 * Need to write timeout register before updating RcvHdrHead to ensure
7656 * that a new value is used when the HW decides to restart counting.
7657 */
7658 if (intr_adjust)
7659 adjust_rcv_timeout(rcd, npkts);
7660 if (updegr) {
7661 reg = (egrhd & RCV_EGR_INDEX_HEAD_HEAD_MASK)
7662 << RCV_EGR_INDEX_HEAD_HEAD_SHIFT;
7663 write_uctxt_csr(dd, ctxt, RCV_EGR_INDEX_HEAD, reg);
7664 }
7665 mmiowb();
7666 reg = ((u64)rcv_intr_count << RCV_HDR_HEAD_COUNTER_SHIFT) |
7667 (((u64)hd & RCV_HDR_HEAD_HEAD_MASK)
7668 << RCV_HDR_HEAD_HEAD_SHIFT);
7669 write_uctxt_csr(dd, ctxt, RCV_HDR_HEAD, reg);
7670 mmiowb();
7671}
7672
7673u32 hdrqempty(struct hfi1_ctxtdata *rcd)
7674{
7675 u32 head, tail;
7676
7677 head = (read_uctxt_csr(rcd->dd, rcd->ctxt, RCV_HDR_HEAD)
7678 & RCV_HDR_HEAD_HEAD_SMASK) >> RCV_HDR_HEAD_HEAD_SHIFT;
7679
7680 if (rcd->rcvhdrtail_kvaddr)
7681 tail = get_rcvhdrtail(rcd);
7682 else
7683 tail = read_uctxt_csr(rcd->dd, rcd->ctxt, RCV_HDR_TAIL);
7684
7685 return head == tail;
7686}
7687
7688/*
7689 * Context Control and Receive Array encoding for buffer size:
7690 * 0x0 invalid
7691 * 0x1 4 KB
7692 * 0x2 8 KB
7693 * 0x3 16 KB
7694 * 0x4 32 KB
7695 * 0x5 64 KB
7696 * 0x6 128 KB
7697 * 0x7 256 KB
7698 * 0x8 512 KB (Receive Array only)
7699 * 0x9 1 MB (Receive Array only)
7700 * 0xa 2 MB (Receive Array only)
7701 *
7702 * 0xB-0xF - reserved (Receive Array only)
7703 *
7704 *
7705 * This routine assumes that the value has already been sanity checked.
7706 */
7707static u32 encoded_size(u32 size)
7708{
7709 switch (size) {
7710 case 4*1024: return 0x1;
7711 case 8*1024: return 0x2;
7712 case 16*1024: return 0x3;
7713 case 32*1024: return 0x4;
7714 case 64*1024: return 0x5;
7715 case 128*1024: return 0x6;
7716 case 256*1024: return 0x7;
7717 case 512*1024: return 0x8;
7718 case 1*1024*1024: return 0x9;
7719 case 2*1024*1024: return 0xa;
7720 }
7721 return 0x1; /* if invalid, go with the minimum size */
7722}
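/*
 * For reference, hfi1_rcvctrl() below uses this to program the eager buffer
 * size field: per the table above, 64 KB eager buffers encode to 0x5.
 */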
7723
7724void hfi1_rcvctrl(struct hfi1_devdata *dd, unsigned int op, int ctxt)
7725{
7726 struct hfi1_ctxtdata *rcd;
7727 u64 rcvctrl, reg;
7728 int did_enable = 0;
7729
7730 rcd = dd->rcd[ctxt];
7731 if (!rcd)
7732 return;
7733
7734 hfi1_cdbg(RCVCTRL, "ctxt %d op 0x%x", ctxt, op);
7735
7736 rcvctrl = read_kctxt_csr(dd, ctxt, RCV_CTXT_CTRL);
7737 /* if the context already enabled, don't do the extra steps */
7738 if ((op & HFI1_RCVCTRL_CTXT_ENB)
7739 && !(rcvctrl & RCV_CTXT_CTRL_ENABLE_SMASK)) {
7740 /* reset the tail and hdr addresses, and sequence count */
7741 write_kctxt_csr(dd, ctxt, RCV_HDR_ADDR,
7742 rcd->rcvhdrq_phys);
7743 if (HFI1_CAP_KGET_MASK(rcd->flags, DMA_RTAIL))
7744 write_kctxt_csr(dd, ctxt, RCV_HDR_TAIL_ADDR,
7745 rcd->rcvhdrqtailaddr_phys);
7746 rcd->seq_cnt = 1;
7747
7748 /* reset the cached receive header queue head value */
7749 rcd->head = 0;
7750
7751 /*
7752 * Zero the receive header queue so we don't get false
7753 * positives when checking the sequence number. The
7754 * sequence numbers could land exactly on the same spot.
7755 * E.g. a rcd restart before the receive header wrapped.
7756 */
7757 memset(rcd->rcvhdrq, 0, rcd->rcvhdrq_size);
7758
7759 /* starting timeout */
7760 rcd->rcvavail_timeout = dd->rcv_intr_timeout_csr;
7761
7762 /* enable the context */
7763 rcvctrl |= RCV_CTXT_CTRL_ENABLE_SMASK;
7764
7765 /* clean the egr buffer size first */
7766 rcvctrl &= ~RCV_CTXT_CTRL_EGR_BUF_SIZE_SMASK;
7767 rcvctrl |= ((u64)encoded_size(rcd->egrbufs.rcvtid_size)
7768 & RCV_CTXT_CTRL_EGR_BUF_SIZE_MASK)
7769 << RCV_CTXT_CTRL_EGR_BUF_SIZE_SHIFT;
7770
7771 /* zero RcvHdrHead - set RcvHdrHead.Counter after enable */
7772 write_uctxt_csr(dd, ctxt, RCV_HDR_HEAD, 0);
7773 did_enable = 1;
7774
7775 /* zero RcvEgrIndexHead */
7776 write_uctxt_csr(dd, ctxt, RCV_EGR_INDEX_HEAD, 0);
7777
7778 /* set eager count and base index */
7779 reg = (((u64)(rcd->egrbufs.alloced >> RCV_SHIFT)
7780 & RCV_EGR_CTRL_EGR_CNT_MASK)
7781 << RCV_EGR_CTRL_EGR_CNT_SHIFT) |
7782 (((rcd->eager_base >> RCV_SHIFT)
7783 & RCV_EGR_CTRL_EGR_BASE_INDEX_MASK)
7784 << RCV_EGR_CTRL_EGR_BASE_INDEX_SHIFT);
7785 write_kctxt_csr(dd, ctxt, RCV_EGR_CTRL, reg);
7786
7787 /*
7788 * Set TID (expected) count and base index.
7789 * rcd->expected_count is set to individual RcvArray entries,
7790 * not pairs, and the CSR takes a pair-count in groups of
7791 * four, so divide by 8.
7792 */
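		/*
		 * Worked example: an expected_count of 2048 individual
		 * RcvArray entries is programmed as 2048 / 8 = 256 in the
		 * pair-count field below.
		 */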
7793 reg = (((rcd->expected_count >> RCV_SHIFT)
7794 & RCV_TID_CTRL_TID_PAIR_CNT_MASK)
7795 << RCV_TID_CTRL_TID_PAIR_CNT_SHIFT) |
7796 (((rcd->expected_base >> RCV_SHIFT)
7797 & RCV_TID_CTRL_TID_BASE_INDEX_MASK)
7798 << RCV_TID_CTRL_TID_BASE_INDEX_SHIFT);
7799 write_kctxt_csr(dd, ctxt, RCV_TID_CTRL, reg);
7800		if (ctxt == HFI1_CTRL_CTXT)
7801 write_csr(dd, RCV_VL15, HFI1_CTRL_CTXT);
7802	}
7803 if (op & HFI1_RCVCTRL_CTXT_DIS) {
7804 write_csr(dd, RCV_VL15, 0);
7805		/*
7806 * When receive context is being disabled turn on tail
7807 * update with a dummy tail address and then disable
7808 * receive context.
7809 */
7810 if (dd->rcvhdrtail_dummy_physaddr) {
7811 write_kctxt_csr(dd, ctxt, RCV_HDR_TAIL_ADDR,
7812 dd->rcvhdrtail_dummy_physaddr);
7813 rcvctrl |= RCV_CTXT_CTRL_TAIL_UPD_SMASK;
7814 }
7815
7816		rcvctrl &= ~RCV_CTXT_CTRL_ENABLE_SMASK;
7817 }
7818 if (op & HFI1_RCVCTRL_INTRAVAIL_ENB)
7819 rcvctrl |= RCV_CTXT_CTRL_INTR_AVAIL_SMASK;
7820 if (op & HFI1_RCVCTRL_INTRAVAIL_DIS)
7821 rcvctrl &= ~RCV_CTXT_CTRL_INTR_AVAIL_SMASK;
7822 if (op & HFI1_RCVCTRL_TAILUPD_ENB && rcd->rcvhdrqtailaddr_phys)
7823 rcvctrl |= RCV_CTXT_CTRL_TAIL_UPD_SMASK;
7824 if (op & HFI1_RCVCTRL_TAILUPD_DIS)
7825 rcvctrl &= ~RCV_CTXT_CTRL_TAIL_UPD_SMASK;
7826 if (op & HFI1_RCVCTRL_TIDFLOW_ENB)
7827 rcvctrl |= RCV_CTXT_CTRL_TID_FLOW_ENABLE_SMASK;
7828 if (op & HFI1_RCVCTRL_TIDFLOW_DIS)
7829 rcvctrl &= ~RCV_CTXT_CTRL_TID_FLOW_ENABLE_SMASK;
7830 if (op & HFI1_RCVCTRL_ONE_PKT_EGR_ENB) {
7831 /* In one-packet-per-eager mode, the size comes from
7832 the RcvArray entry. */
7833 rcvctrl &= ~RCV_CTXT_CTRL_EGR_BUF_SIZE_SMASK;
7834 rcvctrl |= RCV_CTXT_CTRL_ONE_PACKET_PER_EGR_BUFFER_SMASK;
7835 }
7836 if (op & HFI1_RCVCTRL_ONE_PKT_EGR_DIS)
7837 rcvctrl &= ~RCV_CTXT_CTRL_ONE_PACKET_PER_EGR_BUFFER_SMASK;
7838 if (op & HFI1_RCVCTRL_NO_RHQ_DROP_ENB)
7839 rcvctrl |= RCV_CTXT_CTRL_DONT_DROP_RHQ_FULL_SMASK;
7840 if (op & HFI1_RCVCTRL_NO_RHQ_DROP_DIS)
7841 rcvctrl &= ~RCV_CTXT_CTRL_DONT_DROP_RHQ_FULL_SMASK;
7842 if (op & HFI1_RCVCTRL_NO_EGR_DROP_ENB)
7843 rcvctrl |= RCV_CTXT_CTRL_DONT_DROP_EGR_FULL_SMASK;
7844 if (op & HFI1_RCVCTRL_NO_EGR_DROP_DIS)
7845 rcvctrl &= ~RCV_CTXT_CTRL_DONT_DROP_EGR_FULL_SMASK;
7846 rcd->rcvctrl = rcvctrl;
7847 hfi1_cdbg(RCVCTRL, "ctxt %d rcvctrl 0x%llx\n", ctxt, rcvctrl);
7848 write_kctxt_csr(dd, ctxt, RCV_CTXT_CTRL, rcd->rcvctrl);
7849
7850 /* work around sticky RcvCtxtStatus.BlockedRHQFull */
7851 if (did_enable
7852 && (rcvctrl & RCV_CTXT_CTRL_DONT_DROP_RHQ_FULL_SMASK)) {
7853 reg = read_kctxt_csr(dd, ctxt, RCV_CTXT_STATUS);
7854 if (reg != 0) {
7855 dd_dev_info(dd, "ctxt %d status %lld (blocked)\n",
7856 ctxt, reg);
7857 read_uctxt_csr(dd, ctxt, RCV_HDR_HEAD);
7858 write_uctxt_csr(dd, ctxt, RCV_HDR_HEAD, 0x10);
7859 write_uctxt_csr(dd, ctxt, RCV_HDR_HEAD, 0x00);
7860 read_uctxt_csr(dd, ctxt, RCV_HDR_HEAD);
7861 reg = read_kctxt_csr(dd, ctxt, RCV_CTXT_STATUS);
7862 dd_dev_info(dd, "ctxt %d status %lld (%s blocked)\n",
7863 ctxt, reg, reg == 0 ? "not" : "still");
7864 }
7865 }
7866
7867 if (did_enable) {
7868 /*
7869 * The interrupt timeout and count must be set after
7870 * the context is enabled to take effect.
7871 */
7872 /* set interrupt timeout */
7873 write_kctxt_csr(dd, ctxt, RCV_AVAIL_TIME_OUT,
7874 (u64)rcd->rcvavail_timeout <<
7875 RCV_AVAIL_TIME_OUT_TIME_OUT_RELOAD_SHIFT);
7876
7877 /* set RcvHdrHead.Counter, zero RcvHdrHead.Head (again) */
7878 reg = (u64)rcv_intr_count << RCV_HDR_HEAD_COUNTER_SHIFT;
7879 write_uctxt_csr(dd, ctxt, RCV_HDR_HEAD, reg);
7880 }
7881
7882 if (op & (HFI1_RCVCTRL_TAILUPD_DIS | HFI1_RCVCTRL_CTXT_DIS))
7883 /*
7884 * If the context has been disabled and the Tail Update has
7885		 * been cleared, set the RCV_HDR_TAIL_ADDR CSR to dummy address
7886 * so it doesn't contain an address that is invalid.
7887		 */
7888		write_kctxt_csr(dd, ctxt, RCV_HDR_TAIL_ADDR,
7889 dd->rcvhdrtail_dummy_physaddr);
7890}
7891
7892u32 hfi1_read_cntrs(struct hfi1_devdata *dd, loff_t pos, char **namep,
7893 u64 **cntrp)
7894{
7895 int ret;
7896 u64 val = 0;
7897
7898 if (namep) {
7899 ret = dd->cntrnameslen;
7900 if (pos != 0) {
7901 dd_dev_err(dd, "read_cntrs does not support indexing");
7902 return 0;
7903 }
7904 *namep = dd->cntrnames;
7905 } else {
7906 const struct cntr_entry *entry;
7907 int i, j;
7908
7909 ret = (dd->ndevcntrs) * sizeof(u64);
7910 if (pos != 0) {
7911 dd_dev_err(dd, "read_cntrs does not support indexing");
7912 return 0;
7913 }
7914
7915 /* Get the start of the block of counters */
7916 *cntrp = dd->cntrs;
7917
7918 /*
7919 * Now go and fill in each counter in the block.
7920 */
7921 for (i = 0; i < DEV_CNTR_LAST; i++) {
7922 entry = &dev_cntrs[i];
7923 hfi1_cdbg(CNTR, "reading %s", entry->name);
7924 if (entry->flags & CNTR_DISABLED) {
7925 /* Nothing */
7926 hfi1_cdbg(CNTR, "\tDisabled\n");
7927 } else {
7928 if (entry->flags & CNTR_VL) {
7929 hfi1_cdbg(CNTR, "\tPer VL\n");
7930 for (j = 0; j < C_VL_COUNT; j++) {
7931 val = entry->rw_cntr(entry,
7932 dd, j,
7933 CNTR_MODE_R,
7934 0);
7935 hfi1_cdbg(
7936 CNTR,
7937 "\t\tRead 0x%llx for %d\n",
7938 val, j);
7939 dd->cntrs[entry->offset + j] =
7940 val;
7941 }
7942 } else {
7943 val = entry->rw_cntr(entry, dd,
7944 CNTR_INVALID_VL,
7945 CNTR_MODE_R, 0);
7946 dd->cntrs[entry->offset] = val;
7947 hfi1_cdbg(CNTR, "\tRead 0x%llx", val);
7948 }
7949 }
7950 }
7951 }
7952 return ret;
7953}
7954
7955/*
7956 * Used by sysfs to create files for hfi stats to read
7957 */
7958u32 hfi1_read_portcntrs(struct hfi1_devdata *dd, loff_t pos, u32 port,
7959 char **namep, u64 **cntrp)
7960{
7961 int ret;
7962 u64 val = 0;
7963
7964 if (namep) {
7965 ret = dd->portcntrnameslen;
7966 if (pos != 0) {
7967 dd_dev_err(dd, "index not supported");
7968 return 0;
7969 }
7970 *namep = dd->portcntrnames;
7971 } else {
7972 const struct cntr_entry *entry;
7973 struct hfi1_pportdata *ppd;
7974 int i, j;
7975
7976 ret = (dd->nportcntrs) * sizeof(u64);
7977 if (pos != 0) {
7978 dd_dev_err(dd, "indexing not supported");
7979 return 0;
7980 }
7981 ppd = (struct hfi1_pportdata *)(dd + 1 + port);
7982 *cntrp = ppd->cntrs;
7983
7984 for (i = 0; i < PORT_CNTR_LAST; i++) {
7985 entry = &port_cntrs[i];
7986 hfi1_cdbg(CNTR, "reading %s", entry->name);
7987 if (entry->flags & CNTR_DISABLED) {
7988 /* Nothing */
7989 hfi1_cdbg(CNTR, "\tDisabled\n");
7990 continue;
7991 }
7992
7993 if (entry->flags & CNTR_VL) {
7994 hfi1_cdbg(CNTR, "\tPer VL");
7995 for (j = 0; j < C_VL_COUNT; j++) {
7996 val = entry->rw_cntr(entry, ppd, j,
7997 CNTR_MODE_R,
7998 0);
7999 hfi1_cdbg(
8000 CNTR,
8001 "\t\tRead 0x%llx for %d",
8002 val, j);
8003 ppd->cntrs[entry->offset + j] = val;
8004 }
8005 } else {
8006 val = entry->rw_cntr(entry, ppd,
8007 CNTR_INVALID_VL,
8008 CNTR_MODE_R,
8009 0);
8010 ppd->cntrs[entry->offset] = val;
8011 hfi1_cdbg(CNTR, "\tRead 0x%llx", val);
8012 }
8013 }
8014 }
8015 return ret;
8016}
8017
8018static void free_cntrs(struct hfi1_devdata *dd)
8019{
8020 struct hfi1_pportdata *ppd;
8021 int i;
8022
8023 if (dd->synth_stats_timer.data)
8024 del_timer_sync(&dd->synth_stats_timer);
8025 dd->synth_stats_timer.data = 0;
8026 ppd = (struct hfi1_pportdata *)(dd + 1);
8027 for (i = 0; i < dd->num_pports; i++, ppd++) {
8028 kfree(ppd->cntrs);
8029 kfree(ppd->scntrs);
8030 free_percpu(ppd->ibport_data.rc_acks);
8031 free_percpu(ppd->ibport_data.rc_qacks);
8032 free_percpu(ppd->ibport_data.rc_delayed_comp);
8033 ppd->cntrs = NULL;
8034 ppd->scntrs = NULL;
8035 ppd->ibport_data.rc_acks = NULL;
8036 ppd->ibport_data.rc_qacks = NULL;
8037 ppd->ibport_data.rc_delayed_comp = NULL;
8038 }
8039 kfree(dd->portcntrnames);
8040 dd->portcntrnames = NULL;
8041 kfree(dd->cntrs);
8042 dd->cntrs = NULL;
8043 kfree(dd->scntrs);
8044 dd->scntrs = NULL;
8045 kfree(dd->cntrnames);
8046 dd->cntrnames = NULL;
8047}
8048
8049#define CNTR_MAX 0xFFFFFFFFFFFFFFFFULL
8050#define CNTR_32BIT_MAX 0x00000000FFFFFFFF
8051
8052static u64 read_dev_port_cntr(struct hfi1_devdata *dd, struct cntr_entry *entry,
8053 u64 *psval, void *context, int vl)
8054{
8055 u64 val;
8056 u64 sval = *psval;
8057
8058 if (entry->flags & CNTR_DISABLED) {
8059 dd_dev_err(dd, "Counter %s not enabled", entry->name);
8060 return 0;
8061 }
8062
8063 hfi1_cdbg(CNTR, "cntr: %s vl %d psval 0x%llx", entry->name, vl, *psval);
8064
8065 val = entry->rw_cntr(entry, context, vl, CNTR_MODE_R, 0);
8066
8067	/* If it's a synthetic counter, there is more work we need to do */
8068 if (entry->flags & CNTR_SYNTH) {
8069 if (sval == CNTR_MAX) {
8070 /* No need to read already saturated */
8071 return CNTR_MAX;
8072 }
8073
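		/*
		 * Worked example for the 32-bit wrap handling below: if the
		 * saved value is 0x100000010 (upper = 1, lower = 0x10) and
		 * the hardware now reads 0x8, lower > val indicates a wrap,
		 * so upper becomes 2 and the returned value is 0x200000008.
		 */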
8074 if (entry->flags & CNTR_32BIT) {
8075 /* 32bit counters can wrap multiple times */
8076 u64 upper = sval >> 32;
8077 u64 lower = (sval << 32) >> 32;
8078
8079 if (lower > val) { /* hw wrapped */
8080 if (upper == CNTR_32BIT_MAX)
8081 val = CNTR_MAX;
8082 else
8083 upper++;
8084 }
8085
8086 if (val != CNTR_MAX)
8087 val = (upper << 32) | val;
8088
8089 } else {
8090 /* If we rolled we are saturated */
8091 if ((val < sval) || (val > CNTR_MAX))
8092 val = CNTR_MAX;
8093 }
8094 }
8095
8096 *psval = val;
8097
8098 hfi1_cdbg(CNTR, "\tNew val=0x%llx", val);
8099
8100 return val;
8101}
8102
8103static u64 write_dev_port_cntr(struct hfi1_devdata *dd,
8104 struct cntr_entry *entry,
8105 u64 *psval, void *context, int vl, u64 data)
8106{
8107 u64 val;
8108
8109 if (entry->flags & CNTR_DISABLED) {
8110 dd_dev_err(dd, "Counter %s not enabled", entry->name);
8111 return 0;
8112 }
8113
8114 hfi1_cdbg(CNTR, "cntr: %s vl %d psval 0x%llx", entry->name, vl, *psval);
8115
8116 if (entry->flags & CNTR_SYNTH) {
8117 *psval = data;
8118 if (entry->flags & CNTR_32BIT) {
8119 val = entry->rw_cntr(entry, context, vl, CNTR_MODE_W,
8120 (data << 32) >> 32);
8121 val = data; /* return the full 64bit value */
8122 } else {
8123 val = entry->rw_cntr(entry, context, vl, CNTR_MODE_W,
8124 data);
8125 }
8126 } else {
8127 val = entry->rw_cntr(entry, context, vl, CNTR_MODE_W, data);
8128 }
8129
8130 *psval = val;
8131
8132 hfi1_cdbg(CNTR, "\tNew val=0x%llx", val);
8133
8134 return val;
8135}
8136
8137u64 read_dev_cntr(struct hfi1_devdata *dd, int index, int vl)
8138{
8139 struct cntr_entry *entry;
8140 u64 *sval;
8141
8142 entry = &dev_cntrs[index];
8143 sval = dd->scntrs + entry->offset;
8144
8145 if (vl != CNTR_INVALID_VL)
8146 sval += vl;
8147
8148 return read_dev_port_cntr(dd, entry, sval, dd, vl);
8149}
8150
8151u64 write_dev_cntr(struct hfi1_devdata *dd, int index, int vl, u64 data)
8152{
8153 struct cntr_entry *entry;
8154 u64 *sval;
8155
8156 entry = &dev_cntrs[index];
8157 sval = dd->scntrs + entry->offset;
8158
8159 if (vl != CNTR_INVALID_VL)
8160 sval += vl;
8161
8162 return write_dev_port_cntr(dd, entry, sval, dd, vl, data);
8163}
8164
8165u64 read_port_cntr(struct hfi1_pportdata *ppd, int index, int vl)
8166{
8167 struct cntr_entry *entry;
8168 u64 *sval;
8169
8170 entry = &port_cntrs[index];
8171 sval = ppd->scntrs + entry->offset;
8172
8173 if (vl != CNTR_INVALID_VL)
8174 sval += vl;
8175
8176 if ((index >= C_RCV_HDR_OVF_FIRST + ppd->dd->num_rcv_contexts) &&
8177 (index <= C_RCV_HDR_OVF_LAST)) {
8178 /* We do not want to bother for disabled contexts */
8179 return 0;
8180 }
8181
8182 return read_dev_port_cntr(ppd->dd, entry, sval, ppd, vl);
8183}
8184
8185u64 write_port_cntr(struct hfi1_pportdata *ppd, int index, int vl, u64 data)
8186{
8187 struct cntr_entry *entry;
8188 u64 *sval;
8189
8190 entry = &port_cntrs[index];
8191 sval = ppd->scntrs + entry->offset;
8192
8193 if (vl != CNTR_INVALID_VL)
8194 sval += vl;
8195
8196 if ((index >= C_RCV_HDR_OVF_FIRST + ppd->dd->num_rcv_contexts) &&
8197 (index <= C_RCV_HDR_OVF_LAST)) {
8198 /* We do not want to bother for disabled contexts */
8199 return 0;
8200 }
8201
8202 return write_dev_port_cntr(ppd->dd, entry, sval, ppd, vl, data);
8203}
8204
8205static void update_synth_timer(unsigned long opaque)
8206{
8207 u64 cur_tx;
8208 u64 cur_rx;
8209 u64 total_flits;
8210 u8 update = 0;
8211 int i, j, vl;
8212 struct hfi1_pportdata *ppd;
8213 struct cntr_entry *entry;
8214
8215 struct hfi1_devdata *dd = (struct hfi1_devdata *)opaque;
8216
8217 /*
8218	 * Rather than keep beating on the CSRs, pick a minimal set that we can
8219	 * check to watch for a potential rollover. We do this by looking at the
8220	 * number of flits sent/received. If the total flits exceeds 32 bits,
8221	 * then we have to iterate over all the counters and update them.
8222 */
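	/*
	 * In other words: C_DC_RCV_FLITS and C_DC_XMIT_FLITS act as
	 * tripwires; a full sweep of every device and port counter is only
	 * done when one of them rolls back or their combined delta reaches
	 * the 32-bit limit.
	 */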
8223 entry = &dev_cntrs[C_DC_RCV_FLITS];
8224 cur_rx = entry->rw_cntr(entry, dd, CNTR_INVALID_VL, CNTR_MODE_R, 0);
8225
8226 entry = &dev_cntrs[C_DC_XMIT_FLITS];
8227 cur_tx = entry->rw_cntr(entry, dd, CNTR_INVALID_VL, CNTR_MODE_R, 0);
8228
8229 hfi1_cdbg(
8230 CNTR,
8231 "[%d] curr tx=0x%llx rx=0x%llx :: last tx=0x%llx rx=0x%llx\n",
8232 dd->unit, cur_tx, cur_rx, dd->last_tx, dd->last_rx);
8233
8234 if ((cur_tx < dd->last_tx) || (cur_rx < dd->last_rx)) {
8235 /*
8236 * May not be strictly necessary to update but it won't hurt and
8237 * simplifies the logic here.
8238 */
8239 update = 1;
8240 hfi1_cdbg(CNTR, "[%d] Tripwire counter rolled, updating",
8241 dd->unit);
8242 } else {
8243 total_flits = (cur_tx - dd->last_tx) + (cur_rx - dd->last_rx);
8244 hfi1_cdbg(CNTR,
8245 "[%d] total flits 0x%llx limit 0x%llx\n", dd->unit,
8246 total_flits, (u64)CNTR_32BIT_MAX);
8247 if (total_flits >= CNTR_32BIT_MAX) {
8248 hfi1_cdbg(CNTR, "[%d] 32bit limit hit, updating",
8249 dd->unit);
8250 update = 1;
8251 }
8252 }
8253
8254 if (update) {
8255 hfi1_cdbg(CNTR, "[%d] Updating dd and ppd counters", dd->unit);
8256 for (i = 0; i < DEV_CNTR_LAST; i++) {
8257 entry = &dev_cntrs[i];
8258 if (entry->flags & CNTR_VL) {
8259 for (vl = 0; vl < C_VL_COUNT; vl++)
8260 read_dev_cntr(dd, i, vl);
8261 } else {
8262 read_dev_cntr(dd, i, CNTR_INVALID_VL);
8263 }
8264 }
8265 ppd = (struct hfi1_pportdata *)(dd + 1);
8266 for (i = 0; i < dd->num_pports; i++, ppd++) {
8267 for (j = 0; j < PORT_CNTR_LAST; j++) {
8268 entry = &port_cntrs[j];
8269 if (entry->flags & CNTR_VL) {
8270 for (vl = 0; vl < C_VL_COUNT; vl++)
8271 read_port_cntr(ppd, j, vl);
8272 } else {
8273 read_port_cntr(ppd, j, CNTR_INVALID_VL);
8274 }
8275 }
8276 }
8277
8278 /*
8279 * We want the value in the register. The goal is to keep track
8280 * of the number of "ticks" not the counter value. In other
8281 * words if the register rolls we want to notice it and go ahead
8282 * and force an update.
8283 */
8284 entry = &dev_cntrs[C_DC_XMIT_FLITS];
8285 dd->last_tx = entry->rw_cntr(entry, dd, CNTR_INVALID_VL,
8286 CNTR_MODE_R, 0);
8287
8288 entry = &dev_cntrs[C_DC_RCV_FLITS];
8289 dd->last_rx = entry->rw_cntr(entry, dd, CNTR_INVALID_VL,
8290 CNTR_MODE_R, 0);
8291
8292 hfi1_cdbg(CNTR, "[%d] setting last tx/rx to 0x%llx 0x%llx",
8293 dd->unit, dd->last_tx, dd->last_rx);
8294
8295 } else {
8296 hfi1_cdbg(CNTR, "[%d] No update necessary", dd->unit);
8297 }
8298
8299	mod_timer(&dd->synth_stats_timer, jiffies + HZ * SYNTH_CNT_TIME);
8300}
8301
8302#define C_MAX_NAME 13 /* 12 chars + one for \0 */
8303static int init_cntrs(struct hfi1_devdata *dd)
8304{
8305 int i, rcv_ctxts, index, j;
8306 size_t sz;
8307 char *p;
8308 char name[C_MAX_NAME];
8309 struct hfi1_pportdata *ppd;
8310
8311 /* set up the stats timer; the add_timer is done at the end */
8312	setup_timer(&dd->synth_stats_timer, update_synth_timer,
8313 (unsigned long)dd);
8314
8315 /***********************/
8316 /* per device counters */
8317 /***********************/
8318
8319	/* size names and determine how many we have */
8320 dd->ndevcntrs = 0;
8321 sz = 0;
8322 index = 0;
8323
8324 for (i = 0; i < DEV_CNTR_LAST; i++) {
8325 hfi1_dbg_early("Init cntr %s\n", dev_cntrs[i].name);
8326 if (dev_cntrs[i].flags & CNTR_DISABLED) {
8327 hfi1_dbg_early("\tSkipping %s\n", dev_cntrs[i].name);
8328 continue;
8329 }
8330
8331 if (dev_cntrs[i].flags & CNTR_VL) {
8332 hfi1_dbg_early("\tProcessing VL cntr\n");
8333 dev_cntrs[i].offset = index;
8334 for (j = 0; j < C_VL_COUNT; j++) {
8335 memset(name, '\0', C_MAX_NAME);
8336 snprintf(name, C_MAX_NAME, "%s%d",
8337 dev_cntrs[i].name,
8338 vl_from_idx(j));
8339 sz += strlen(name);
8340 sz++;
8341 hfi1_dbg_early("\t\t%s\n", name);
8342 dd->ndevcntrs++;
8343 index++;
8344 }
8345 } else {
8346 /* +1 for newline */
8347 sz += strlen(dev_cntrs[i].name) + 1;
8348 dd->ndevcntrs++;
8349 dev_cntrs[i].offset = index;
8350 index++;
8351 hfi1_dbg_early("\tAdding %s\n", dev_cntrs[i].name);
8352 }
8353 }
8354
8355 /* allocate space for the counter values */
8356 dd->cntrs = kcalloc(index, sizeof(u64), GFP_KERNEL);
8357 if (!dd->cntrs)
8358 goto bail;
8359
8360 dd->scntrs = kcalloc(index, sizeof(u64), GFP_KERNEL);
8361 if (!dd->scntrs)
8362 goto bail;
8363
8364
8365 /* allocate space for the counter names */
8366 dd->cntrnameslen = sz;
8367 dd->cntrnames = kmalloc(sz, GFP_KERNEL);
8368 if (!dd->cntrnames)
8369 goto bail;
8370
8371 /* fill in the names */
8372 for (p = dd->cntrnames, i = 0, index = 0; i < DEV_CNTR_LAST; i++) {
8373 if (dev_cntrs[i].flags & CNTR_DISABLED) {
8374 /* Nothing */
8375 } else {
8376 if (dev_cntrs[i].flags & CNTR_VL) {
8377 for (j = 0; j < C_VL_COUNT; j++) {
8378 memset(name, '\0', C_MAX_NAME);
8379 snprintf(name, C_MAX_NAME, "%s%d",
8380 dev_cntrs[i].name,
8381 vl_from_idx(j));
8382 memcpy(p, name, strlen(name));
8383 p += strlen(name);
8384 *p++ = '\n';
8385 }
8386 } else {
8387 memcpy(p, dev_cntrs[i].name,
8388 strlen(dev_cntrs[i].name));
8389 p += strlen(dev_cntrs[i].name);
8390 *p++ = '\n';
8391 }
8392 index++;
8393 }
8394 }
8395
8396 /*********************/
8397 /* per port counters */
8398 /*********************/
8399
8400 /*
8401 * Go through the counters for the overflows and disable the ones we
8402 * don't need. This varies based on platform so we need to do it
8403 * dynamically here.
8404 */
8405 rcv_ctxts = dd->num_rcv_contexts;
8406 for (i = C_RCV_HDR_OVF_FIRST + rcv_ctxts;
8407 i <= C_RCV_HDR_OVF_LAST; i++) {
8408 port_cntrs[i].flags |= CNTR_DISABLED;
8409 }
8410
8411	/* size port counter names and determine how many we have */
8412 sz = 0;
8413 dd->nportcntrs = 0;
8414 for (i = 0; i < PORT_CNTR_LAST; i++) {
8415 hfi1_dbg_early("Init pcntr %s\n", port_cntrs[i].name);
8416 if (port_cntrs[i].flags & CNTR_DISABLED) {
8417 hfi1_dbg_early("\tSkipping %s\n", port_cntrs[i].name);
8418 continue;
8419 }
8420
8421 if (port_cntrs[i].flags & CNTR_VL) {
8422 hfi1_dbg_early("\tProcessing VL cntr\n");
8423 port_cntrs[i].offset = dd->nportcntrs;
8424 for (j = 0; j < C_VL_COUNT; j++) {
8425 memset(name, '\0', C_MAX_NAME);
8426 snprintf(name, C_MAX_NAME, "%s%d",
8427 port_cntrs[i].name,
8428 vl_from_idx(j));
8429 sz += strlen(name);
8430 sz++;
8431 hfi1_dbg_early("\t\t%s\n", name);
8432 dd->nportcntrs++;
8433 }
8434 } else {
8435 /* +1 for newline */
8436 sz += strlen(port_cntrs[i].name) + 1;
8437 port_cntrs[i].offset = dd->nportcntrs;
8438 dd->nportcntrs++;
8439 hfi1_dbg_early("\tAdding %s\n", port_cntrs[i].name);
8440 }
8441 }
8442
8443 /* allocate space for the counter names */
8444 dd->portcntrnameslen = sz;
8445 dd->portcntrnames = kmalloc(sz, GFP_KERNEL);
8446 if (!dd->portcntrnames)
8447 goto bail;
8448
8449 /* fill in port cntr names */
8450 for (p = dd->portcntrnames, i = 0; i < PORT_CNTR_LAST; i++) {
8451 if (port_cntrs[i].flags & CNTR_DISABLED)
8452 continue;
8453
8454 if (port_cntrs[i].flags & CNTR_VL) {
8455 for (j = 0; j < C_VL_COUNT; j++) {
8456 memset(name, '\0', C_MAX_NAME);
8457 snprintf(name, C_MAX_NAME, "%s%d",
8458 port_cntrs[i].name,
8459 vl_from_idx(j));
8460 memcpy(p, name, strlen(name));
8461 p += strlen(name);
8462 *p++ = '\n';
8463 }
8464 } else {
8465 memcpy(p, port_cntrs[i].name,
8466 strlen(port_cntrs[i].name));
8467 p += strlen(port_cntrs[i].name);
8468 *p++ = '\n';
8469 }
8470 }
8471
8472 /* allocate per port storage for counter values */
8473 ppd = (struct hfi1_pportdata *)(dd + 1);
8474 for (i = 0; i < dd->num_pports; i++, ppd++) {
8475 ppd->cntrs = kcalloc(dd->nportcntrs, sizeof(u64), GFP_KERNEL);
8476 if (!ppd->cntrs)
8477 goto bail;
8478
8479 ppd->scntrs = kcalloc(dd->nportcntrs, sizeof(u64), GFP_KERNEL);
8480 if (!ppd->scntrs)
8481 goto bail;
8482 }
8483
8484 /* CPU counters need to be allocated and zeroed */
8485 if (init_cpu_counters(dd))
8486 goto bail;
8487
8488 mod_timer(&dd->synth_stats_timer, jiffies + HZ * SYNTH_CNT_TIME);
8489 return 0;
8490bail:
8491 free_cntrs(dd);
8492 return -ENOMEM;
8493}
8494
8495
8496static u32 chip_to_opa_lstate(struct hfi1_devdata *dd, u32 chip_lstate)
8497{
8498 switch (chip_lstate) {
8499 default:
8500 dd_dev_err(dd,
8501 "Unknown logical state 0x%x, reporting IB_PORT_DOWN\n",
8502 chip_lstate);
8503 /* fall through */
8504 case LSTATE_DOWN:
8505 return IB_PORT_DOWN;
8506 case LSTATE_INIT:
8507 return IB_PORT_INIT;
8508 case LSTATE_ARMED:
8509 return IB_PORT_ARMED;
8510 case LSTATE_ACTIVE:
8511 return IB_PORT_ACTIVE;
8512 }
8513}
8514
8515u32 chip_to_opa_pstate(struct hfi1_devdata *dd, u32 chip_pstate)
8516{
8517 /* look at the HFI meta-states only */
8518 switch (chip_pstate & 0xf0) {
8519 default:
8520 dd_dev_err(dd, "Unexpected chip physical state of 0x%x\n",
8521 chip_pstate);
8522 /* fall through */
8523 case PLS_DISABLED:
8524 return IB_PORTPHYSSTATE_DISABLED;
8525 case PLS_OFFLINE:
8526 return OPA_PORTPHYSSTATE_OFFLINE;
8527 case PLS_POLLING:
8528 return IB_PORTPHYSSTATE_POLLING;
8529 case PLS_CONFIGPHY:
8530 return IB_PORTPHYSSTATE_TRAINING;
8531 case PLS_LINKUP:
8532 return IB_PORTPHYSSTATE_LINKUP;
8533 case PLS_PHYTEST:
8534 return IB_PORTPHYSSTATE_PHY_TEST;
8535 }
8536}
8537
8538/* return the OPA port logical state name */
8539const char *opa_lstate_name(u32 lstate)
8540{
8541 static const char * const port_logical_names[] = {
8542 "PORT_NOP",
8543 "PORT_DOWN",
8544 "PORT_INIT",
8545 "PORT_ARMED",
8546 "PORT_ACTIVE",
8547 "PORT_ACTIVE_DEFER",
8548 };
8549 if (lstate < ARRAY_SIZE(port_logical_names))
8550 return port_logical_names[lstate];
8551 return "unknown";
8552}
8553
8554/* return the OPA port physical state name */
8555const char *opa_pstate_name(u32 pstate)
8556{
8557 static const char * const port_physical_names[] = {
8558 "PHYS_NOP",
8559 "reserved1",
8560 "PHYS_POLL",
8561 "PHYS_DISABLED",
8562 "PHYS_TRAINING",
8563 "PHYS_LINKUP",
8564 "PHYS_LINK_ERR_RECOVER",
8565 "PHYS_PHY_TEST",
8566 "reserved8",
8567 "PHYS_OFFLINE",
8568 "PHYS_GANGED",
8569 "PHYS_TEST",
8570 };
8571 if (pstate < ARRAY_SIZE(port_physical_names))
8572 return port_physical_names[pstate];
8573 return "unknown";
8574}
8575
8576/*
8577 * Read the hardware link state and set the driver's cached value of it.
8578 * Return the (new) current value.
8579 */
8580u32 get_logical_state(struct hfi1_pportdata *ppd)
8581{
8582 u32 new_state;
8583
8584 new_state = chip_to_opa_lstate(ppd->dd, read_logical_state(ppd->dd));
8585 if (new_state != ppd->lstate) {
8586 dd_dev_info(ppd->dd, "logical state changed to %s (0x%x)\n",
8587 opa_lstate_name(new_state), new_state);
8588 ppd->lstate = new_state;
8589 }
8590 /*
8591 * Set port status flags in the page mapped into userspace
8592 * memory. Do it here to ensure a reliable state - this is
8593 * the only function called by all state handling code.
8594	 * Always set the flags, because the cached value
8595	 * might have been changed explicitly outside of
8596	 * this function.
8597 */
8598 if (ppd->statusp) {
8599 switch (ppd->lstate) {
8600 case IB_PORT_DOWN:
8601 case IB_PORT_INIT:
8602 *ppd->statusp &= ~(HFI1_STATUS_IB_CONF |
8603 HFI1_STATUS_IB_READY);
8604 break;
8605 case IB_PORT_ARMED:
8606 *ppd->statusp |= HFI1_STATUS_IB_CONF;
8607 break;
8608 case IB_PORT_ACTIVE:
8609 *ppd->statusp |= HFI1_STATUS_IB_READY;
8610 break;
8611 }
8612 }
8613 return ppd->lstate;
8614}
8615
8616/**
8617 * wait_logical_linkstate - wait for an IB link state change to occur
8618 * @ppd: port device
8619 * @state: the state to wait for
8620 * @msecs: the number of milliseconds to wait
8621 *
8622 * Wait up to msecs milliseconds for IB link state change to occur.
8623 * For now, take the easy polling route.
8624 * Returns 0 if state reached, otherwise -ETIMEDOUT.
8625 */
8626static int wait_logical_linkstate(struct hfi1_pportdata *ppd, u32 state,
8627 int msecs)
8628{
8629 unsigned long timeout;
8630
8631 timeout = jiffies + msecs_to_jiffies(msecs);
8632 while (1) {
8633 if (get_logical_state(ppd) == state)
8634 return 0;
8635 if (time_after(jiffies, timeout))
8636 break;
8637 msleep(20);
8638 }
8639 dd_dev_err(ppd->dd, "timeout waiting for link state 0x%x\n", state);
8640
8641 return -ETIMEDOUT;
8642}
8643
8644u8 hfi1_ibphys_portstate(struct hfi1_pportdata *ppd)
8645{
8646 static u32 remembered_state = 0xff;
8647 u32 pstate;
8648 u32 ib_pstate;
8649
8650 pstate = read_physical_state(ppd->dd);
8651 ib_pstate = chip_to_opa_pstate(ppd->dd, pstate);
8652 if (remembered_state != ib_pstate) {
8653 dd_dev_info(ppd->dd,
8654 "%s: physical state changed to %s (0x%x), phy 0x%x\n",
8655 __func__, opa_pstate_name(ib_pstate), ib_pstate,
8656 pstate);
8657 remembered_state = ib_pstate;
8658 }
8659 return ib_pstate;
8660}
8661
8662/*
8663 * Read/modify/write ASIC_QSFP register bits as selected by mask
8664 * data: 0 or 1 in the positions depending on what needs to be written
8665 * dir: 0 for read, 1 for write
8666 * mask: select by setting
8667 * I2CCLK (bit 0)
8668 * I2CDATA (bit 1)
8669 */
8670u64 hfi1_gpio_mod(struct hfi1_devdata *dd, u32 target, u32 data, u32 dir,
8671 u32 mask)
8672{
8673 u64 qsfp_oe, target_oe;
8674
8675 target_oe = target ? ASIC_QSFP2_OE : ASIC_QSFP1_OE;
8676 if (mask) {
8677 /* We are writing register bits, so lock access */
8678 dir &= mask;
8679 data &= mask;
8680
8681 qsfp_oe = read_csr(dd, target_oe);
8682 qsfp_oe = (qsfp_oe & ~(u64)mask) | (u64)dir;
8683 write_csr(dd, target_oe, qsfp_oe);
8684 }
8685	 /* We are exclusively reading bits here, but it is unlikely
8686	 * we'll get valid data when we set the direction of the pin
8687	 * in the same call, so the caller should call this function
8688	 * again to read valid data
8689	 */
8690 return read_csr(dd, target ? ASIC_QSFP2_IN : ASIC_QSFP1_IN);
8691}
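
/*
 * Illustrative sketch only (not called by the driver): one way a caller
 * might sample the QSFP I2C pins through hfi1_gpio_mod().  The helper
 * name and the raw mask value (I2CCLK = bit 0, I2CDATA = bit 1, per the
 * comment above) are assumptions for this sketch.
 */
static inline u64 example_qsfp_i2c_sample(struct hfi1_devdata *dd, u32 target)
{
        /* first call: make both masked pins inputs (dir = 0); data not yet valid */
        hfi1_gpio_mod(dd, target, 0, 0, 0x3);
        /* second call with mask == 0: OE register untouched, pins are sampled */
        return hfi1_gpio_mod(dd, target, 0, 0, 0) & 0x3;
}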
8692
8693#define CLEAR_STATIC_RATE_CONTROL_SMASK(r) \
8694(r &= ~SEND_CTXT_CHECK_ENABLE_DISALLOW_PBC_STATIC_RATE_CONTROL_SMASK)
8695
8696#define SET_STATIC_RATE_CONTROL_SMASK(r) \
8697(r |= SEND_CTXT_CHECK_ENABLE_DISALLOW_PBC_STATIC_RATE_CONTROL_SMASK)
8698
8699int hfi1_init_ctxt(struct send_context *sc)
8700{
8701 if (sc != NULL) {
8702 struct hfi1_devdata *dd = sc->dd;
8703 u64 reg;
8704 u8 set = (sc->type == SC_USER ?
8705 HFI1_CAP_IS_USET(STATIC_RATE_CTRL) :
8706 HFI1_CAP_IS_KSET(STATIC_RATE_CTRL));
8707 reg = read_kctxt_csr(dd, sc->hw_context,
8708 SEND_CTXT_CHECK_ENABLE);
8709 if (set)
8710 CLEAR_STATIC_RATE_CONTROL_SMASK(reg);
8711 else
8712 SET_STATIC_RATE_CONTROL_SMASK(reg);
8713 write_kctxt_csr(dd, sc->hw_context,
8714 SEND_CTXT_CHECK_ENABLE, reg);
8715 }
8716 return 0;
8717}
8718
8719int hfi1_tempsense_rd(struct hfi1_devdata *dd, struct hfi1_temp *temp)
8720{
8721 int ret = 0;
8722 u64 reg;
8723
8724 if (dd->icode != ICODE_RTL_SILICON) {
8725 if (HFI1_CAP_IS_KSET(PRINT_UNIMPL))
8726 dd_dev_info(dd, "%s: tempsense not supported by HW\n",
8727 __func__);
8728 return -EINVAL;
8729 }
8730 reg = read_csr(dd, ASIC_STS_THERM);
8731 temp->curr = ((reg >> ASIC_STS_THERM_CURR_TEMP_SHIFT) &
8732 ASIC_STS_THERM_CURR_TEMP_MASK);
8733 temp->lo_lim = ((reg >> ASIC_STS_THERM_LO_TEMP_SHIFT) &
8734 ASIC_STS_THERM_LO_TEMP_MASK);
8735 temp->hi_lim = ((reg >> ASIC_STS_THERM_HI_TEMP_SHIFT) &
8736 ASIC_STS_THERM_HI_TEMP_MASK);
8737 temp->crit_lim = ((reg >> ASIC_STS_THERM_CRIT_TEMP_SHIFT) &
8738 ASIC_STS_THERM_CRIT_TEMP_MASK);
8739 /* triggers is a 3-bit value - 1 bit per trigger. */
8740 temp->triggers = (u8)((reg >> ASIC_STS_THERM_LOW_SHIFT) & 0x7);
8741
8742 return ret;
8743}
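
/*
 * Illustrative sketch only (not called by the driver): a hypothetical
 * caller of hfi1_tempsense_rd() that logs the decoded fields.  The
 * helper name is an assumption for the example.
 */
static inline void example_log_tempsense(struct hfi1_devdata *dd)
{
        struct hfi1_temp temp;

        if (hfi1_tempsense_rd(dd, &temp) == 0)
                dd_dev_info(dd, "temp: curr %u, lo/hi/crit %u/%u/%u, triggers 0x%x\n",
                            (unsigned)temp.curr, (unsigned)temp.lo_lim,
                            (unsigned)temp.hi_lim, (unsigned)temp.crit_lim,
                            (unsigned)temp.triggers);
}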
8744
8745/* ========================================================================= */
8746
8747/*
8748 * Enable/disable chip from delivering interrupts.
8749 */
8750void set_intr_state(struct hfi1_devdata *dd, u32 enable)
8751{
8752 int i;
8753
8754 /*
8755 * In HFI, the mask needs to be 1 to allow interrupts.
8756 */
8757 if (enable) {
8758 u64 cce_int_mask;
8759 const int qsfp1_int_smask = QSFP1_INT % 64;
8760 const int qsfp2_int_smask = QSFP2_INT % 64;
8761
8762 /* enable all interrupts */
8763 for (i = 0; i < CCE_NUM_INT_CSRS; i++)
8764 write_csr(dd, CCE_INT_MASK + (8*i), ~(u64)0);
8765
8766 /*
8767 * disable QSFP1 interrupts for HFI1, QSFP2 interrupts for HFI0
8768 * Qsfp1Int and Qsfp2Int are adjacent bits in the same CSR,
8769 * therefore just one of QSFP1_INT/QSFP2_INT can be used to find
8770 * the index of the appropriate CSR in the CCEIntMask CSR array
8771 */
8772 cce_int_mask = read_csr(dd, CCE_INT_MASK +
8773 (8*(QSFP1_INT/64)));
8774 if (dd->hfi1_id) {
8775 cce_int_mask &= ~((u64)1 << qsfp1_int_smask);
8776 write_csr(dd, CCE_INT_MASK + (8*(QSFP1_INT/64)),
8777 cce_int_mask);
8778 } else {
8779 cce_int_mask &= ~((u64)1 << qsfp2_int_smask);
8780 write_csr(dd, CCE_INT_MASK + (8*(QSFP2_INT/64)),
8781 cce_int_mask);
8782 }
8783 } else {
8784 for (i = 0; i < CCE_NUM_INT_CSRS; i++)
8785 write_csr(dd, CCE_INT_MASK + (8*i), 0ull);
8786 }
8787}
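
/*
 * Sketch for illustration (the helper is hypothetical, not used by the
 * driver): the CSR/bit arithmetic relied on above.  Interrupt source
 * number 'src' lives in CCE_INT_MASK + 8 * (src / 64), at bit src % 64.
 */
static inline u64 example_int_mask_bit(u32 src, u32 *csr_offset)
{
        *csr_offset = CCE_INT_MASK + 8 * (src / 64);    /* owning 64-bit mask CSR */
        return (u64)1 << (src % 64);                    /* bit within that CSR */
}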
8788
8789/*
8790 * Clear all interrupt sources on the chip.
8791 */
8792static void clear_all_interrupts(struct hfi1_devdata *dd)
8793{
8794 int i;
8795
8796 for (i = 0; i < CCE_NUM_INT_CSRS; i++)
8797 write_csr(dd, CCE_INT_CLEAR + (8*i), ~(u64)0);
8798
8799 write_csr(dd, CCE_ERR_CLEAR, ~(u64)0);
8800 write_csr(dd, MISC_ERR_CLEAR, ~(u64)0);
8801 write_csr(dd, RCV_ERR_CLEAR, ~(u64)0);
8802 write_csr(dd, SEND_ERR_CLEAR, ~(u64)0);
8803 write_csr(dd, SEND_PIO_ERR_CLEAR, ~(u64)0);
8804 write_csr(dd, SEND_DMA_ERR_CLEAR, ~(u64)0);
8805 write_csr(dd, SEND_EGRESS_ERR_CLEAR, ~(u64)0);
8806 for (i = 0; i < dd->chip_send_contexts; i++)
8807 write_kctxt_csr(dd, i, SEND_CTXT_ERR_CLEAR, ~(u64)0);
8808 for (i = 0; i < dd->chip_sdma_engines; i++)
8809 write_kctxt_csr(dd, i, SEND_DMA_ENG_ERR_CLEAR, ~(u64)0);
8810
8811 write_csr(dd, DCC_ERR_FLG_CLR, ~(u64)0);
8812 write_csr(dd, DC_LCB_ERR_CLR, ~(u64)0);
8813 write_csr(dd, DC_DC8051_ERR_CLR, ~(u64)0);
8814}
8815
8816/* Move to pcie.c? */
8817static void disable_intx(struct pci_dev *pdev)
8818{
8819 pci_intx(pdev, 0);
8820}
8821
8822static void clean_up_interrupts(struct hfi1_devdata *dd)
8823{
8824 int i;
8825
8826 /* remove irqs - must happen before disabling/turning off */
8827 if (dd->num_msix_entries) {
8828 /* MSI-X */
8829 struct hfi1_msix_entry *me = dd->msix_entries;
8830
8831 for (i = 0; i < dd->num_msix_entries; i++, me++) {
8832 if (me->arg == NULL) /* => no irq, no affinity */
8833 break;
8834 irq_set_affinity_hint(dd->msix_entries[i].msix.vector,
8835 NULL);
8836 free_irq(me->msix.vector, me->arg);
8837 }
8838 } else {
8839 /* INTx */
8840 if (dd->requested_intx_irq) {
8841 free_irq(dd->pcidev->irq, dd);
8842 dd->requested_intx_irq = 0;
8843 }
8844 }
8845
8846 /* turn off interrupts */
8847 if (dd->num_msix_entries) {
8848 /* MSI-X */
8849		pci_disable_msix(dd->pcidev);
8850	} else {
8851 /* INTx */
8852 disable_intx(dd->pcidev);
8853 }
8854
8855 /* clean structures */
8856 for (i = 0; i < dd->num_msix_entries; i++)
8857 free_cpumask_var(dd->msix_entries[i].mask);
8858 kfree(dd->msix_entries);
8859 dd->msix_entries = NULL;
8860 dd->num_msix_entries = 0;
8861}
8862
8863/*
8864 * Remap the interrupt source from the general handler to the given MSI-X
8865 * interrupt.
8866 */
8867static void remap_intr(struct hfi1_devdata *dd, int isrc, int msix_intr)
8868{
8869 u64 reg;
8870 int m, n;
8871
8872 /* clear from the handled mask of the general interrupt */
8873 m = isrc / 64;
8874 n = isrc % 64;
8875 dd->gi_mask[m] &= ~((u64)1 << n);
8876
8877 /* direct the chip source to the given MSI-X interrupt */
8878 m = isrc / 8;
8879 n = isrc % 8;
8880 reg = read_csr(dd, CCE_INT_MAP + (8*m));
8881 reg &= ~((u64)0xff << (8*n));
8882 reg |= ((u64)msix_intr & 0xff) << (8*n);
8883 write_csr(dd, CCE_INT_MAP + (8*m), reg);
8884}
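
/*
 * Worked example of the remap arithmetic above (hypothetical helper for
 * illustration only): which CCE_INT_MAP CSR and which 8-bit lane inside
 * it carry the MSI-X vector for a given chip interrupt source.
 */
static inline void example_int_map_location(int isrc, int *map_csr, int *lane)
{
        *map_csr = isrc / 8;    /* CSR index: CCE_INT_MAP + 8 * (*map_csr) */
        *lane = isrc % 8;       /* byte lane: bits [8*lane + 7 : 8*lane] */
}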
8885
8886static void remap_sdma_interrupts(struct hfi1_devdata *dd,
8887 int engine, int msix_intr)
8888{
8889 /*
8890	 * SDMA engine interrupt sources are grouped by type, rather than
8891	 * by engine. Per-engine interrupts are as follows:
8892 * SDMA
8893 * SDMAProgress
8894 * SDMAIdle
8895 */
8896 remap_intr(dd, IS_SDMA_START + 0*TXE_NUM_SDMA_ENGINES + engine,
8897 msix_intr);
8898 remap_intr(dd, IS_SDMA_START + 1*TXE_NUM_SDMA_ENGINES + engine,
8899 msix_intr);
8900 remap_intr(dd, IS_SDMA_START + 2*TXE_NUM_SDMA_ENGINES + engine,
8901 msix_intr);
8902}
8903
8904static int request_intx_irq(struct hfi1_devdata *dd)
8905{
8906 int ret;
8907
8908 snprintf(dd->intx_name, sizeof(dd->intx_name), DRIVER_NAME"_%d",
8909 dd->unit);
8910 ret = request_irq(dd->pcidev->irq, general_interrupt,
8911 IRQF_SHARED, dd->intx_name, dd);
8912 if (ret)
8913 dd_dev_err(dd, "unable to request INTx interrupt, err %d\n",
8914 ret);
8915 else
8916 dd->requested_intx_irq = 1;
8917 return ret;
8918}
8919
8920static int request_msix_irqs(struct hfi1_devdata *dd)
8921{
8922 const struct cpumask *local_mask;
8923 cpumask_var_t def, rcv;
8924 bool def_ret, rcv_ret;
8925 int first_general, last_general;
8926 int first_sdma, last_sdma;
8927 int first_rx, last_rx;
8928	int first_cpu, curr_cpu;
8929	int rcv_cpu, sdma_cpu;
8930 int i, ret = 0, possible;
8931 int ht;
8932
8933 /* calculate the ranges we are going to use */
8934 first_general = 0;
8935 first_sdma = last_general = first_general + 1;
8936 first_rx = last_sdma = first_sdma + dd->num_sdma;
8937 last_rx = first_rx + dd->n_krcv_queues;
8938
8939 /*
8940 * Interrupt affinity.
8941 *
8942	 * Non-receive interrupts get a default mask that starts as the
8943	 * possible CPUs on the local node, with hyperthread siblings and
8944	 * each CPU assigned to a receive interrupt cleared from it.
8945	 *
8946	 * Receive interrupts are assigned node-relative CPUs starting at
8947	 * 1, wrapping back around as necessary.
8948 *
8949 */
8950 local_mask = cpumask_of_pcibus(dd->pcidev->bus);
8951 /* if first cpu is invalid, use NUMA 0 */
8952 if (cpumask_first(local_mask) >= nr_cpu_ids)
8953 local_mask = topology_core_cpumask(0);
8954
8955 def_ret = zalloc_cpumask_var(&def, GFP_KERNEL);
8956 rcv_ret = zalloc_cpumask_var(&rcv, GFP_KERNEL);
8957 if (!def_ret || !rcv_ret)
8958 goto bail;
8959 /* use local mask as default */
8960 cpumask_copy(def, local_mask);
8961 possible = cpumask_weight(def);
8962 /* disarm threads from default */
8963 ht = cpumask_weight(
8964 topology_sibling_cpumask(cpumask_first(local_mask)));
8965 for (i = possible/ht; i < possible; i++)
8966 cpumask_clear_cpu(i, def);
8967	/* def now has full cores on the chosen node */
8968 first_cpu = cpumask_first(def);
8969 if (nr_cpu_ids >= first_cpu)
8970 first_cpu++;
8971	curr_cpu = first_cpu;
8972
8973	/* One context is reserved as the control context */
8974	for (i = first_cpu; i < dd->n_krcv_queues + first_cpu - 1; i++) {
8975		cpumask_clear_cpu(curr_cpu, def);
8976		cpumask_set_cpu(curr_cpu, rcv);
8977		curr_cpu = cpumask_next(curr_cpu, def);
8978 if (curr_cpu >= nr_cpu_ids)
8979 break;
8980	}
8981 /* def mask has non-rcv, rcv has recv mask */
8982 rcv_cpu = cpumask_first(rcv);
8983 sdma_cpu = cpumask_first(def);
8984
8985 /*
8986 * Sanity check - the code expects all SDMA chip source
8987 * interrupts to be in the same CSR, starting at bit 0. Verify
8988 * that this is true by checking the bit location of the start.
8989 */
8990 BUILD_BUG_ON(IS_SDMA_START % 64);
8991
8992 for (i = 0; i < dd->num_msix_entries; i++) {
8993 struct hfi1_msix_entry *me = &dd->msix_entries[i];
8994 const char *err_info;
8995 irq_handler_t handler;
8996		irq_handler_t thread = NULL;
8997		void *arg;
8998 int idx;
8999 struct hfi1_ctxtdata *rcd = NULL;
9000 struct sdma_engine *sde = NULL;
9001
9002 /* obtain the arguments to request_irq */
9003 if (first_general <= i && i < last_general) {
9004 idx = i - first_general;
9005 handler = general_interrupt;
9006 arg = dd;
9007 snprintf(me->name, sizeof(me->name),
9008 DRIVER_NAME"_%d", dd->unit);
9009 err_info = "general";
9010 } else if (first_sdma <= i && i < last_sdma) {
9011 idx = i - first_sdma;
9012 sde = &dd->per_sdma[idx];
9013 handler = sdma_interrupt;
9014 arg = sde;
9015 snprintf(me->name, sizeof(me->name),
9016 DRIVER_NAME"_%d sdma%d", dd->unit, idx);
9017 err_info = "sdma";
9018 remap_sdma_interrupts(dd, idx, i);
9019 } else if (first_rx <= i && i < last_rx) {
9020 idx = i - first_rx;
9021 rcd = dd->rcd[idx];
9022 /* no interrupt if no rcd */
9023 if (!rcd)
9024 continue;
9025 /*
9026 * Set the interrupt register and mask for this
9027 * context's interrupt.
9028 */
9029 rcd->ireg = (IS_RCVAVAIL_START+idx) / 64;
9030 rcd->imask = ((u64)1) <<
9031 ((IS_RCVAVAIL_START+idx) % 64);
9032 handler = receive_context_interrupt;
9033			thread = receive_context_thread;
9034			arg = rcd;
9035 snprintf(me->name, sizeof(me->name),
9036 DRIVER_NAME"_%d kctxt%d", dd->unit, idx);
9037 err_info = "receive context";
9038			remap_intr(dd, IS_RCVAVAIL_START + idx, i);
9039		} else {
9040 /* not in our expected range - complain, then
9041 ignore it */
9042 dd_dev_err(dd,
9043 "Unexpected extra MSI-X interrupt %d\n", i);
9044 continue;
9045 }
9046 /* no argument, no interrupt */
9047 if (arg == NULL)
9048 continue;
9049 /* make sure the name is terminated */
9050 me->name[sizeof(me->name)-1] = 0;
9051
9052		ret = request_threaded_irq(me->msix.vector, handler, thread, 0,
9053					   me->name, arg);
9054		if (ret) {
9055 dd_dev_err(dd,
9056 "unable to allocate %s interrupt, vector %d, index %d, err %d\n",
9057 err_info, me->msix.vector, idx, ret);
9058 return ret;
9059 }
9060 /*
9061 * assign arg after request_irq call, so it will be
9062 * cleaned up
9063 */
9064 me->arg = arg;
9065
9066 if (!zalloc_cpumask_var(
9067 &dd->msix_entries[i].mask,
9068 GFP_KERNEL))
9069 goto bail;
9070 if (handler == sdma_interrupt) {
9071 dd_dev_info(dd, "sdma engine %d cpu %d\n",
9072 sde->this_idx, sdma_cpu);
9073			sde->cpu = sdma_cpu;
9074			cpumask_set_cpu(sdma_cpu, dd->msix_entries[i].mask);
9075 sdma_cpu = cpumask_next(sdma_cpu, def);
9076 if (sdma_cpu >= nr_cpu_ids)
9077 sdma_cpu = cpumask_first(def);
9078 } else if (handler == receive_context_interrupt) {
9079			dd_dev_info(dd, "rcv ctxt %d cpu %d\n", rcd->ctxt,
9080 (rcd->ctxt == HFI1_CTRL_CTXT) ?
9081 cpumask_first(def) : rcv_cpu);
9082 if (rcd->ctxt == HFI1_CTRL_CTXT) {
9083 /* map to first default */
9084 cpumask_set_cpu(cpumask_first(def),
9085 dd->msix_entries[i].mask);
9086 } else {
9087 cpumask_set_cpu(rcv_cpu,
9088 dd->msix_entries[i].mask);
9089 rcv_cpu = cpumask_next(rcv_cpu, rcv);
9090 if (rcv_cpu >= nr_cpu_ids)
9091 rcv_cpu = cpumask_first(rcv);
9092 }
9093		} else {
9094 /* otherwise first def */
9095 dd_dev_info(dd, "%s cpu %d\n",
9096 err_info, cpumask_first(def));
9097 cpumask_set_cpu(
9098 cpumask_first(def), dd->msix_entries[i].mask);
9099 }
9100 irq_set_affinity_hint(
9101 dd->msix_entries[i].msix.vector,
9102 dd->msix_entries[i].mask);
9103 }
9104
9105out:
9106 free_cpumask_var(def);
9107 free_cpumask_var(rcv);
9108 return ret;
9109bail:
9110 ret = -ENOMEM;
9111 goto out;
9112}
9113
9114/*
9115 * Set the general handler to accept all interrupts, remap all
9116 * chip interrupts back to MSI-X 0.
9117 */
9118static void reset_interrupts(struct hfi1_devdata *dd)
9119{
9120 int i;
9121
9122 /* all interrupts handled by the general handler */
9123 for (i = 0; i < CCE_NUM_INT_CSRS; i++)
9124 dd->gi_mask[i] = ~(u64)0;
9125
9126 /* all chip interrupts map to MSI-X 0 */
9127 for (i = 0; i < CCE_NUM_INT_MAP_CSRS; i++)
9128 write_csr(dd, CCE_INT_MAP + (8*i), 0);
9129}
9130
9131static int set_up_interrupts(struct hfi1_devdata *dd)
9132{
9133 struct hfi1_msix_entry *entries;
9134 u32 total, request;
9135 int i, ret;
9136 int single_interrupt = 0; /* we expect to have all the interrupts */
9137
9138 /*
9139 * Interrupt count:
9140 * 1 general, "slow path" interrupt (includes the SDMA engines
9141 * slow source, SDMACleanupDone)
9142 * N interrupts - one per used SDMA engine
9143	 * M interrupts - one per kernel receive context
9144 */
9145 total = 1 + dd->num_sdma + dd->n_krcv_queues;
9146
9147 entries = kcalloc(total, sizeof(*entries), GFP_KERNEL);
9148 if (!entries) {
9149		ret = -ENOMEM;
9150 goto fail;
9151 }
9152 /* 1-1 MSI-X entry assignment */
9153 for (i = 0; i < total; i++)
9154 entries[i].msix.entry = i;
9155
9156 /* ask for MSI-X interrupts */
9157 request = total;
9158 request_msix(dd, &request, entries);
9159
9160 if (request == 0) {
9161 /* using INTx */
9162 /* dd->num_msix_entries already zero */
9163 kfree(entries);
9164 single_interrupt = 1;
9165 dd_dev_err(dd, "MSI-X failed, using INTx interrupts\n");
9166 } else {
9167 /* using MSI-X */
9168 dd->num_msix_entries = request;
9169 dd->msix_entries = entries;
9170
9171 if (request != total) {
9172 /* using MSI-X, with reduced interrupts */
9173 dd_dev_err(
9174 dd,
9175 "cannot handle reduced interrupt case, want %u, got %u\n",
9176 total, request);
9177 ret = -EINVAL;
9178 goto fail;
9179 }
9180 dd_dev_info(dd, "%u MSI-X interrupts allocated\n", total);
9181 }
9182
9183 /* mask all interrupts */
9184 set_intr_state(dd, 0);
9185 /* clear all pending interrupts */
9186 clear_all_interrupts(dd);
9187
9188 /* reset general handler mask, chip MSI-X mappings */
9189 reset_interrupts(dd);
9190
9191 if (single_interrupt)
9192 ret = request_intx_irq(dd);
9193 else
9194 ret = request_msix_irqs(dd);
9195 if (ret)
9196 goto fail;
9197
9198 return 0;
9199
9200fail:
9201 clean_up_interrupts(dd);
9202 return ret;
9203}
9204
9205/*
9206 * Set up context values in dd. Sets:
9207 *
9208 * num_rcv_contexts - number of contexts being used
9209 * n_krcv_queues - number of kernel contexts
9210 * first_user_ctxt - first non-kernel context in array of contexts
9211 * freectxts - number of free user contexts
9212 * num_send_contexts - number of PIO send contexts being used
9213 */
9214static int set_up_context_variables(struct hfi1_devdata *dd)
9215{
9216 int num_kernel_contexts;
9217 int num_user_contexts;
9218 int total_contexts;
9219 int ret;
9220 unsigned ngroups;
9221
9222 /*
9223	 * Kernel contexts: (to be fixed later):
9224	 * - minimum of 2, or 1 context per NUMA node
9225	 * - Context 0 - control context (VL15/multicast/error)
9226	 * - Context 1 - default context
9227	 */
9228 if (n_krcvqs)
9229		/*
9230		 * Don't count context 0 in n_krcvqs since
9231		 * it isn't used for normal verbs traffic.
9232		 *
9233		 * krcvqs will reflect the number of kernel
9234		 * receive contexts above 0.
9235		 */
9236 num_kernel_contexts = n_krcvqs + MIN_KERNEL_KCTXTS - 1;
9237	else
9238 num_kernel_contexts = num_online_nodes();
9239 num_kernel_contexts =
9240 max_t(int, MIN_KERNEL_KCTXTS, num_kernel_contexts);
9241 /*
9242 * Every kernel receive context needs an ACK send context.
9243	 * One send context is allocated for each VL{0-7} and VL15
9244 */
9245 if (num_kernel_contexts > (dd->chip_send_contexts - num_vls - 1)) {
9246 dd_dev_err(dd,
9247 "Reducing # kernel rcv contexts to: %d, from %d\n",
9248 (int)(dd->chip_send_contexts - num_vls - 1),
9249 (int)num_kernel_contexts);
9250 num_kernel_contexts = dd->chip_send_contexts - num_vls - 1;
9251 }
9252 /*
9253 * User contexts: (to be fixed later)
9254 * - set to num_rcv_contexts if non-zero
9255 * - default to 1 user context per CPU
9256 */
9257 if (num_rcv_contexts)
9258 num_user_contexts = num_rcv_contexts;
9259 else
9260 num_user_contexts = num_online_cpus();
9261
9262 total_contexts = num_kernel_contexts + num_user_contexts;
9263
9264 /*
9265 * Adjust the counts given a global max.
9266 */
9267 if (total_contexts > dd->chip_rcv_contexts) {
9268 dd_dev_err(dd,
9269 "Reducing # user receive contexts to: %d, from %d\n",
9270 (int)(dd->chip_rcv_contexts - num_kernel_contexts),
9271 (int)num_user_contexts);
9272 num_user_contexts = dd->chip_rcv_contexts - num_kernel_contexts;
9273 /* recalculate */
9274 total_contexts = num_kernel_contexts + num_user_contexts;
9275 }
9276
9277 /* the first N are kernel contexts, the rest are user contexts */
9278 dd->num_rcv_contexts = total_contexts;
9279 dd->n_krcv_queues = num_kernel_contexts;
9280 dd->first_user_ctxt = num_kernel_contexts;
9281 dd->freectxts = num_user_contexts;
9282 dd_dev_info(dd,
9283 "rcv contexts: chip %d, used %d (kernel %d, user %d)\n",
9284 (int)dd->chip_rcv_contexts,
9285 (int)dd->num_rcv_contexts,
9286 (int)dd->n_krcv_queues,
9287 (int)dd->num_rcv_contexts - dd->n_krcv_queues);
9288
9289 /*
9290 * Receive array allocation:
9291 * All RcvArray entries are divided into groups of 8. This
9292 * is required by the hardware and will speed up writes to
9293 * consecutive entries by using write-combining of the entire
9294 * cacheline.
9295 *
9296	 * The number of groups is evenly divided among all contexts;
9297	 * any left-over groups are given to the first N user
9298	 * contexts.
9299 */
9300 dd->rcv_entries.group_size = RCV_INCREMENT;
9301 ngroups = dd->chip_rcv_array_count / dd->rcv_entries.group_size;
9302 dd->rcv_entries.ngroups = ngroups / dd->num_rcv_contexts;
9303 dd->rcv_entries.nctxt_extra = ngroups -
9304 (dd->num_rcv_contexts * dd->rcv_entries.ngroups);
9305 dd_dev_info(dd, "RcvArray groups %u, ctxts extra %u\n",
9306 dd->rcv_entries.ngroups,
9307 dd->rcv_entries.nctxt_extra);
9308 if (dd->rcv_entries.ngroups * dd->rcv_entries.group_size >
9309 MAX_EAGER_ENTRIES * 2) {
9310 dd->rcv_entries.ngroups = (MAX_EAGER_ENTRIES * 2) /
9311 dd->rcv_entries.group_size;
9312 dd_dev_info(dd,
9313 "RcvArray group count too high, change to %u\n",
9314 dd->rcv_entries.ngroups);
9315 dd->rcv_entries.nctxt_extra = 0;
9316 }
9317 /*
9318 * PIO send contexts
9319 */
9320 ret = init_sc_pools_and_sizes(dd);
9321 if (ret >= 0) { /* success */
9322 dd->num_send_contexts = ret;
9323 dd_dev_info(
9324 dd,
9325 "send contexts: chip %d, used %d (kernel %d, ack %d, user %d)\n",
9326 dd->chip_send_contexts,
9327 dd->num_send_contexts,
9328 dd->sc_sizes[SC_KERNEL].count,
9329 dd->sc_sizes[SC_ACK].count,
9330 dd->sc_sizes[SC_USER].count);
9331 ret = 0; /* success */
9332 }
9333
9334 return ret;
9335}
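
/*
 * Worked example of the RcvArray split above, with hypothetical numbers
 * (illustration only, not chip values): with groups of 8 entries, a
 * 1000-entry RcvArray gives ngroups = 125; for 20 receive contexts each
 * context gets 125 / 20 = 6 groups and nctxt_extra = 125 - 20 * 6 = 5,
 * so the first 5 user contexts receive one extra group apiece.
 */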
9336
9337/*
9338 * Set the device/port partition key table. The MAD code
9339 * will ensure that, at least, the partial management
9340 * partition key is present in the table.
9341 */
9342static void set_partition_keys(struct hfi1_pportdata *ppd)
9343{
9344 struct hfi1_devdata *dd = ppd->dd;
9345 u64 reg = 0;
9346 int i;
9347
9348 dd_dev_info(dd, "Setting partition keys\n");
9349 for (i = 0; i < hfi1_get_npkeys(dd); i++) {
9350 reg |= (ppd->pkeys[i] &
9351 RCV_PARTITION_KEY_PARTITION_KEY_A_MASK) <<
9352 ((i % 4) *
9353 RCV_PARTITION_KEY_PARTITION_KEY_B_SHIFT);
9354 /* Each register holds 4 PKey values. */
9355 if ((i % 4) == 3) {
9356 write_csr(dd, RCV_PARTITION_KEY +
9357 ((i - 3) * 2), reg);
9358 reg = 0;
9359 }
9360 }
9361
9362 /* Always enable HW pkeys check when pkeys table is set */
9363 add_rcvctrl(dd, RCV_CTRL_RCV_PARTITION_KEY_ENABLE_SMASK);
9364}
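
/*
 * Packing illustration for the loop above (not additional driver logic):
 * pkeys are 16 bits, so four of them fill one 64-bit RCV_PARTITION_KEY
 * register; keys 0-3 are flushed at i == 3 to offset 0, keys 4-7 at
 * i == 7 to offset 8 ((i - 3) * 2 bytes), and so on.
 */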
9365
9366/*
9367 * These CSRs and memories are uninitialized on reset and must be
9368 * written before reading to set the ECC/parity bits.
9369 *
9370 * NOTE: All user context CSRs that are not mmaped write-only
9371 * (e.g. the TID flows) must be initialized even if the driver never
9372 * reads them.
9373 */
9374static void write_uninitialized_csrs_and_memories(struct hfi1_devdata *dd)
9375{
9376 int i, j;
9377
9378 /* CceIntMap */
9379 for (i = 0; i < CCE_NUM_INT_MAP_CSRS; i++)
9380 write_csr(dd, CCE_INT_MAP+(8*i), 0);
9381
9382 /* SendCtxtCreditReturnAddr */
9383 for (i = 0; i < dd->chip_send_contexts; i++)
9384 write_kctxt_csr(dd, i, SEND_CTXT_CREDIT_RETURN_ADDR, 0);
9385
9386 /* PIO Send buffers */
9387 /* SDMA Send buffers */
9388 /* These are not normally read, and (presently) have no method
9389 to be read, so are not pre-initialized */
9390
9391 /* RcvHdrAddr */
9392 /* RcvHdrTailAddr */
9393 /* RcvTidFlowTable */
9394 for (i = 0; i < dd->chip_rcv_contexts; i++) {
9395 write_kctxt_csr(dd, i, RCV_HDR_ADDR, 0);
9396 write_kctxt_csr(dd, i, RCV_HDR_TAIL_ADDR, 0);
9397 for (j = 0; j < RXE_NUM_TID_FLOWS; j++)
9398 write_uctxt_csr(dd, i, RCV_TID_FLOW_TABLE+(8*j), 0);
9399 }
9400
9401 /* RcvArray */
9402 for (i = 0; i < dd->chip_rcv_array_count; i++)
9403 write_csr(dd, RCV_ARRAY + (8*i),
9404 RCV_ARRAY_RT_WRITE_ENABLE_SMASK);
9405
9406 /* RcvQPMapTable */
9407 for (i = 0; i < 32; i++)
9408 write_csr(dd, RCV_QP_MAP_TABLE + (8 * i), 0);
9409}
9410
9411/*
9412 * Use the ctrl_bits in CceCtrl to clear the status_bits in CceStatus.
9413 */
9414static void clear_cce_status(struct hfi1_devdata *dd, u64 status_bits,
9415 u64 ctrl_bits)
9416{
9417 unsigned long timeout;
9418 u64 reg;
9419
9420 /* is the condition present? */
9421 reg = read_csr(dd, CCE_STATUS);
9422 if ((reg & status_bits) == 0)
9423 return;
9424
9425 /* clear the condition */
9426 write_csr(dd, CCE_CTRL, ctrl_bits);
9427
9428 /* wait for the condition to clear */
9429 timeout = jiffies + msecs_to_jiffies(CCE_STATUS_TIMEOUT);
9430 while (1) {
9431 reg = read_csr(dd, CCE_STATUS);
9432 if ((reg & status_bits) == 0)
9433 return;
9434 if (time_after(jiffies, timeout)) {
9435 dd_dev_err(dd,
9436 "Timeout waiting for CceStatus to clear bits 0x%llx, remaining 0x%llx\n",
9437 status_bits, reg & status_bits);
9438 return;
9439 }
9440 udelay(1);
9441 }
9442}
9443
9444/* set CCE CSRs to chip reset defaults */
9445static void reset_cce_csrs(struct hfi1_devdata *dd)
9446{
9447 int i;
9448
9449 /* CCE_REVISION read-only */
9450 /* CCE_REVISION2 read-only */
9451 /* CCE_CTRL - bits clear automatically */
9452 /* CCE_STATUS read-only, use CceCtrl to clear */
9453 clear_cce_status(dd, ALL_FROZE, CCE_CTRL_SPC_UNFREEZE_SMASK);
9454 clear_cce_status(dd, ALL_TXE_PAUSE, CCE_CTRL_TXE_RESUME_SMASK);
9455 clear_cce_status(dd, ALL_RXE_PAUSE, CCE_CTRL_RXE_RESUME_SMASK);
9456 for (i = 0; i < CCE_NUM_SCRATCH; i++)
9457 write_csr(dd, CCE_SCRATCH + (8 * i), 0);
9458 /* CCE_ERR_STATUS read-only */
9459 write_csr(dd, CCE_ERR_MASK, 0);
9460 write_csr(dd, CCE_ERR_CLEAR, ~0ull);
9461 /* CCE_ERR_FORCE leave alone */
9462 for (i = 0; i < CCE_NUM_32_BIT_COUNTERS; i++)
9463 write_csr(dd, CCE_COUNTER_ARRAY32 + (8 * i), 0);
9464 write_csr(dd, CCE_DC_CTRL, CCE_DC_CTRL_RESETCSR);
9465 /* CCE_PCIE_CTRL leave alone */
9466 for (i = 0; i < CCE_NUM_MSIX_VECTORS; i++) {
9467 write_csr(dd, CCE_MSIX_TABLE_LOWER + (8 * i), 0);
9468 write_csr(dd, CCE_MSIX_TABLE_UPPER + (8 * i),
9469 CCE_MSIX_TABLE_UPPER_RESETCSR);
9470 }
9471 for (i = 0; i < CCE_NUM_MSIX_PBAS; i++) {
9472 /* CCE_MSIX_PBA read-only */
9473 write_csr(dd, CCE_MSIX_INT_GRANTED, ~0ull);
9474 write_csr(dd, CCE_MSIX_VEC_CLR_WITHOUT_INT, ~0ull);
9475 }
9476 for (i = 0; i < CCE_NUM_INT_MAP_CSRS; i++)
9477 write_csr(dd, CCE_INT_MAP, 0);
9478 for (i = 0; i < CCE_NUM_INT_CSRS; i++) {
9479 /* CCE_INT_STATUS read-only */
9480 write_csr(dd, CCE_INT_MASK + (8 * i), 0);
9481 write_csr(dd, CCE_INT_CLEAR + (8 * i), ~0ull);
9482 /* CCE_INT_FORCE leave alone */
9483 /* CCE_INT_BLOCKED read-only */
9484 }
9485 for (i = 0; i < CCE_NUM_32_BIT_INT_COUNTERS; i++)
9486 write_csr(dd, CCE_INT_COUNTER_ARRAY32 + (8 * i), 0);
9487}
9488
9489/* set ASIC CSRs to chip reset defaults */
9490static void reset_asic_csrs(struct hfi1_devdata *dd)
9491{
9492	int i;
9493
9494 /*
9495 * If the HFIs are shared between separate nodes or VMs,
9496 * then more will need to be done here. One idea is a module
9497 * parameter that returns early, letting the first power-on or
9498 * a known first load do the reset and blocking all others.
9499 */
9500
9501	if (!(dd->flags & HFI1_DO_INIT_ASIC))
9502		return;
9503
9504 if (dd->icode != ICODE_FPGA_EMULATION) {
9505 /* emulation does not have an SBus - leave these alone */
9506 /*
9507 * All writes to ASIC_CFG_SBUS_REQUEST do something.
9508 * Notes:
9509 * o The reset is not zero if aimed at the core. See the
9510 * SBus documentation for details.
9511 * o If the SBus firmware has been updated (e.g. by the BIOS),
9512 * will the reset revert that?
9513 */
9514 /* ASIC_CFG_SBUS_REQUEST leave alone */
9515 write_csr(dd, ASIC_CFG_SBUS_EXECUTE, 0);
9516 }
9517 /* ASIC_SBUS_RESULT read-only */
9518 write_csr(dd, ASIC_STS_SBUS_COUNTERS, 0);
9519 for (i = 0; i < ASIC_NUM_SCRATCH; i++)
9520 write_csr(dd, ASIC_CFG_SCRATCH + (8 * i), 0);
9521 write_csr(dd, ASIC_CFG_MUTEX, 0); /* this will clear it */
9522
9523	/* We might want to retain this state across FLR if we ever use it */
9524	write_csr(dd, ASIC_CFG_DRV_STR, 0);
9525
9526	/* ASIC_CFG_THERM_POLL_EN leave alone */
9527	/* ASIC_STS_THERM read-only */
9528 /* ASIC_CFG_RESET leave alone */
9529
9530 write_csr(dd, ASIC_PCIE_SD_HOST_CMD, 0);
9531 /* ASIC_PCIE_SD_HOST_STATUS read-only */
9532 write_csr(dd, ASIC_PCIE_SD_INTRPT_DATA_CODE, 0);
9533 write_csr(dd, ASIC_PCIE_SD_INTRPT_ENABLE, 0);
9534 /* ASIC_PCIE_SD_INTRPT_PROGRESS read-only */
9535 write_csr(dd, ASIC_PCIE_SD_INTRPT_STATUS, ~0ull); /* clear */
9536 /* ASIC_HFI0_PCIE_SD_INTRPT_RSPD_DATA read-only */
9537 /* ASIC_HFI1_PCIE_SD_INTRPT_RSPD_DATA read-only */
9538 for (i = 0; i < 16; i++)
9539 write_csr(dd, ASIC_PCIE_SD_INTRPT_LIST + (8 * i), 0);
9540
9541 /* ASIC_GPIO_IN read-only */
9542 write_csr(dd, ASIC_GPIO_OE, 0);
9543 write_csr(dd, ASIC_GPIO_INVERT, 0);
9544 write_csr(dd, ASIC_GPIO_OUT, 0);
9545 write_csr(dd, ASIC_GPIO_MASK, 0);
9546 /* ASIC_GPIO_STATUS read-only */
9547 write_csr(dd, ASIC_GPIO_CLEAR, ~0ull);
9548 /* ASIC_GPIO_FORCE leave alone */
9549
9550 /* ASIC_QSFP1_IN read-only */
9551 write_csr(dd, ASIC_QSFP1_OE, 0);
9552 write_csr(dd, ASIC_QSFP1_INVERT, 0);
9553 write_csr(dd, ASIC_QSFP1_OUT, 0);
9554 write_csr(dd, ASIC_QSFP1_MASK, 0);
9555 /* ASIC_QSFP1_STATUS read-only */
9556 write_csr(dd, ASIC_QSFP1_CLEAR, ~0ull);
9557 /* ASIC_QSFP1_FORCE leave alone */
9558
9559 /* ASIC_QSFP2_IN read-only */
9560 write_csr(dd, ASIC_QSFP2_OE, 0);
9561 write_csr(dd, ASIC_QSFP2_INVERT, 0);
9562 write_csr(dd, ASIC_QSFP2_OUT, 0);
9563 write_csr(dd, ASIC_QSFP2_MASK, 0);
9564 /* ASIC_QSFP2_STATUS read-only */
9565 write_csr(dd, ASIC_QSFP2_CLEAR, ~0ull);
9566 /* ASIC_QSFP2_FORCE leave alone */
9567
9568 write_csr(dd, ASIC_EEP_CTL_STAT, ASIC_EEP_CTL_STAT_RESETCSR);
9569 /* this also writes a NOP command, clearing paging mode */
9570 write_csr(dd, ASIC_EEP_ADDR_CMD, 0);
9571 write_csr(dd, ASIC_EEP_DATA, 0);
9572}
9573
9574/* set MISC CSRs to chip reset defaults */
9575static void reset_misc_csrs(struct hfi1_devdata *dd)
9576{
9577 int i;
9578
9579 for (i = 0; i < 32; i++) {
9580 write_csr(dd, MISC_CFG_RSA_R2 + (8 * i), 0);
9581 write_csr(dd, MISC_CFG_RSA_SIGNATURE + (8 * i), 0);
9582 write_csr(dd, MISC_CFG_RSA_MODULUS + (8 * i), 0);
9583 }
9584	/* MISC_CFG_SHA_PRELOAD leave alone - always reads 0 and can
9585	   only be written in 128-byte chunks */
9586 /* init RSA engine to clear lingering errors */
9587 write_csr(dd, MISC_CFG_RSA_CMD, 1);
9588 write_csr(dd, MISC_CFG_RSA_MU, 0);
9589 write_csr(dd, MISC_CFG_FW_CTRL, 0);
9590 /* MISC_STS_8051_DIGEST read-only */
9591 /* MISC_STS_SBM_DIGEST read-only */
9592 /* MISC_STS_PCIE_DIGEST read-only */
9593 /* MISC_STS_FAB_DIGEST read-only */
9594 /* MISC_ERR_STATUS read-only */
9595 write_csr(dd, MISC_ERR_MASK, 0);
9596 write_csr(dd, MISC_ERR_CLEAR, ~0ull);
9597 /* MISC_ERR_FORCE leave alone */
9598}
9599
9600/* set TXE CSRs to chip reset defaults */
9601static void reset_txe_csrs(struct hfi1_devdata *dd)
9602{
9603 int i;
9604
9605 /*
9606 * TXE Kernel CSRs
9607 */
9608 write_csr(dd, SEND_CTRL, 0);
9609 __cm_reset(dd, 0); /* reset CM internal state */
9610 /* SEND_CONTEXTS read-only */
9611 /* SEND_DMA_ENGINES read-only */
9612 /* SEND_PIO_MEM_SIZE read-only */
9613 /* SEND_DMA_MEM_SIZE read-only */
9614 write_csr(dd, SEND_HIGH_PRIORITY_LIMIT, 0);
9615 pio_reset_all(dd); /* SEND_PIO_INIT_CTXT */
9616 /* SEND_PIO_ERR_STATUS read-only */
9617 write_csr(dd, SEND_PIO_ERR_MASK, 0);
9618 write_csr(dd, SEND_PIO_ERR_CLEAR, ~0ull);
9619 /* SEND_PIO_ERR_FORCE leave alone */
9620 /* SEND_DMA_ERR_STATUS read-only */
9621 write_csr(dd, SEND_DMA_ERR_MASK, 0);
9622 write_csr(dd, SEND_DMA_ERR_CLEAR, ~0ull);
9623 /* SEND_DMA_ERR_FORCE leave alone */
9624 /* SEND_EGRESS_ERR_STATUS read-only */
9625 write_csr(dd, SEND_EGRESS_ERR_MASK, 0);
9626 write_csr(dd, SEND_EGRESS_ERR_CLEAR, ~0ull);
9627 /* SEND_EGRESS_ERR_FORCE leave alone */
9628 write_csr(dd, SEND_BTH_QP, 0);
9629 write_csr(dd, SEND_STATIC_RATE_CONTROL, 0);
9630 write_csr(dd, SEND_SC2VLT0, 0);
9631 write_csr(dd, SEND_SC2VLT1, 0);
9632 write_csr(dd, SEND_SC2VLT2, 0);
9633 write_csr(dd, SEND_SC2VLT3, 0);
9634 write_csr(dd, SEND_LEN_CHECK0, 0);
9635 write_csr(dd, SEND_LEN_CHECK1, 0);
9636 /* SEND_ERR_STATUS read-only */
9637 write_csr(dd, SEND_ERR_MASK, 0);
9638 write_csr(dd, SEND_ERR_CLEAR, ~0ull);
9639 /* SEND_ERR_FORCE read-only */
9640 for (i = 0; i < VL_ARB_LOW_PRIO_TABLE_SIZE; i++)
9641 write_csr(dd, SEND_LOW_PRIORITY_LIST + (8*i), 0);
9642 for (i = 0; i < VL_ARB_HIGH_PRIO_TABLE_SIZE; i++)
9643 write_csr(dd, SEND_HIGH_PRIORITY_LIST + (8*i), 0);
9644 for (i = 0; i < dd->chip_send_contexts/NUM_CONTEXTS_PER_SET; i++)
9645 write_csr(dd, SEND_CONTEXT_SET_CTRL + (8*i), 0);
9646 for (i = 0; i < TXE_NUM_32_BIT_COUNTER; i++)
9647 write_csr(dd, SEND_COUNTER_ARRAY32 + (8*i), 0);
9648 for (i = 0; i < TXE_NUM_64_BIT_COUNTER; i++)
9649 write_csr(dd, SEND_COUNTER_ARRAY64 + (8*i), 0);
9650 write_csr(dd, SEND_CM_CTRL, SEND_CM_CTRL_RESETCSR);
9651 write_csr(dd, SEND_CM_GLOBAL_CREDIT,
9652 SEND_CM_GLOBAL_CREDIT_RESETCSR);
9653 /* SEND_CM_CREDIT_USED_STATUS read-only */
9654 write_csr(dd, SEND_CM_TIMER_CTRL, 0);
9655 write_csr(dd, SEND_CM_LOCAL_AU_TABLE0_TO3, 0);
9656 write_csr(dd, SEND_CM_LOCAL_AU_TABLE4_TO7, 0);
9657 write_csr(dd, SEND_CM_REMOTE_AU_TABLE0_TO3, 0);
9658 write_csr(dd, SEND_CM_REMOTE_AU_TABLE4_TO7, 0);
9659 for (i = 0; i < TXE_NUM_DATA_VL; i++)
9660 write_csr(dd, SEND_CM_CREDIT_VL + (8*i), 0);
9661 write_csr(dd, SEND_CM_CREDIT_VL15, 0);
9662 /* SEND_CM_CREDIT_USED_VL read-only */
9663 /* SEND_CM_CREDIT_USED_VL15 read-only */
9664 /* SEND_EGRESS_CTXT_STATUS read-only */
9665 /* SEND_EGRESS_SEND_DMA_STATUS read-only */
9666 write_csr(dd, SEND_EGRESS_ERR_INFO, ~0ull);
9667 /* SEND_EGRESS_ERR_INFO read-only */
9668 /* SEND_EGRESS_ERR_SOURCE read-only */
9669
9670 /*
9671 * TXE Per-Context CSRs
9672 */
9673 for (i = 0; i < dd->chip_send_contexts; i++) {
9674 write_kctxt_csr(dd, i, SEND_CTXT_CTRL, 0);
9675 write_kctxt_csr(dd, i, SEND_CTXT_CREDIT_CTRL, 0);
9676 write_kctxt_csr(dd, i, SEND_CTXT_CREDIT_RETURN_ADDR, 0);
9677 write_kctxt_csr(dd, i, SEND_CTXT_CREDIT_FORCE, 0);
9678 write_kctxt_csr(dd, i, SEND_CTXT_ERR_MASK, 0);
9679 write_kctxt_csr(dd, i, SEND_CTXT_ERR_CLEAR, ~0ull);
9680 write_kctxt_csr(dd, i, SEND_CTXT_CHECK_ENABLE, 0);
9681 write_kctxt_csr(dd, i, SEND_CTXT_CHECK_VL, 0);
9682 write_kctxt_csr(dd, i, SEND_CTXT_CHECK_JOB_KEY, 0);
9683 write_kctxt_csr(dd, i, SEND_CTXT_CHECK_PARTITION_KEY, 0);
9684 write_kctxt_csr(dd, i, SEND_CTXT_CHECK_SLID, 0);
9685 write_kctxt_csr(dd, i, SEND_CTXT_CHECK_OPCODE, 0);
9686 }
9687
9688 /*
9689 * TXE Per-SDMA CSRs
9690 */
9691 for (i = 0; i < dd->chip_sdma_engines; i++) {
9692 write_kctxt_csr(dd, i, SEND_DMA_CTRL, 0);
9693 /* SEND_DMA_STATUS read-only */
9694 write_kctxt_csr(dd, i, SEND_DMA_BASE_ADDR, 0);
9695 write_kctxt_csr(dd, i, SEND_DMA_LEN_GEN, 0);
9696 write_kctxt_csr(dd, i, SEND_DMA_TAIL, 0);
9697 /* SEND_DMA_HEAD read-only */
9698 write_kctxt_csr(dd, i, SEND_DMA_HEAD_ADDR, 0);
9699 write_kctxt_csr(dd, i, SEND_DMA_PRIORITY_THLD, 0);
9700 /* SEND_DMA_IDLE_CNT read-only */
9701 write_kctxt_csr(dd, i, SEND_DMA_RELOAD_CNT, 0);
9702 write_kctxt_csr(dd, i, SEND_DMA_DESC_CNT, 0);
9703 /* SEND_DMA_DESC_FETCHED_CNT read-only */
9704 /* SEND_DMA_ENG_ERR_STATUS read-only */
9705 write_kctxt_csr(dd, i, SEND_DMA_ENG_ERR_MASK, 0);
9706 write_kctxt_csr(dd, i, SEND_DMA_ENG_ERR_CLEAR, ~0ull);
9707 /* SEND_DMA_ENG_ERR_FORCE leave alone */
9708 write_kctxt_csr(dd, i, SEND_DMA_CHECK_ENABLE, 0);
9709 write_kctxt_csr(dd, i, SEND_DMA_CHECK_VL, 0);
9710 write_kctxt_csr(dd, i, SEND_DMA_CHECK_JOB_KEY, 0);
9711 write_kctxt_csr(dd, i, SEND_DMA_CHECK_PARTITION_KEY, 0);
9712 write_kctxt_csr(dd, i, SEND_DMA_CHECK_SLID, 0);
9713 write_kctxt_csr(dd, i, SEND_DMA_CHECK_OPCODE, 0);
9714 write_kctxt_csr(dd, i, SEND_DMA_MEMORY, 0);
9715 }
9716}
9717
9718/*
9719 * Expect on entry:
9720 * o Packet ingress is disabled, i.e. RcvCtrl.RcvPortEnable == 0
9721 */
9722static void init_rbufs(struct hfi1_devdata *dd)
9723{
9724 u64 reg;
9725 int count;
9726
9727 /*
9728 * Wait for DMA to stop: RxRbufPktPending and RxPktInProgress are
9729 * clear.
9730 */
9731 count = 0;
9732 while (1) {
9733 reg = read_csr(dd, RCV_STATUS);
9734 if ((reg & (RCV_STATUS_RX_RBUF_PKT_PENDING_SMASK
9735 | RCV_STATUS_RX_PKT_IN_PROGRESS_SMASK)) == 0)
9736 break;
9737 /*
9738 * Give up after 1ms - maximum wait time.
9739 *
9740 * RBuf size is 148KiB. Slowest possible is PCIe Gen1 x1 at
9741 * 250MB/s bandwidth. Lower rate to 66% for overhead to get:
9742 * 148 KB / (66% * 250MB/s) = 920us
9743 */
9744 if (count++ > 500) {
9745 dd_dev_err(dd,
9746 "%s: in-progress DMA not clearing: RcvStatus 0x%llx, continuing\n",
9747 __func__, reg);
9748 break;
9749 }
9750 udelay(2); /* do not busy-wait the CSR */
9751 }
9752
9753 /* start the init - expect RcvCtrl to be 0 */
9754 write_csr(dd, RCV_CTRL, RCV_CTRL_RX_RBUF_INIT_SMASK);
9755
9756 /*
9757	 * Read to force the write of RcvCtrl.RxRbufInit. There is a brief
9758	 * period after the write before RcvStatus.RxRbufInitDone is valid.
9759	 * The delay in the first run through the loop below is sufficient and
9760	 * required before the first read of RcvStatus.RxRbufInitDone.
9761 */
9762 read_csr(dd, RCV_CTRL);
9763
9764 /* wait for the init to finish */
9765 count = 0;
9766 while (1) {
9767 /* delay is required first time through - see above */
9768 udelay(2); /* do not busy-wait the CSR */
9769 reg = read_csr(dd, RCV_STATUS);
9770 if (reg & (RCV_STATUS_RX_RBUF_INIT_DONE_SMASK))
9771 break;
9772
9773 /* give up after 100us - slowest possible at 33MHz is 73us */
9774 if (count++ > 50) {
9775 dd_dev_err(dd,
9776 "%s: RcvStatus.RxRbufInit not set, continuing\n",
9777 __func__);
9778 break;
9779 }
9780 }
9781}
9782
9783/* set RXE CSRs to chip reset defaults */
9784static void reset_rxe_csrs(struct hfi1_devdata *dd)
9785{
9786 int i, j;
9787
9788 /*
9789 * RXE Kernel CSRs
9790 */
9791 write_csr(dd, RCV_CTRL, 0);
9792 init_rbufs(dd);
9793 /* RCV_STATUS read-only */
9794 /* RCV_CONTEXTS read-only */
9795 /* RCV_ARRAY_CNT read-only */
9796 /* RCV_BUF_SIZE read-only */
9797 write_csr(dd, RCV_BTH_QP, 0);
9798 write_csr(dd, RCV_MULTICAST, 0);
9799 write_csr(dd, RCV_BYPASS, 0);
9800 write_csr(dd, RCV_VL15, 0);
9801 /* this is a clear-down */
9802 write_csr(dd, RCV_ERR_INFO,
9803 RCV_ERR_INFO_RCV_EXCESS_BUFFER_OVERRUN_SMASK);
9804 /* RCV_ERR_STATUS read-only */
9805 write_csr(dd, RCV_ERR_MASK, 0);
9806 write_csr(dd, RCV_ERR_CLEAR, ~0ull);
9807 /* RCV_ERR_FORCE leave alone */
9808 for (i = 0; i < 32; i++)
9809 write_csr(dd, RCV_QP_MAP_TABLE + (8 * i), 0);
9810 for (i = 0; i < 4; i++)
9811 write_csr(dd, RCV_PARTITION_KEY + (8 * i), 0);
9812 for (i = 0; i < RXE_NUM_32_BIT_COUNTERS; i++)
9813 write_csr(dd, RCV_COUNTER_ARRAY32 + (8 * i), 0);
9814 for (i = 0; i < RXE_NUM_64_BIT_COUNTERS; i++)
9815 write_csr(dd, RCV_COUNTER_ARRAY64 + (8 * i), 0);
9816 for (i = 0; i < RXE_NUM_RSM_INSTANCES; i++) {
9817 write_csr(dd, RCV_RSM_CFG + (8 * i), 0);
9818 write_csr(dd, RCV_RSM_SELECT + (8 * i), 0);
9819 write_csr(dd, RCV_RSM_MATCH + (8 * i), 0);
9820 }
9821 for (i = 0; i < 32; i++)
9822 write_csr(dd, RCV_RSM_MAP_TABLE + (8 * i), 0);
9823
9824 /*
9825 * RXE Kernel and User Per-Context CSRs
9826 */
9827 for (i = 0; i < dd->chip_rcv_contexts; i++) {
9828 /* kernel */
9829 write_kctxt_csr(dd, i, RCV_CTXT_CTRL, 0);
9830 /* RCV_CTXT_STATUS read-only */
9831 write_kctxt_csr(dd, i, RCV_EGR_CTRL, 0);
9832 write_kctxt_csr(dd, i, RCV_TID_CTRL, 0);
9833 write_kctxt_csr(dd, i, RCV_KEY_CTRL, 0);
9834 write_kctxt_csr(dd, i, RCV_HDR_ADDR, 0);
9835 write_kctxt_csr(dd, i, RCV_HDR_CNT, 0);
9836 write_kctxt_csr(dd, i, RCV_HDR_ENT_SIZE, 0);
9837 write_kctxt_csr(dd, i, RCV_HDR_SIZE, 0);
9838 write_kctxt_csr(dd, i, RCV_HDR_TAIL_ADDR, 0);
9839 write_kctxt_csr(dd, i, RCV_AVAIL_TIME_OUT, 0);
9840 write_kctxt_csr(dd, i, RCV_HDR_OVFL_CNT, 0);
9841
9842 /* user */
9843 /* RCV_HDR_TAIL read-only */
9844 write_uctxt_csr(dd, i, RCV_HDR_HEAD, 0);
9845 /* RCV_EGR_INDEX_TAIL read-only */
9846 write_uctxt_csr(dd, i, RCV_EGR_INDEX_HEAD, 0);
9847 /* RCV_EGR_OFFSET_TAIL read-only */
9848 for (j = 0; j < RXE_NUM_TID_FLOWS; j++) {
9849 write_uctxt_csr(dd, i, RCV_TID_FLOW_TABLE + (8 * j),
9850 0);
9851 }
9852 }
9853}
9854
9855/*
9856 * Set sc2vl tables.
9857 *
9858 * They power on to zeros, so to avoid send context errors
9859 * they need to be set:
9860 *
9861 * SC 0-7 -> VL 0-7 (respectively)
9862 * SC 15 -> VL 15
9863 * otherwise
9864 * -> VL 0
9865 */
9866static void init_sc2vl_tables(struct hfi1_devdata *dd)
9867{
9868 int i;
9869 /* init per architecture spec, constrained by hardware capability */
9870
9871 /* HFI maps sent packets */
9872 write_csr(dd, SEND_SC2VLT0, SC2VL_VAL(
9873 0,
9874 0, 0, 1, 1,
9875 2, 2, 3, 3,
9876 4, 4, 5, 5,
9877 6, 6, 7, 7));
9878 write_csr(dd, SEND_SC2VLT1, SC2VL_VAL(
9879 1,
9880 8, 0, 9, 0,
9881 10, 0, 11, 0,
9882 12, 0, 13, 0,
9883 14, 0, 15, 15));
9884 write_csr(dd, SEND_SC2VLT2, SC2VL_VAL(
9885 2,
9886 16, 0, 17, 0,
9887 18, 0, 19, 0,
9888 20, 0, 21, 0,
9889 22, 0, 23, 0));
9890 write_csr(dd, SEND_SC2VLT3, SC2VL_VAL(
9891 3,
9892 24, 0, 25, 0,
9893 26, 0, 27, 0,
9894 28, 0, 29, 0,
9895 30, 0, 31, 0));
9896
9897 /* DC maps received packets */
9898 write_csr(dd, DCC_CFG_SC_VL_TABLE_15_0, DC_SC_VL_VAL(
9899 15_0,
9900 0, 0, 1, 1, 2, 2, 3, 3, 4, 4, 5, 5, 6, 6, 7, 7,
9901 8, 0, 9, 0, 10, 0, 11, 0, 12, 0, 13, 0, 14, 0, 15, 15));
9902 write_csr(dd, DCC_CFG_SC_VL_TABLE_31_16, DC_SC_VL_VAL(
9903 31_16,
9904 16, 0, 17, 0, 18, 0, 19, 0, 20, 0, 21, 0, 22, 0, 23, 0,
9905 24, 0, 25, 0, 26, 0, 27, 0, 28, 0, 29, 0, 30, 0, 31, 0));
9906
9907 /* initialize the cached sc2vl values consistently with h/w */
9908 for (i = 0; i < 32; i++) {
9909 if (i < 8 || i == 15)
9910 *((u8 *)(dd->sc2vl) + i) = (u8)i;
9911 else
9912 *((u8 *)(dd->sc2vl) + i) = 0;
9913 }
9914}
9915
9916/*
9917 * Read chip sizes and then reset parts to sane, disabled, values. We cannot
9918 * depend on the chip going through a power-on reset - a driver may be loaded
9919 * and unloaded many times.
9920 *
9921 * Do not write any CSR values to the chip in this routine - there may be
9922 * a reset following the (possible) FLR in this routine.
9923 *
9924 */
9925static void init_chip(struct hfi1_devdata *dd)
9926{
9927 int i;
9928
9929 /*
9930 * Put the HFI CSRs in a known state.
9931 * Combine this with a DC reset.
9932 *
9933 * Stop the device from doing anything while we do a
9934 * reset. We know there are no other active users of
9935	 * the device since we are now in charge. Turn off
9936	 * all outbound and inbound traffic and make sure
9937 * the device does not generate any interrupts.
9938 */
9939
9940 /* disable send contexts and SDMA engines */
9941 write_csr(dd, SEND_CTRL, 0);
9942 for (i = 0; i < dd->chip_send_contexts; i++)
9943 write_kctxt_csr(dd, i, SEND_CTXT_CTRL, 0);
9944 for (i = 0; i < dd->chip_sdma_engines; i++)
9945 write_kctxt_csr(dd, i, SEND_DMA_CTRL, 0);
9946 /* disable port (turn off RXE inbound traffic) and contexts */
9947 write_csr(dd, RCV_CTRL, 0);
9948 for (i = 0; i < dd->chip_rcv_contexts; i++)
9949 write_csr(dd, RCV_CTXT_CTRL, 0);
9950 /* mask all interrupt sources */
9951 for (i = 0; i < CCE_NUM_INT_CSRS; i++)
9952 write_csr(dd, CCE_INT_MASK + (8*i), 0ull);
9953
9954 /*
9955 * DC Reset: do a full DC reset before the register clear.
9956 * A recommended length of time to hold is one CSR read,
9957 * so reread the CceDcCtrl. Then, hold the DC in reset
9958 * across the clear.
9959 */
9960 write_csr(dd, CCE_DC_CTRL, CCE_DC_CTRL_DC_RESET_SMASK);
9961 (void) read_csr(dd, CCE_DC_CTRL);
9962
9963 if (use_flr) {
9964 /*
9965 * A FLR will reset the SPC core and part of the PCIe.
9966 * The parts that need to be restored have already been
9967 * saved.
9968 */
9969 dd_dev_info(dd, "Resetting CSRs with FLR\n");
9970
9971 /* do the FLR, the DC reset will remain */
9972 hfi1_pcie_flr(dd);
9973
9974 /* restore command and BARs */
9975 restore_pci_variables(dd);
9976
9977 if (is_a0(dd)) {
9978 dd_dev_info(dd, "Resetting CSRs with FLR\n");
9979 hfi1_pcie_flr(dd);
9980 restore_pci_variables(dd);
9981 }
9982
9983		reset_asic_csrs(dd);
9984	} else {
9985 dd_dev_info(dd, "Resetting CSRs with writes\n");
9986 reset_cce_csrs(dd);
9987 reset_txe_csrs(dd);
9988 reset_rxe_csrs(dd);
9989 reset_asic_csrs(dd);
9990 reset_misc_csrs(dd);
9991 }
9992 /* clear the DC reset */
9993 write_csr(dd, CCE_DC_CTRL, 0);
9994
9995	/* Set the LED off */
9996 if (is_a0(dd))
9997 setextled(dd, 0);
9998 /*
9999 * Clear the QSFP reset.
10000	 * An FLR enforces a 0 on all out pins. The driver does not touch
10001	 * ASIC_QSFPn_OUT otherwise. This leaves RESET_N low, keeping
10002	 * anything plugged in constantly in reset if it pays attention
10003	 * to RESET_N. Prime examples of this are optical cables.
10004	 * Set all pins high. I2CCLK and I2CDAT will change per
10005	 * direction, and INT_N and MODPRS_N are input only and their
10006	 * value is ignored.
10007	 */
10008	write_csr(dd, ASIC_QSFP1_OUT, 0x1f);
10009	write_csr(dd, ASIC_QSFP2_OUT, 0x1f);
10010}
10011
10012static void init_early_variables(struct hfi1_devdata *dd)
10013{
10014 int i;
10015
10016 /* assign link credit variables */
10017 dd->vau = CM_VAU;
10018 dd->link_credits = CM_GLOBAL_CREDITS;
10019 if (is_a0(dd))
10020 dd->link_credits--;
10021 dd->vcu = cu_to_vcu(hfi1_cu);
10022 /* enough room for 8 MAD packets plus header - 17K */
10023 dd->vl15_init = (8 * (2048 + 128)) / vau_to_au(dd->vau);
10024 if (dd->vl15_init > dd->link_credits)
10025 dd->vl15_init = dd->link_credits;
10026
10027 write_uninitialized_csrs_and_memories(dd);
10028
10029 if (HFI1_CAP_IS_KSET(PKEY_CHECK))
10030 for (i = 0; i < dd->num_pports; i++) {
10031 struct hfi1_pportdata *ppd = &dd->pport[i];
10032
10033 set_partition_keys(ppd);
10034 }
10035 init_sc2vl_tables(dd);
10036}
10037
10038static void init_kdeth_qp(struct hfi1_devdata *dd)
10039{
10040 /* user changed the KDETH_QP */
10041 if (kdeth_qp != 0 && kdeth_qp >= 0xff) {
10042 /* out of range or illegal value */
10043 dd_dev_err(dd, "Invalid KDETH queue pair prefix, ignoring");
10044 kdeth_qp = 0;
10045 }
10046 if (kdeth_qp == 0) /* not set, or failed range check */
10047 kdeth_qp = DEFAULT_KDETH_QP;
10048
10049 write_csr(dd, SEND_BTH_QP,
10050 (kdeth_qp & SEND_BTH_QP_KDETH_QP_MASK)
10051 << SEND_BTH_QP_KDETH_QP_SHIFT);
10052
10053 write_csr(dd, RCV_BTH_QP,
10054 (kdeth_qp & RCV_BTH_QP_KDETH_QP_MASK)
10055 << RCV_BTH_QP_KDETH_QP_SHIFT);
10056}
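
/*
 * Illustration only, assuming the prefix lands in the top byte of a
 * 24-bit QPN (the exact placement is defined by the KDETH_QP MASK/SHIFT
 * macros used above): a prefix of 0x80 would then cover QPNs 0x800000
 * through 0x80ffff on both the send and receive sides.
 */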
10057
10058/**
10059 * init_qpmap_table
10060 * @dd - device data
10061 * @first_ctxt - first context
10062 * @last_ctxt - first context
10063 *
10064 * This return sets the qpn mapping table that
10065 * is indexed by qpn[8:1].
10066 *
10067 * The routine will round robin the 256 settings
10068 * from first_ctxt to last_ctxt.
10069 *
10070 * The first/last looks ahead to having specialized
10071 * receive contexts for mgmt and bypass. Normal
10072 * verbs traffic will be assumed to be on a range
10073 * of receive contexts.
10074 */
10075static void init_qpmap_table(struct hfi1_devdata *dd,
10076 u32 first_ctxt,
10077 u32 last_ctxt)
10078{
10079 u64 reg = 0;
10080 u64 regno = RCV_QP_MAP_TABLE;
10081 int i;
10082 u64 ctxt = first_ctxt;
10083
10084 for (i = 0; i < 256;) {
10085		reg |= ctxt << (8 * (i % 8));
10086 i++;
10087 ctxt++;
10088 if (ctxt > last_ctxt)
10089 ctxt = first_ctxt;
10090 if (i % 8 == 0) {
10091 write_csr(dd, regno, reg);
10092 reg = 0;
10093 regno += 8;
10094 }
10095 }
10096 if (i % 8)
10097 write_csr(dd, regno, reg);
10098
10099 add_rcvctrl(dd, RCV_CTRL_RCV_QP_MAP_ENABLE_SMASK
10100 | RCV_CTRL_RCV_BYPASS_ENABLE_SMASK);
10101}
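
/*
 * Illustrative sketch (hypothetical helper, not used by the driver):
 * given a QPN, the RcvQPMapTable CSR and byte lane the packing above
 * targets.  The table is indexed by qpn[8:1], eight entries per CSR.
 */
static inline void example_qpmap_location(u32 qpn, u32 *csr, u32 *lane)
{
        u32 idx = (qpn >> 1) & 0xff;            /* qpn[8:1] selects the entry */

        *csr = RCV_QP_MAP_TABLE + 8 * (idx / 8);        /* owning 64-bit CSR */
        *lane = idx % 8;                                /* byte within that CSR */
}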
10102
10103/**
10104 * init_qos - init RX qos
10105 * @dd - device data
10106 * @first_context
10107 *
10108 * This routine initializes Rule 0 and the
10109 * RSM map table to implement qos.
10110 *
10111 * If all of the limit tests succeed,
10112 * qos is applied based on the array
10113 * interpretation of krcvqs where
10114 * entry 0 is VL0.
10115 *
10116 * The number of vl bits (n) and the number of qpn
10117 * bits (m) are computed to feed both the RSM map table
10118 * and the single rule.
10119 *
10120 */
10121static void init_qos(struct hfi1_devdata *dd, u32 first_ctxt)
10122{
10123 u8 max_by_vl = 0;
10124 unsigned qpns_per_vl, ctxt, i, qpn, n = 1, m;
10125 u64 *rsmmap;
10126 u64 reg;
10127 u8 rxcontext = is_a0(dd) ? 0 : 0xff; /* 0 is default if a0 ver. */
10128
10129 /* validate */
10130 if (dd->n_krcv_queues <= MIN_KERNEL_KCTXTS ||
10131 num_vls == 1 ||
10132 krcvqsset <= 1)
10133 goto bail;
10134 for (i = 0; i < min_t(unsigned, num_vls, krcvqsset); i++)
10135 if (krcvqs[i] > max_by_vl)
10136 max_by_vl = krcvqs[i];
10137 if (max_by_vl > 32)
10138 goto bail;
10139 qpns_per_vl = __roundup_pow_of_two(max_by_vl);
10140 /* determine bits vl */
10141 n = ilog2(num_vls);
10142 /* determine bits for qpn */
10143 m = ilog2(qpns_per_vl);
10144 if ((m + n) > 7)
10145 goto bail;
10146 if (num_vls * qpns_per_vl > dd->chip_rcv_contexts)
10147 goto bail;
10148 rsmmap = kmalloc_array(NUM_MAP_REGS, sizeof(u64), GFP_KERNEL);
10149 memset(rsmmap, rxcontext, NUM_MAP_REGS * sizeof(u64));
10150 /* init the local copy of the table */
10151 for (i = 0, ctxt = first_ctxt; i < num_vls; i++) {
10152 unsigned tctxt;
10153
10154 for (qpn = 0, tctxt = ctxt;
10155 krcvqs[i] && qpn < qpns_per_vl; qpn++) {
10156 unsigned idx, regoff, regidx;
10157
10158 /* generate index <= 128 */
10159 idx = (qpn << n) ^ i;
10160 regoff = (idx % 8) * 8;
10161 regidx = idx / 8;
10162 reg = rsmmap[regidx];
10163 /* replace 0xff with context number */
10164 reg &= ~(RCV_RSM_MAP_TABLE_RCV_CONTEXT_A_MASK
10165 << regoff);
10166 reg |= (u64)(tctxt++) << regoff;
10167 rsmmap[regidx] = reg;
10168 if (tctxt == ctxt + krcvqs[i])
10169 tctxt = ctxt;
10170 }
10171 ctxt += krcvqs[i];
10172 }
10173 /* flush cached copies to chip */
10174 for (i = 0; i < NUM_MAP_REGS; i++)
10175 write_csr(dd, RCV_RSM_MAP_TABLE + (8 * i), rsmmap[i]);
10176 /* add rule0 */
10177 write_csr(dd, RCV_RSM_CFG /* + (8 * 0) */,
10178 RCV_RSM_CFG_ENABLE_OR_CHAIN_RSM0_MASK
10179 << RCV_RSM_CFG_ENABLE_OR_CHAIN_RSM0_SHIFT |
10180 2ull << RCV_RSM_CFG_PACKET_TYPE_SHIFT);
10181 write_csr(dd, RCV_RSM_SELECT /* + (8 * 0) */,
10182 LRH_BTH_MATCH_OFFSET
10183 << RCV_RSM_SELECT_FIELD1_OFFSET_SHIFT |
10184 LRH_SC_MATCH_OFFSET << RCV_RSM_SELECT_FIELD2_OFFSET_SHIFT |
10185 LRH_SC_SELECT_OFFSET << RCV_RSM_SELECT_INDEX1_OFFSET_SHIFT |
10186 ((u64)n) << RCV_RSM_SELECT_INDEX1_WIDTH_SHIFT |
10187 QPN_SELECT_OFFSET << RCV_RSM_SELECT_INDEX2_OFFSET_SHIFT |
10188 ((u64)m + (u64)n) << RCV_RSM_SELECT_INDEX2_WIDTH_SHIFT);
10189 write_csr(dd, RCV_RSM_MATCH /* + (8 * 0) */,
10190 LRH_BTH_MASK << RCV_RSM_MATCH_MASK1_SHIFT |
10191 LRH_BTH_VALUE << RCV_RSM_MATCH_VALUE1_SHIFT |
10192 LRH_SC_MASK << RCV_RSM_MATCH_MASK2_SHIFT |
10193 LRH_SC_VALUE << RCV_RSM_MATCH_VALUE2_SHIFT);
10194 /* Enable RSM */
10195 add_rcvctrl(dd, RCV_CTRL_RCV_RSM_ENABLE_SMASK);
10196 kfree(rsmmap);
10197	/* map everything else to first context */
10198	init_qpmap_table(dd, FIRST_KERNEL_KCTXT, MIN_KERNEL_KCTXTS - 1);
10199	dd->qos_shift = n + 1;
10200	return;
10201bail:
10202	dd->qos_shift = 1;
10203	init_qpmap_table(dd, FIRST_KERNEL_KCTXT, dd->n_krcv_queues - 1);
10204}
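
/*
 * Worked example of the bit-width math above (hypothetical settings,
 * illustration only): with num_vls = 8 and a largest krcvqs[] entry of
 * 3, qpns_per_vl rounds up to 4, so n = ilog2(8) = 3 VL bits and
 * m = ilog2(4) = 2 QPN bits; m + n = 5 <= 7 and 8 * 4 = 32 context
 * slots must fit in chip_rcv_contexts for the rule to be installed.
 */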
10205
10206static void init_rxe(struct hfi1_devdata *dd)
10207{
10208 /* enable all receive errors */
10209 write_csr(dd, RCV_ERR_MASK, ~0ull);
10210 /* setup QPN map table - start where VL15 context leaves off */
10211 init_qos(
10212 dd,
10213 dd->n_krcv_queues > MIN_KERNEL_KCTXTS ? MIN_KERNEL_KCTXTS : 0);
10214 /*
10215 * make sure RcvCtrl.RcvWcb <= PCIe Device Control
10216 * Register Max_Payload_Size (PCI_EXP_DEVCTL in Linux PCIe config
10217 * space, PciCfgCap2.MaxPayloadSize in HFI). There is only one
10218 * invalid configuration: RcvCtrl.RcvWcb set to its max of 256 and
10219 * Max_PayLoad_Size set to its minimum of 128.
10220 *
10221 * Presently, RcvCtrl.RcvWcb is not modified from its default of 0
10222 * (64 bytes). Max_Payload_Size is possibly modified upward in
10223 * tune_pcie_caps() which is called after this routine.
10224 */
10225}
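/*
 * Illustrative sketch (not part of the driver): one way the PCIe
 * Max_Payload_Size mentioned in the comment above can be read and
 * decoded from config space.  The standard encoding of the field is
 * 128 << field_value bytes.  demo_max_payload_bytes() is a made-up
 * helper name used only for this example.
 */
#if 0	/* example only */
#include <linux/pci.h>

static unsigned int demo_max_payload_bytes(struct pci_dev *pdev)
{
	u16 devctl = 0;

	/* PCI_EXP_DEVCTL bits 7:5 hold Max_Payload_Size */
	pcie_capability_read_word(pdev, PCI_EXP_DEVCTL, &devctl);
	return 128U << ((devctl & PCI_EXP_DEVCTL_PAYLOAD) >> 5);
}
#endif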
10226
10227static void init_other(struct hfi1_devdata *dd)
10228{
10229 /* enable all CCE errors */
10230 write_csr(dd, CCE_ERR_MASK, ~0ull);
10231 /* enable *some* Misc errors */
10232 write_csr(dd, MISC_ERR_MASK, DRIVER_MISC_MASK);
10233 /* enable all DC errors, except LCB */
10234 write_csr(dd, DCC_ERR_FLG_EN, ~0ull);
10235 write_csr(dd, DC_DC8051_ERR_EN, ~0ull);
10236}
10237
10238/*
10239 * Fill out the given AU table using the given CU. A CU is defined in terms
10240 * of AUs. The table is an encoding: given the index, how many AUs does that
10241 * represent?
10242 *
10243 * NOTE: Assumes that the register layout is the same for the
10244 * local and remote tables.
10245 */
10246static void assign_cm_au_table(struct hfi1_devdata *dd, u32 cu,
10247 u32 csr0to3, u32 csr4to7)
10248{
10249 write_csr(dd, csr0to3,
10250 0ull <<
10251 SEND_CM_LOCAL_AU_TABLE0_TO3_LOCAL_AU_TABLE0_SHIFT
10252 | 1ull <<
10253 SEND_CM_LOCAL_AU_TABLE0_TO3_LOCAL_AU_TABLE1_SHIFT
10254 | 2ull * cu <<
10255 SEND_CM_LOCAL_AU_TABLE0_TO3_LOCAL_AU_TABLE2_SHIFT
10256 | 4ull * cu <<
10257 SEND_CM_LOCAL_AU_TABLE0_TO3_LOCAL_AU_TABLE3_SHIFT);
10258 write_csr(dd, csr4to7,
10259 8ull * cu <<
10260 SEND_CM_LOCAL_AU_TABLE4_TO7_LOCAL_AU_TABLE4_SHIFT
10261 | 16ull * cu <<
10262 SEND_CM_LOCAL_AU_TABLE4_TO7_LOCAL_AU_TABLE5_SHIFT
10263 | 32ull * cu <<
10264 SEND_CM_LOCAL_AU_TABLE4_TO7_LOCAL_AU_TABLE6_SHIFT
10265 | 64ull * cu <<
10266 SEND_CM_LOCAL_AU_TABLE4_TO7_LOCAL_AU_TABLE7_SHIFT);
10268}
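/*
 * Illustrative sketch (not part of the driver): the eight entries
 * written above encode { 0, 1, 2*CU, 4*CU, 8*CU, 16*CU, 32*CU, 64*CU }
 * AUs, i.e. entry i (for i >= 2) is CU << (i - 1).  The stand-alone
 * program below just prints that encoding for an assumed CU value;
 * demo_au_table_entry() and the sample CU are made up for this example.
 */
#if 0	/* example only */
#include <stdio.h>
#include <stdint.h>

static uint64_t demo_au_table_entry(unsigned int i, uint64_t cu)
{
	if (i == 0)
		return 0;
	if (i == 1)
		return 1;
	return cu << (i - 1);	/* 2*CU, 4*CU, ... 64*CU */
}

int main(void)
{
	uint64_t cu = 4;	/* assumed CU value, for illustration only */
	unsigned int i;

	for (i = 0; i < 8; i++)
		printf("AU table[%u] = %llu\n", i,
		       (unsigned long long)demo_au_table_entry(i, cu));
	return 0;
}
#endif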
10269
10270static void assign_local_cm_au_table(struct hfi1_devdata *dd, u8 vcu)
10271{
10272 assign_cm_au_table(dd, vcu_to_cu(vcu), SEND_CM_LOCAL_AU_TABLE0_TO3,
10273 SEND_CM_LOCAL_AU_TABLE4_TO7);
10274}
10275
10276void assign_remote_cm_au_table(struct hfi1_devdata *dd, u8 vcu)
10277{
10278 assign_cm_au_table(dd, vcu_to_cu(vcu), SEND_CM_REMOTE_AU_TABLE0_TO3,
10279 SEND_CM_REMOTE_AU_TABLE4_TO7);
10280}
10281
10282static void init_txe(struct hfi1_devdata *dd)
10283{
10284 int i;
10285
10286 /* enable all PIO, SDMA, general, and Egress errors */
10287 write_csr(dd, SEND_PIO_ERR_MASK, ~0ull);
10288 write_csr(dd, SEND_DMA_ERR_MASK, ~0ull);
10289 write_csr(dd, SEND_ERR_MASK, ~0ull);
10290 write_csr(dd, SEND_EGRESS_ERR_MASK, ~0ull);
10291
10292 /* enable all per-context and per-SDMA engine errors */
10293 for (i = 0; i < dd->chip_send_contexts; i++)
10294 write_kctxt_csr(dd, i, SEND_CTXT_ERR_MASK, ~0ull);
10295 for (i = 0; i < dd->chip_sdma_engines; i++)
10296 write_kctxt_csr(dd, i, SEND_DMA_ENG_ERR_MASK, ~0ull);
10297
10298 /* set the local CU to AU mapping */
10299 assign_local_cm_au_table(dd, dd->vcu);
10300
10301 /*
10302 * Set reasonable default for Credit Return Timer
10303 * Don't set on Simulator - causes it to choke.
10304 */
10305 if (dd->icode != ICODE_FUNCTIONAL_SIMULATOR)
10306 write_csr(dd, SEND_CM_TIMER_CTRL, HFI1_CREDIT_RETURN_RATE);
10307}
10308
10309int hfi1_set_ctxt_jkey(struct hfi1_devdata *dd, unsigned ctxt, u16 jkey)
10310{
10311 struct hfi1_ctxtdata *rcd = dd->rcd[ctxt];
10312 unsigned sctxt;
10313 int ret = 0;
10314 u64 reg;
10315
10316 if (!rcd || !rcd->sc) {
10317 ret = -EINVAL;
10318 goto done;
10319 }
10320 sctxt = rcd->sc->hw_context;
10321 reg = SEND_CTXT_CHECK_JOB_KEY_MASK_SMASK | /* mask is always 1's */
10322 ((jkey & SEND_CTXT_CHECK_JOB_KEY_VALUE_MASK) <<
10323 SEND_CTXT_CHECK_JOB_KEY_VALUE_SHIFT);
10324 /* JOB_KEY_ALLOW_PERMISSIVE is not allowed by default */
10325 if (HFI1_CAP_KGET_MASK(rcd->flags, ALLOW_PERM_JKEY))
10326 reg |= SEND_CTXT_CHECK_JOB_KEY_ALLOW_PERMISSIVE_SMASK;
10327 write_kctxt_csr(dd, sctxt, SEND_CTXT_CHECK_JOB_KEY, reg);
10328 /*
10329 * Enable send-side J_KEY integrity check, unless this is A0 h/w
10330 * (due to A0 erratum).
10331 */
10332 if (!is_a0(dd)) {
10333 reg = read_kctxt_csr(dd, sctxt, SEND_CTXT_CHECK_ENABLE);
10334 reg |= SEND_CTXT_CHECK_ENABLE_CHECK_JOB_KEY_SMASK;
10335 write_kctxt_csr(dd, sctxt, SEND_CTXT_CHECK_ENABLE, reg);
10336 }
10337
10338 /* Enable J_KEY check on receive context. */
10339 reg = RCV_KEY_CTRL_JOB_KEY_ENABLE_SMASK |
10340 ((jkey & RCV_KEY_CTRL_JOB_KEY_VALUE_MASK) <<
10341 RCV_KEY_CTRL_JOB_KEY_VALUE_SHIFT);
10342 write_kctxt_csr(dd, ctxt, RCV_KEY_CTRL, reg);
10343done:
10344 return ret;
10345}
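/*
 * Illustrative sketch (not part of the driver): hfi1_set_ctxt_jkey()
 * above, and the J_KEY/P_KEY helpers that follow, all use the same CSR
 * field-packing idiom - mask the value to the field width, shift it
 * into place, and OR in single-bit enables via their pre-shifted SMASK.
 * The stand-alone snippet below shows the same pattern with made-up
 * DEMO_* macros; none of these names exist in the driver.
 */
#if 0	/* example only */
#include <stdio.h>
#include <stdint.h>

#define DEMO_FIELD_MASK   0xffffull	/* width of the value field */
#define DEMO_FIELD_SHIFT  0
#define DEMO_ENABLE_SMASK (1ull << 32)	/* pre-shifted enable bit */

static uint64_t demo_pack_key(uint16_t key, int enable)
{
	uint64_t reg = ((uint64_t)key & DEMO_FIELD_MASK) << DEMO_FIELD_SHIFT;

	if (enable)
		reg |= DEMO_ENABLE_SMASK;
	return reg;
}

int main(void)
{
	printf("reg = 0x%016llx\n",
	       (unsigned long long)demo_pack_key(0x1234, 1));
	return 0;
}
#endif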
10346
10347int hfi1_clear_ctxt_jkey(struct hfi1_devdata *dd, unsigned ctxt)
10348{
10349 struct hfi1_ctxtdata *rcd = dd->rcd[ctxt];
10350 unsigned sctxt;
10351 int ret = 0;
10352 u64 reg;
10353
10354 if (!rcd || !rcd->sc) {
10355 ret = -EINVAL;
10356 goto done;
10357 }
10358 sctxt = rcd->sc->hw_context;
10359 write_kctxt_csr(dd, sctxt, SEND_CTXT_CHECK_JOB_KEY, 0);
10360 /*
10361 * Disable send-side J_KEY integrity check, unless this is A0 h/w.
10362 * This check would not have been enabled for A0 h/w, see
10363 * set_ctxt_jkey().
10364 */
10365 if (!is_a0(dd)) {
10366 reg = read_kctxt_csr(dd, sctxt, SEND_CTXT_CHECK_ENABLE);
10367 reg &= ~SEND_CTXT_CHECK_ENABLE_CHECK_JOB_KEY_SMASK;
10368 write_kctxt_csr(dd, sctxt, SEND_CTXT_CHECK_ENABLE, reg);
10369 }
10370 /* Turn off the J_KEY on the receive side */
10371 write_kctxt_csr(dd, ctxt, RCV_KEY_CTRL, 0);
10372done:
10373 return ret;
10374}
10375
10376int hfi1_set_ctxt_pkey(struct hfi1_devdata *dd, unsigned ctxt, u16 pkey)
10377{
10378 struct hfi1_ctxtdata *rcd;
10379 unsigned sctxt;
10380 int ret = 0;
10381 u64 reg;
10382
10383	if (ctxt < dd->num_rcv_contexts) {
10384		rcd = dd->rcd[ctxt];
10385	} else {
10386		ret = -EINVAL;
10387		goto done;
10388	}
10389 if (!rcd || !rcd->sc) {
10390 ret = -EINVAL;
10391 goto done;
10392 }
10393 sctxt = rcd->sc->hw_context;
10394 reg = ((u64)pkey & SEND_CTXT_CHECK_PARTITION_KEY_VALUE_MASK) <<
10395 SEND_CTXT_CHECK_PARTITION_KEY_VALUE_SHIFT;
10396 write_kctxt_csr(dd, sctxt, SEND_CTXT_CHECK_PARTITION_KEY, reg);
10397 reg = read_kctxt_csr(dd, sctxt, SEND_CTXT_CHECK_ENABLE);
10398 reg |= SEND_CTXT_CHECK_ENABLE_CHECK_PARTITION_KEY_SMASK;
10399 write_kctxt_csr(dd, sctxt, SEND_CTXT_CHECK_ENABLE, reg);
10400done:
10401 return ret;
10402}
10403
10404int hfi1_clear_ctxt_pkey(struct hfi1_devdata *dd, unsigned ctxt)
10405{
10406 struct hfi1_ctxtdata *rcd;
10407 unsigned sctxt;
10408 int ret = 0;
10409 u64 reg;
10410
10411	if (ctxt < dd->num_rcv_contexts) {
10412		rcd = dd->rcd[ctxt];
10413	} else {
10414		ret = -EINVAL;
10415		goto done;
10416	}
10417 if (!rcd || !rcd->sc) {
10418 ret = -EINVAL;
10419 goto done;
10420 }
10421 sctxt = rcd->sc->hw_context;
10422 reg = read_kctxt_csr(dd, sctxt, SEND_CTXT_CHECK_ENABLE);
10423 reg &= ~SEND_CTXT_CHECK_ENABLE_CHECK_PARTITION_KEY_SMASK;
10424 write_kctxt_csr(dd, sctxt, SEND_CTXT_CHECK_ENABLE, reg);
10425 write_kctxt_csr(dd, sctxt, SEND_CTXT_CHECK_PARTITION_KEY, 0);
10426done:
10427 return ret;
10428}
10429
10430/*
10431 * Start doing the clean up of the chip. Our clean up happens in multiple
10432 * stages and this is just the first.
10433 */
10434void hfi1_start_cleanup(struct hfi1_devdata *dd)
10435{
10436 free_cntrs(dd);
10437 free_rcverr(dd);
10438 clean_up_interrupts(dd);
10439}
10440
10441#define HFI_BASE_GUID(dev) \
10442 ((dev)->base_guid & ~(1ULL << GUID_HFI_INDEX_SHIFT))
10443
10444/*
10445 * Certain chip functions need to be initialized only once per asic
10446 * instead of per-device. This function finds the peer device and
10447 * checks whether that chip initialization needs to be done by this
10448 * device.
10449 */
10450static void asic_should_init(struct hfi1_devdata *dd)
10451{
10452 unsigned long flags;
10453 struct hfi1_devdata *tmp, *peer = NULL;
10454
10455 spin_lock_irqsave(&hfi1_devs_lock, flags);
10456 /* Find our peer device */
10457 list_for_each_entry(tmp, &hfi1_dev_list, list) {
10458 if ((HFI_BASE_GUID(dd) == HFI_BASE_GUID(tmp)) &&
10459 dd->unit != tmp->unit) {
10460 peer = tmp;
10461 break;
10462 }
10463 }
10464
10465 /*
10466 * "Claim" the ASIC for initialization if it hasn't been
10467	 * "claimed" yet.
10468 */
10469 if (!peer || !(peer->flags & HFI1_DO_INIT_ASIC))
10470 dd->flags |= HFI1_DO_INIT_ASIC;
10471 spin_unlock_irqrestore(&hfi1_devs_lock, flags);
10472}
10473
10474/**
Easwar Hariharan7c03ed82015-10-26 10:28:28 -040010475 * hfi1_init_dd - Allocate and initialize the device structure for the hfi.
Mike Marciniszyn77241052015-07-30 15:17:43 -040010476 * @pdev: the pci_dev for hfi1_ib device
10477 * @ent: pci_device_id struct for this dev
10478 *
10479 * Also allocates, initializes, and returns the devdata struct for this
10480 * device instance
10481 *
10482 * This is global, and is called directly at init to set up the
10483 * chip-specific function pointers for later use.
10484 */
10485struct hfi1_devdata *hfi1_init_dd(struct pci_dev *pdev,
10486 const struct pci_device_id *ent)
10487{
10488 struct hfi1_devdata *dd;
10489 struct hfi1_pportdata *ppd;
10490 u64 reg;
10491 int i, ret;
10492 static const char * const inames[] = { /* implementation names */
10493 "RTL silicon",
10494 "RTL VCS simulation",
10495 "RTL FPGA emulation",
10496 "Functional simulator"
10497 };
10498
10499 dd = hfi1_alloc_devdata(pdev,
10500 NUM_IB_PORTS * sizeof(struct hfi1_pportdata));
10501 if (IS_ERR(dd))
10502 goto bail;
10503 ppd = dd->pport;
10504 for (i = 0; i < dd->num_pports; i++, ppd++) {
10505 int vl;
10506 /* init common fields */
10507 hfi1_init_pportdata(pdev, ppd, dd, 0, 1);
10508 /* DC supports 4 link widths */
10509 ppd->link_width_supported =
10510 OPA_LINK_WIDTH_1X | OPA_LINK_WIDTH_2X |
10511 OPA_LINK_WIDTH_3X | OPA_LINK_WIDTH_4X;
10512 ppd->link_width_downgrade_supported =
10513 ppd->link_width_supported;
10514 /* start out enabling only 4X */
10515 ppd->link_width_enabled = OPA_LINK_WIDTH_4X;
10516 ppd->link_width_downgrade_enabled =
10517 ppd->link_width_downgrade_supported;
10518 /* link width active is 0 when link is down */
10519 /* link width downgrade active is 0 when link is down */
10520
10521 if (num_vls < HFI1_MIN_VLS_SUPPORTED
10522 || num_vls > HFI1_MAX_VLS_SUPPORTED) {
10523 hfi1_early_err(&pdev->dev,
10524 "Invalid num_vls %u, using %u VLs\n",
10525 num_vls, HFI1_MAX_VLS_SUPPORTED);
10526 num_vls = HFI1_MAX_VLS_SUPPORTED;
10527 }
10528 ppd->vls_supported = num_vls;
10529 ppd->vls_operational = ppd->vls_supported;
10530 /* Set the default MTU. */
10531 for (vl = 0; vl < num_vls; vl++)
10532 dd->vld[vl].mtu = hfi1_max_mtu;
10533 dd->vld[15].mtu = MAX_MAD_PACKET;
10534 /*
10535 * Set the initial values to reasonable default, will be set
10536 * for real when link is up.
10537 */
10538 ppd->lstate = IB_PORT_DOWN;
10539 ppd->overrun_threshold = 0x4;
10540 ppd->phy_error_threshold = 0xf;
10541 ppd->port_crc_mode_enabled = link_crc_mask;
10542 /* initialize supported LTP CRC mode */
10543 ppd->port_ltp_crc_mode = cap_to_port_ltp(link_crc_mask) << 8;
10544 /* initialize enabled LTP CRC mode */
10545 ppd->port_ltp_crc_mode |= cap_to_port_ltp(link_crc_mask) << 4;
10546 /* start in offline */
10547 ppd->host_link_state = HLS_DN_OFFLINE;
10548 init_vl_arb_caches(ppd);
10549 }
10550
10551 dd->link_default = HLS_DN_POLL;
10552
10553 /*
10554 * Do remaining PCIe setup and save PCIe values in dd.
10555 * Any error printing is already done by the init code.
10556 * On return, we have the chip mapped.
10557 */
10558 ret = hfi1_pcie_ddinit(dd, pdev, ent);
10559 if (ret < 0)
10560 goto bail_free;
10561
10562 /* verify that reads actually work, save revision for reset check */
10563 dd->revision = read_csr(dd, CCE_REVISION);
10564 if (dd->revision == ~(u64)0) {
10565 dd_dev_err(dd, "cannot read chip CSRs\n");
10566 ret = -EINVAL;
10567 goto bail_cleanup;
10568 }
10569 dd->majrev = (dd->revision >> CCE_REVISION_CHIP_REV_MAJOR_SHIFT)
10570 & CCE_REVISION_CHIP_REV_MAJOR_MASK;
10571 dd->minrev = (dd->revision >> CCE_REVISION_CHIP_REV_MINOR_SHIFT)
10572 & CCE_REVISION_CHIP_REV_MINOR_MASK;
10573
10574 /* obtain the hardware ID - NOT related to unit, which is a
10575 software enumeration */
10576 reg = read_csr(dd, CCE_REVISION2);
10577 dd->hfi1_id = (reg >> CCE_REVISION2_HFI_ID_SHIFT)
10578 & CCE_REVISION2_HFI_ID_MASK;
10579 /* the variable size will remove unwanted bits */
10580 dd->icode = reg >> CCE_REVISION2_IMPL_CODE_SHIFT;
10581 dd->irev = reg >> CCE_REVISION2_IMPL_REVISION_SHIFT;
10582 dd_dev_info(dd, "Implementation: %s, revision 0x%x\n",
10583 dd->icode < ARRAY_SIZE(inames) ? inames[dd->icode] : "unknown",
10584 (int)dd->irev);
10585
10586 /* speeds the hardware can support */
10587 dd->pport->link_speed_supported = OPA_LINK_SPEED_25G;
10588 /* speeds allowed to run at */
10589 dd->pport->link_speed_enabled = dd->pport->link_speed_supported;
10590 /* give a reasonable active value, will be set on link up */
10591 dd->pport->link_speed_active = OPA_LINK_SPEED_25G;
10592
10593 dd->chip_rcv_contexts = read_csr(dd, RCV_CONTEXTS);
10594 dd->chip_send_contexts = read_csr(dd, SEND_CONTEXTS);
10595 dd->chip_sdma_engines = read_csr(dd, SEND_DMA_ENGINES);
10596 dd->chip_pio_mem_size = read_csr(dd, SEND_PIO_MEM_SIZE);
10597 dd->chip_sdma_mem_size = read_csr(dd, SEND_DMA_MEM_SIZE);
10598 /* fix up link widths for emulation _p */
10599 ppd = dd->pport;
10600 if (dd->icode == ICODE_FPGA_EMULATION && is_emulator_p(dd)) {
10601 ppd->link_width_supported =
10602 ppd->link_width_enabled =
10603 ppd->link_width_downgrade_supported =
10604 ppd->link_width_downgrade_enabled =
10605 OPA_LINK_WIDTH_1X;
10606 }
10607	/* ensure num_vls isn't larger than number of sdma engines */
10608 if (HFI1_CAP_IS_KSET(SDMA) && num_vls > dd->chip_sdma_engines) {
10609 dd_dev_err(dd, "num_vls %u too large, using %u VLs\n",
10610 num_vls, HFI1_MAX_VLS_SUPPORTED);
10611 ppd->vls_supported = num_vls = HFI1_MAX_VLS_SUPPORTED;
10612 ppd->vls_operational = ppd->vls_supported;
10613 }
10614
10615 /*
10616 * Convert the ns parameter to the 64 * cclocks used in the CSR.
10617 * Limit the max if larger than the field holds. If timeout is
10618 * non-zero, then the calculated field will be at least 1.
10619 *
10620 * Must be after icode is set up - the cclock rate depends
10621 * on knowing the hardware being used.
10622 */
10623 dd->rcv_intr_timeout_csr = ns_to_cclock(dd, rcv_intr_timeout) / 64;
10624 if (dd->rcv_intr_timeout_csr >
10625 RCV_AVAIL_TIME_OUT_TIME_OUT_RELOAD_MASK)
10626 dd->rcv_intr_timeout_csr =
10627 RCV_AVAIL_TIME_OUT_TIME_OUT_RELOAD_MASK;
10628 else if (dd->rcv_intr_timeout_csr == 0 && rcv_intr_timeout)
10629 dd->rcv_intr_timeout_csr = 1;
10630
Easwar Hariharan7c03ed82015-10-26 10:28:28 -040010631 /* needs to be done before we look for the peer device */
10632 read_guid(dd);
10633
10634 /* should this device init the ASIC block? */
10635 asic_should_init(dd);
10636
Mike Marciniszyn77241052015-07-30 15:17:43 -040010637 /* obtain chip sizes, reset chip CSRs */
10638 init_chip(dd);
10639
10640 /* read in the PCIe link speed information */
10641 ret = pcie_speeds(dd);
10642 if (ret)
10643 goto bail_cleanup;
10644
Mike Marciniszyn77241052015-07-30 15:17:43 -040010645 /* read in firmware */
10646 ret = hfi1_firmware_init(dd);
10647 if (ret)
10648 goto bail_cleanup;
10649
10650 /*
10651 * In general, the PCIe Gen3 transition must occur after the
10652 * chip has been idled (so it won't initiate any PCIe transactions
10653 * e.g. an interrupt) and before the driver changes any registers
10654 * (the transition will reset the registers).
10655 *
10656 * In particular, place this call after:
10657 * - init_chip() - the chip will not initiate any PCIe transactions
10658 * - pcie_speeds() - reads the current link speed
10659 * - hfi1_firmware_init() - the needed firmware is ready to be
10660 * downloaded
10661 */
10662 ret = do_pcie_gen3_transition(dd);
10663 if (ret)
10664 goto bail_cleanup;
10665
10666 /* start setting dd values and adjusting CSRs */
10667 init_early_variables(dd);
10668
10669 parse_platform_config(dd);
10670
10671 /* add board names as they are defined */
10672	dd->boardname = kmalloc(64, GFP_KERNEL);
10673	if (!dd->boardname) {
		ret = -ENOMEM;
10674		goto bail_cleanup;
	}
10675 snprintf(dd->boardname, 64, "Board ID 0x%llx",
10676 dd->revision >> CCE_REVISION_BOARD_ID_LOWER_NIBBLE_SHIFT
10677 & CCE_REVISION_BOARD_ID_LOWER_NIBBLE_MASK);
10678
10679 snprintf(dd->boardversion, BOARD_VERS_MAX,
10680 "ChipABI %u.%u, %s, ChipRev %u.%u, SW Compat %llu\n",
10681 HFI1_CHIP_VERS_MAJ, HFI1_CHIP_VERS_MIN,
10682 dd->boardname,
10683 (u32)dd->majrev,
10684 (u32)dd->minrev,
10685 (dd->revision >> CCE_REVISION_SW_SHIFT)
10686 & CCE_REVISION_SW_MASK);
10687
10688 ret = set_up_context_variables(dd);
10689 if (ret)
10690 goto bail_cleanup;
10691
10692 /* set initial RXE CSRs */
10693 init_rxe(dd);
10694 /* set initial TXE CSRs */
10695 init_txe(dd);
10696 /* set initial non-RXE, non-TXE CSRs */
10697 init_other(dd);
10698 /* set up KDETH QP prefix in both RX and TX CSRs */
10699 init_kdeth_qp(dd);
10700
10701 /* send contexts must be set up before receive contexts */
10702 ret = init_send_contexts(dd);
10703 if (ret)
10704 goto bail_cleanup;
10705
10706 ret = hfi1_create_ctxts(dd);
10707 if (ret)
10708 goto bail_cleanup;
10709
10710 dd->rcvhdrsize = DEFAULT_RCVHDRSIZE;
10711 /*
10712 * rcd[0] is guaranteed to be valid by this point. Also, all
10713	 * contexts are using the same value, as per the module parameter.
10714 */
10715 dd->rhf_offset = dd->rcd[0]->rcvhdrqentsize - sizeof(u64) / sizeof(u32);
10716
10717 ret = init_pervl_scs(dd);
10718 if (ret)
10719 goto bail_cleanup;
10720
10721 /* sdma init */
10722 for (i = 0; i < dd->num_pports; ++i) {
10723 ret = sdma_init(dd, i);
10724 if (ret)
10725 goto bail_cleanup;
10726 }
10727
10728 /* use contexts created by hfi1_create_ctxts */
10729 ret = set_up_interrupts(dd);
10730 if (ret)
10731 goto bail_cleanup;
10732
10733 /* set up LCB access - must be after set_up_interrupts() */
10734 init_lcb_access(dd);
10735
10736 snprintf(dd->serial, SERIAL_MAX, "0x%08llx\n",
10737 dd->base_guid & 0xFFFFFF);
10738
10739 dd->oui1 = dd->base_guid >> 56 & 0xFF;
10740 dd->oui2 = dd->base_guid >> 48 & 0xFF;
10741 dd->oui3 = dd->base_guid >> 40 & 0xFF;
10742
10743 ret = load_firmware(dd); /* asymmetric with dispose_firmware() */
10744 if (ret)
10745 goto bail_clear_intr;
10746 check_fabric_firmware_versions(dd);
10747
10748 thermal_init(dd);
10749
10750 ret = init_cntrs(dd);
10751 if (ret)
10752 goto bail_clear_intr;
10753
10754 ret = init_rcverr(dd);
10755 if (ret)
10756 goto bail_free_cntrs;
10757
10758 ret = eprom_init(dd);
10759 if (ret)
10760 goto bail_free_rcverr;
10761
10762 goto bail;
10763
10764bail_free_rcverr:
10765 free_rcverr(dd);
10766bail_free_cntrs:
10767 free_cntrs(dd);
10768bail_clear_intr:
10769 clean_up_interrupts(dd);
10770bail_cleanup:
10771 hfi1_pcie_ddcleanup(dd);
10772bail_free:
10773 hfi1_free_devdata(dd);
10774 dd = ERR_PTR(ret);
10775bail:
10776 return dd;
10777}
10778
10779static u16 delay_cycles(struct hfi1_pportdata *ppd, u32 desired_egress_rate,
10780 u32 dw_len)
10781{
10782 u32 delta_cycles;
10783 u32 current_egress_rate = ppd->current_egress_rate;
10784 /* rates here are in units of 10^6 bits/sec */
10785
10786 if (desired_egress_rate == -1)
10787 return 0; /* shouldn't happen */
10788
10789 if (desired_egress_rate >= current_egress_rate)
10790 return 0; /* we can't help go faster, only slower */
10791
10792 delta_cycles = egress_cycles(dw_len * 4, desired_egress_rate) -
10793 egress_cycles(dw_len * 4, current_egress_rate);
10794
10795 return (u16)delta_cycles;
10796}
10797
10799/**
10800 * create_pbc - build a pbc for transmission
10801 * @flags: special case flags or-ed in built pbc
 * @ppd: the per-port data
10802 * @flags: special case flags or-ed in built pbc
10803 * @srate_mbs: static rate (in units of 10^6 bits/sec)
10804 * @vl: vl
10805 * @dw_len: dword length (header words + data words + pbc words)
10806 * Create a PBC with the given flags, rate, VL, and length.
10807 *
10808 * NOTE: The PBC created will not insert any HCRC - all callers but one are
10809 * for verbs, which does not use this PSM feature. The lone other caller
10810 * is for the diagnostic interface which calls this if the user does not
10811 * supply their own PBC.
10812 */
10813u64 create_pbc(struct hfi1_pportdata *ppd, u64 flags, int srate_mbs, u32 vl,
10814 u32 dw_len)
10815{
10816 u64 pbc, delay = 0;
10817
10818 if (unlikely(srate_mbs))
10819 delay = delay_cycles(ppd, srate_mbs, dw_len);
10820
10821 pbc = flags
10822 | (delay << PBC_STATIC_RATE_CONTROL_COUNT_SHIFT)
10823 | ((u64)PBC_IHCRC_NONE << PBC_INSERT_HCRC_SHIFT)
10824 | (vl & PBC_VL_MASK) << PBC_VL_SHIFT
10825 | (dw_len & PBC_LENGTH_DWS_MASK)
10826 << PBC_LENGTH_DWS_SHIFT;
10827
10828 return pbc;
10829}
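/*
 * Illustrative usage sketch (not part of the driver): how a caller
 * might build a PBC for a send of hdrwords + nwords dwords.  The "+ 2"
 * for the PBC dwords, the helper name demo_build_verbs_pbc(), and its
 * parameters are assumptions made only for this example.
 */
#if 0	/* example only */
static u64 demo_build_verbs_pbc(struct hfi1_pportdata *ppd, u32 vl,
				u32 hdrwords, u32 nwords)
{
	/* total length in dwords, including the two PBC dwords */
	u32 plen = hdrwords + nwords + 2;

	/* no special flags, no static rate limiting */
	return create_pbc(ppd, 0, 0, vl, plen);
}
#endif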
10830
10831#define SBUS_THERMAL 0x4f
10832#define SBUS_THERM_MONITOR_MODE 0x1
10833
10834#define THERM_FAILURE(dev, ret, reason) \
10835	dd_dev_err((dev),						\
10836 "Thermal sensor initialization failed: %s (%d)\n", \
10837 (reason), (ret))
10838
10839/*
10840 * Initialize the Avago Thermal sensor.
10841 *
10842 * After initialization, enable polling of thermal sensor through
10843 * SBus interface. For this to work, the SBus Master firmware has
10844 * to be loaded, because the HW polling logic uses SBus interrupts,
10845 * which the default firmware does not support. Otherwise, no data
10846 * will be returned through the ASIC_STS_THERM CSR.
10848 */
10849static int thermal_init(struct hfi1_devdata *dd)
10850{
10851 int ret = 0;
10852
10853 if (dd->icode != ICODE_RTL_SILICON ||
10854 !(dd->flags & HFI1_DO_INIT_ASIC))
10855 return ret;
10856
10857 acquire_hw_mutex(dd);
10858 dd_dev_info(dd, "Initializing thermal sensor\n");
Jareer Abdel-Qader4ef98982015-11-06 20:07:00 -050010859 /* Disable polling of thermal readings */
10860 write_csr(dd, ASIC_CFG_THERM_POLL_EN, 0x0);
10861 msleep(100);
Mike Marciniszyn77241052015-07-30 15:17:43 -040010862 /* Thermal Sensor Initialization */
10863 /* Step 1: Reset the Thermal SBus Receiver */
10864 ret = sbus_request_slow(dd, SBUS_THERMAL, 0x0,
10865 RESET_SBUS_RECEIVER, 0);
10866 if (ret) {
10867 THERM_FAILURE(dd, ret, "Bus Reset");
10868 goto done;
10869 }
10870 /* Step 2: Set Reset bit in Thermal block */
10871 ret = sbus_request_slow(dd, SBUS_THERMAL, 0x0,
10872 WRITE_SBUS_RECEIVER, 0x1);
10873 if (ret) {
10874 THERM_FAILURE(dd, ret, "Therm Block Reset");
10875 goto done;
10876 }
10877 /* Step 3: Write clock divider value (100MHz -> 2MHz) */
10878 ret = sbus_request_slow(dd, SBUS_THERMAL, 0x1,
10879 WRITE_SBUS_RECEIVER, 0x32);
10880 if (ret) {
10881 THERM_FAILURE(dd, ret, "Write Clock Div");
10882 goto done;
10883 }
10884 /* Step 4: Select temperature mode */
10885 ret = sbus_request_slow(dd, SBUS_THERMAL, 0x3,
10886 WRITE_SBUS_RECEIVER,
10887 SBUS_THERM_MONITOR_MODE);
10888 if (ret) {
10889 THERM_FAILURE(dd, ret, "Write Mode Sel");
10890 goto done;
10891 }
10892 /* Step 5: De-assert block reset and start conversion */
10893 ret = sbus_request_slow(dd, SBUS_THERMAL, 0x0,
10894 WRITE_SBUS_RECEIVER, 0x2);
10895 if (ret) {
10896 THERM_FAILURE(dd, ret, "Write Reset Deassert");
10897 goto done;
10898 }
10899 /* Step 5.1: Wait for first conversion (21.5ms per spec) */
10900 msleep(22);
10901
10902 /* Enable polling of thermal readings */
10903 write_csr(dd, ASIC_CFG_THERM_POLL_EN, 0x1);
10904done:
10905 release_hw_mutex(dd);
10906 return ret;
10907}
10908
10909static void handle_temp_err(struct hfi1_devdata *dd)
10910{
10911 struct hfi1_pportdata *ppd = &dd->pport[0];
10912 /*
10913 * Thermal Critical Interrupt
10914 * Put the device into forced freeze mode, take link down to
10915 * offline, and put DC into reset.
10916 */
10917 dd_dev_emerg(dd,
10918 "Critical temperature reached! Forcing device into freeze mode!\n");
10919 dd->flags |= HFI1_FORCED_FREEZE;
10920	start_freeze_handling(ppd, FREEZE_SELF | FREEZE_ABORT);
10921 /*
10922 * Shut DC down as much and as quickly as possible.
10923 *
10924 * Step 1: Take the link down to OFFLINE. This will cause the
10925 * 8051 to put the Serdes in reset. However, we don't want to
10926 * go through the entire link state machine since we want to
10927 * shutdown ASAP. Furthermore, this is not a graceful shutdown
10928 * but rather an attempt to save the chip.
10929 * Code below is almost the same as quiet_serdes() but avoids
10930 * all the extra work and the sleeps.
10931 */
10932 ppd->driver_link_ready = 0;
10933 ppd->link_enabled = 0;
10934 set_physical_link_state(dd, PLS_OFFLINE |
10935 (OPA_LINKDOWN_REASON_SMA_DISABLED << 8));
10936 /*
10937 * Step 2: Shutdown LCB and 8051
10938 * After shutdown, do not restore DC_CFG_RESET value.
10939 */
10940 dc_shutdown(dd);
10941}