blob: 47e54e8d2e254538e779fecdedd2c7dcef53f80f [file] [log] [blame]
Jeff Kirsher8af3c332012-02-18 07:08:14 +00001/*******************************************************************************
2
3 Intel 10 Gigabit PCI Express Linux driver
4 Copyright(c) 1999 - 2012 Intel Corporation.
5
6 This program is free software; you can redistribute it and/or modify it
7 under the terms and conditions of the GNU General Public License,
8 version 2, as published by the Free Software Foundation.
9
10 This program is distributed in the hope it will be useful, but WITHOUT
11 ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
12 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
13 more details.
14
15 You should have received a copy of the GNU General Public License along with
16 this program; if not, write to the Free Software Foundation, Inc.,
17 51 Franklin St - Fifth Floor, Boston, MA 02110-1301 USA.
18
19 The full GNU General Public License is included in this distribution in
20 the file called "COPYING".
21
22 Contact Information:
23 e1000-devel Mailing List <e1000-devel@lists.sourceforge.net>
24 Intel Corporation, 5200 N.E. Elam Young Parkway, Hillsboro, OR 97124-6497
25
26*******************************************************************************/
27
28#include "ixgbe.h"
29#include "ixgbe_sriov.h"
30
31/**
32 * ixgbe_cache_ring_rss - Descriptor ring to register mapping for RSS
33 * @adapter: board private structure to initialize
34 *
35 * Cache the descriptor ring offsets for RSS to the assigned rings.
36 *
37 **/
38static inline bool ixgbe_cache_ring_rss(struct ixgbe_adapter *adapter)
39{
40 int i;
41
42 if (!(adapter->flags & IXGBE_FLAG_RSS_ENABLED))
43 return false;
44
45 for (i = 0; i < adapter->num_rx_queues; i++)
46 adapter->rx_ring[i]->reg_idx = i;
47 for (i = 0; i < adapter->num_tx_queues; i++)
48 adapter->tx_ring[i]->reg_idx = i;
49
50 return true;
51}
52#ifdef CONFIG_IXGBE_DCB
53
54/* ixgbe_get_first_reg_idx - Return first register index associated with ring */
55static void ixgbe_get_first_reg_idx(struct ixgbe_adapter *adapter, u8 tc,
56 unsigned int *tx, unsigned int *rx)
57{
58 struct net_device *dev = adapter->netdev;
59 struct ixgbe_hw *hw = &adapter->hw;
60 u8 num_tcs = netdev_get_num_tc(dev);
61
62 *tx = 0;
63 *rx = 0;
64
65 switch (hw->mac.type) {
66 case ixgbe_mac_82598EB:
67 *tx = tc << 2;
68 *rx = tc << 3;
69 break;
70 case ixgbe_mac_82599EB:
71 case ixgbe_mac_X540:
72 if (num_tcs > 4) {
73 if (tc < 3) {
74 *tx = tc << 5;
75 *rx = tc << 4;
76 } else if (tc < 5) {
77 *tx = ((tc + 2) << 4);
78 *rx = tc << 4;
79 } else if (tc < num_tcs) {
80 *tx = ((tc + 8) << 3);
81 *rx = tc << 4;
82 }
83 } else {
84 *rx = tc << 5;
85 switch (tc) {
86 case 0:
87 *tx = 0;
88 break;
89 case 1:
90 *tx = 64;
91 break;
92 case 2:
93 *tx = 96;
94 break;
95 case 3:
96 *tx = 112;
97 break;
98 default:
99 break;
100 }
101 }
102 break;
103 default:
104 break;
105 }
106}
107
108/**
109 * ixgbe_cache_ring_dcb - Descriptor ring to register mapping for DCB
110 * @adapter: board private structure to initialize
111 *
112 * Cache the descriptor ring offsets for DCB to the assigned rings.
113 *
114 **/
115static inline bool ixgbe_cache_ring_dcb(struct ixgbe_adapter *adapter)
116{
117 struct net_device *dev = adapter->netdev;
118 int i, j, k;
119 u8 num_tcs = netdev_get_num_tc(dev);
120
121 if (!num_tcs)
122 return false;
123
124 for (i = 0, k = 0; i < num_tcs; i++) {
125 unsigned int tx_s, rx_s;
126 u16 count = dev->tc_to_txq[i].count;
127
128 ixgbe_get_first_reg_idx(adapter, i, &tx_s, &rx_s);
129 for (j = 0; j < count; j++, k++) {
130 adapter->tx_ring[k]->reg_idx = tx_s + j;
131 adapter->rx_ring[k]->reg_idx = rx_s + j;
132 adapter->tx_ring[k]->dcb_tc = i;
133 adapter->rx_ring[k]->dcb_tc = i;
134 }
135 }
136
137 return true;
138}
139#endif
140
141/**
142 * ixgbe_cache_ring_fdir - Descriptor ring to register mapping for Flow Director
143 * @adapter: board private structure to initialize
144 *
145 * Cache the descriptor ring offsets for Flow Director to the assigned rings.
146 *
147 **/
148static inline bool ixgbe_cache_ring_fdir(struct ixgbe_adapter *adapter)
149{
150 int i;
151 bool ret = false;
152
153 if ((adapter->flags & IXGBE_FLAG_RSS_ENABLED) &&
154 (adapter->flags & IXGBE_FLAG_FDIR_HASH_CAPABLE)) {
155 for (i = 0; i < adapter->num_rx_queues; i++)
156 adapter->rx_ring[i]->reg_idx = i;
157 for (i = 0; i < adapter->num_tx_queues; i++)
158 adapter->tx_ring[i]->reg_idx = i;
159 ret = true;
160 }
161
162 return ret;
163}
164
165#ifdef IXGBE_FCOE
166/**
167 * ixgbe_cache_ring_fcoe - Descriptor ring to register mapping for the FCoE
168 * @adapter: board private structure to initialize
169 *
170 * Cache the descriptor ring offsets for FCoE mode to the assigned rings.
171 *
172 */
173static inline bool ixgbe_cache_ring_fcoe(struct ixgbe_adapter *adapter)
174{
175 struct ixgbe_ring_feature *f = &adapter->ring_feature[RING_F_FCOE];
176 int i;
177 u8 fcoe_rx_i = 0, fcoe_tx_i = 0;
178
179 if (!(adapter->flags & IXGBE_FLAG_FCOE_ENABLED))
180 return false;
181
182 if (adapter->flags & IXGBE_FLAG_RSS_ENABLED) {
183 if (adapter->flags & IXGBE_FLAG_FDIR_HASH_CAPABLE)
184 ixgbe_cache_ring_fdir(adapter);
185 else
186 ixgbe_cache_ring_rss(adapter);
187
Alexander Duycke4b317e2012-05-05 05:30:53 +0000188 fcoe_rx_i = f->offset;
189 fcoe_tx_i = f->offset;
Jeff Kirsher8af3c332012-02-18 07:08:14 +0000190 }
191 for (i = 0; i < f->indices; i++, fcoe_rx_i++, fcoe_tx_i++) {
Alexander Duycke4b317e2012-05-05 05:30:53 +0000192 adapter->rx_ring[f->offset + i]->reg_idx = fcoe_rx_i;
193 adapter->tx_ring[f->offset + i]->reg_idx = fcoe_tx_i;
Jeff Kirsher8af3c332012-02-18 07:08:14 +0000194 }
195 return true;
196}
197
198#endif /* IXGBE_FCOE */
199/**
200 * ixgbe_cache_ring_sriov - Descriptor ring to register mapping for sriov
201 * @adapter: board private structure to initialize
202 *
203 * SR-IOV doesn't use any descriptor rings but changes the default if
204 * no other mapping is used.
205 *
206 */
207static inline bool ixgbe_cache_ring_sriov(struct ixgbe_adapter *adapter)
208{
209 adapter->rx_ring[0]->reg_idx = adapter->num_vfs * 2;
210 adapter->tx_ring[0]->reg_idx = adapter->num_vfs * 2;
211 if (adapter->num_vfs)
212 return true;
213 else
214 return false;
215}
216
217/**
218 * ixgbe_cache_ring_register - Descriptor ring to register mapping
219 * @adapter: board private structure to initialize
220 *
221 * Once we know the feature-set enabled for the device, we'll cache
222 * the register offset the descriptor ring is assigned to.
223 *
224 * Note, the order the various feature calls is important. It must start with
225 * the "most" features enabled at the same time, then trickle down to the
226 * least amount of features turned on at once.
227 **/
228static void ixgbe_cache_ring_register(struct ixgbe_adapter *adapter)
229{
230 /* start with default case */
231 adapter->rx_ring[0]->reg_idx = 0;
232 adapter->tx_ring[0]->reg_idx = 0;
233
234 if (ixgbe_cache_ring_sriov(adapter))
235 return;
236
237#ifdef CONFIG_IXGBE_DCB
238 if (ixgbe_cache_ring_dcb(adapter))
239 return;
240#endif
241
242#ifdef IXGBE_FCOE
243 if (ixgbe_cache_ring_fcoe(adapter))
244 return;
245#endif /* IXGBE_FCOE */
246
247 if (ixgbe_cache_ring_fdir(adapter))
248 return;
249
250 if (ixgbe_cache_ring_rss(adapter))
251 return;
252}
253
254/**
Ben Hutchings49ce9c22012-07-10 10:56:00 +0000255 * ixgbe_set_sriov_queues - Allocate queues for IOV use
Jeff Kirsher8af3c332012-02-18 07:08:14 +0000256 * @adapter: board private structure to initialize
257 *
258 * IOV doesn't actually use anything, so just NAK the
259 * request for now and let the other queue routines
260 * figure out what to do.
261 */
262static inline bool ixgbe_set_sriov_queues(struct ixgbe_adapter *adapter)
263{
264 return false;
265}
266
267/**
Ben Hutchings49ce9c22012-07-10 10:56:00 +0000268 * ixgbe_set_rss_queues - Allocate queues for RSS
Jeff Kirsher8af3c332012-02-18 07:08:14 +0000269 * @adapter: board private structure to initialize
270 *
271 * This is our "base" multiqueue mode. RSS (Receive Side Scaling) will try
272 * to allocate one Rx queue per CPU, and if available, one Tx queue per CPU.
273 *
274 **/
275static inline bool ixgbe_set_rss_queues(struct ixgbe_adapter *adapter)
276{
277 bool ret = false;
278 struct ixgbe_ring_feature *f = &adapter->ring_feature[RING_F_RSS];
279
280 if (adapter->flags & IXGBE_FLAG_RSS_ENABLED) {
281 f->mask = 0xF;
282 adapter->num_rx_queues = f->indices;
283 adapter->num_tx_queues = f->indices;
284 ret = true;
285 }
286
287 return ret;
288}
289
290/**
Ben Hutchings49ce9c22012-07-10 10:56:00 +0000291 * ixgbe_set_fdir_queues - Allocate queues for Flow Director
Jeff Kirsher8af3c332012-02-18 07:08:14 +0000292 * @adapter: board private structure to initialize
293 *
294 * Flow Director is an advanced Rx filter, attempting to get Rx flows back
295 * to the original CPU that initiated the Tx session. This runs in addition
296 * to RSS, so if a packet doesn't match an FDIR filter, we can still spread the
297 * Rx load across CPUs using RSS.
298 *
299 **/
300static inline bool ixgbe_set_fdir_queues(struct ixgbe_adapter *adapter)
301{
302 bool ret = false;
303 struct ixgbe_ring_feature *f_fdir = &adapter->ring_feature[RING_F_FDIR];
304
Alexander Duyckc0876632012-05-10 00:01:46 +0000305 f_fdir->indices = min_t(int, num_online_cpus(), f_fdir->limit);
Jeff Kirsher8af3c332012-02-18 07:08:14 +0000306 f_fdir->mask = 0;
307
308 /*
309 * Use RSS in addition to Flow Director to ensure the best
310 * distribution of flows across cores, even when an FDIR flow
311 * isn't matched.
312 */
313 if ((adapter->flags & IXGBE_FLAG_RSS_ENABLED) &&
314 (adapter->flags & IXGBE_FLAG_FDIR_HASH_CAPABLE)) {
315 adapter->num_tx_queues = f_fdir->indices;
316 adapter->num_rx_queues = f_fdir->indices;
317 ret = true;
318 } else {
319 adapter->flags &= ~IXGBE_FLAG_FDIR_HASH_CAPABLE;
320 }
321 return ret;
322}
323
324#ifdef IXGBE_FCOE
325/**
Ben Hutchings49ce9c22012-07-10 10:56:00 +0000326 * ixgbe_set_fcoe_queues - Allocate queues for Fiber Channel over Ethernet (FCoE)
Jeff Kirsher8af3c332012-02-18 07:08:14 +0000327 * @adapter: board private structure to initialize
328 *
329 * FCoE RX FCRETA can use up to 8 rx queues for up to 8 different exchanges.
Alexander Duycke4b317e2012-05-05 05:30:53 +0000330 * Offset is used as the index of the first rx queue used by FCoE.
Jeff Kirsher8af3c332012-02-18 07:08:14 +0000331 **/
332static inline bool ixgbe_set_fcoe_queues(struct ixgbe_adapter *adapter)
333{
334 struct ixgbe_ring_feature *f = &adapter->ring_feature[RING_F_FCOE];
335
336 if (!(adapter->flags & IXGBE_FLAG_FCOE_ENABLED))
337 return false;
338
Alexander Duyckc0876632012-05-10 00:01:46 +0000339 f->indices = min_t(int, num_online_cpus(), f->limit);
Jeff Kirsher8af3c332012-02-18 07:08:14 +0000340
341 adapter->num_rx_queues = 1;
342 adapter->num_tx_queues = 1;
343
344 if (adapter->flags & IXGBE_FLAG_RSS_ENABLED) {
345 e_info(probe, "FCoE enabled with RSS\n");
346 if (adapter->flags & IXGBE_FLAG_FDIR_HASH_CAPABLE)
347 ixgbe_set_fdir_queues(adapter);
348 else
349 ixgbe_set_rss_queues(adapter);
350 }
351
352 /* adding FCoE rx rings to the end */
Alexander Duycke4b317e2012-05-05 05:30:53 +0000353 f->offset = adapter->num_rx_queues;
Jeff Kirsher8af3c332012-02-18 07:08:14 +0000354 adapter->num_rx_queues += f->indices;
355 adapter->num_tx_queues += f->indices;
356
357 return true;
358}
359#endif /* IXGBE_FCOE */
360
361/* Artificial max queue cap per traffic class in DCB mode */
362#define DCB_QUEUE_CAP 8
363
364#ifdef CONFIG_IXGBE_DCB
365static inline bool ixgbe_set_dcb_queues(struct ixgbe_adapter *adapter)
366{
367 int per_tc_q, q, i, offset = 0;
368 struct net_device *dev = adapter->netdev;
369 int tcs = netdev_get_num_tc(dev);
370
371 if (!tcs)
372 return false;
373
374 /* Map queue offset and counts onto allocated tx queues */
375 per_tc_q = min_t(unsigned int, dev->num_tx_queues / tcs, DCB_QUEUE_CAP);
376 q = min_t(int, num_online_cpus(), per_tc_q);
377
378 for (i = 0; i < tcs; i++) {
379 netdev_set_tc_queue(dev, i, q, offset);
380 offset += q;
381 }
382
383 adapter->num_tx_queues = q * tcs;
384 adapter->num_rx_queues = q * tcs;
385
386#ifdef IXGBE_FCOE
387 /* FCoE enabled queues require special configuration indexed
Alexander Duycke4b317e2012-05-05 05:30:53 +0000388 * by feature specific indices and offset. Here we map FCoE
Jeff Kirsher8af3c332012-02-18 07:08:14 +0000389 * indices onto the DCB queue pairs allowing FCoE to own
390 * configuration later.
391 */
392 if (adapter->flags & IXGBE_FLAG_FCOE_ENABLED) {
393 u8 prio_tc[MAX_USER_PRIORITY] = {0};
394 int tc;
395 struct ixgbe_ring_feature *f =
396 &adapter->ring_feature[RING_F_FCOE];
397
398 ixgbe_dcb_unpack_map(&adapter->dcb_cfg, DCB_TX_CONFIG, prio_tc);
399 tc = prio_tc[adapter->fcoe.up];
400 f->indices = dev->tc_to_txq[tc].count;
Alexander Duycke4b317e2012-05-05 05:30:53 +0000401 f->offset = dev->tc_to_txq[tc].offset;
Jeff Kirsher8af3c332012-02-18 07:08:14 +0000402 }
403#endif
404
405 return true;
406}
407#endif
408
409/**
Ben Hutchings49ce9c22012-07-10 10:56:00 +0000410 * ixgbe_set_num_queues - Allocate queues for device, feature dependent
Jeff Kirsher8af3c332012-02-18 07:08:14 +0000411 * @adapter: board private structure to initialize
412 *
413 * This is the top level queue allocation routine. The order here is very
414 * important, starting with the "most" number of features turned on at once,
415 * and ending with the smallest set of features. This way large combinations
416 * can be allocated if they're turned on, and smaller combinations are the
417 * fallthrough conditions.
418 *
419 **/
420static int ixgbe_set_num_queues(struct ixgbe_adapter *adapter)
421{
422 /* Start with base case */
423 adapter->num_rx_queues = 1;
424 adapter->num_tx_queues = 1;
425 adapter->num_rx_pools = adapter->num_rx_queues;
426 adapter->num_rx_queues_per_pool = 1;
427
428 if (ixgbe_set_sriov_queues(adapter))
429 goto done;
430
431#ifdef CONFIG_IXGBE_DCB
432 if (ixgbe_set_dcb_queues(adapter))
433 goto done;
434
435#endif
436#ifdef IXGBE_FCOE
437 if (ixgbe_set_fcoe_queues(adapter))
438 goto done;
439
440#endif /* IXGBE_FCOE */
441 if (ixgbe_set_fdir_queues(adapter))
442 goto done;
443
444 if (ixgbe_set_rss_queues(adapter))
445 goto done;
446
447 /* fallback to base case */
448 adapter->num_rx_queues = 1;
449 adapter->num_tx_queues = 1;
450
451done:
452 if ((adapter->netdev->reg_state == NETREG_UNREGISTERED) ||
453 (adapter->netdev->reg_state == NETREG_UNREGISTERING))
454 return 0;
455
456 /* Notify the stack of the (possibly) reduced queue counts. */
457 netif_set_real_num_tx_queues(adapter->netdev, adapter->num_tx_queues);
458 return netif_set_real_num_rx_queues(adapter->netdev,
459 adapter->num_rx_queues);
460}
461
462static void ixgbe_acquire_msix_vectors(struct ixgbe_adapter *adapter,
463 int vectors)
464{
465 int err, vector_threshold;
466
467 /* We'll want at least 2 (vector_threshold):
468 * 1) TxQ[0] + RxQ[0] handler
469 * 2) Other (Link Status Change, etc.)
470 */
471 vector_threshold = MIN_MSIX_COUNT;
472
473 /*
474 * The more we get, the more we will assign to Tx/Rx Cleanup
475 * for the separate queues...where Rx Cleanup >= Tx Cleanup.
476 * Right now, we simply care about how many we'll get; we'll
477 * set them up later while requesting irq's.
478 */
479 while (vectors >= vector_threshold) {
480 err = pci_enable_msix(adapter->pdev, adapter->msix_entries,
481 vectors);
482 if (!err) /* Success in acquiring all requested vectors. */
483 break;
484 else if (err < 0)
485 vectors = 0; /* Nasty failure, quit now */
486 else /* err == number of vectors we should try again with */
487 vectors = err;
488 }
489
490 if (vectors < vector_threshold) {
491 /* Can't allocate enough MSI-X interrupts? Oh well.
492 * This just means we'll go with either a single MSI
493 * vector or fall back to legacy interrupts.
494 */
495 netif_printk(adapter, hw, KERN_DEBUG, adapter->netdev,
496 "Unable to allocate MSI-X interrupts\n");
497 adapter->flags &= ~IXGBE_FLAG_MSIX_ENABLED;
498 kfree(adapter->msix_entries);
499 adapter->msix_entries = NULL;
500 } else {
501 adapter->flags |= IXGBE_FLAG_MSIX_ENABLED; /* Woot! */
502 /*
503 * Adjust for only the vectors we'll use, which is minimum
504 * of max_msix_q_vectors + NON_Q_VECTORS, or the number of
505 * vectors we were allocated.
506 */
Alexander Duyck49c7ffb2012-05-05 05:30:43 +0000507 vectors -= NON_Q_VECTORS;
508 adapter->num_q_vectors = min(vectors, adapter->max_q_vectors);
Jeff Kirsher8af3c332012-02-18 07:08:14 +0000509 }
510}
511
512static void ixgbe_add_ring(struct ixgbe_ring *ring,
513 struct ixgbe_ring_container *head)
514{
515 ring->next = head->ring;
516 head->ring = ring;
517 head->count++;
518}
519
520/**
521 * ixgbe_alloc_q_vector - Allocate memory for a single interrupt vector
522 * @adapter: board private structure to initialize
Alexander Duyckd0bfcdf2012-03-28 08:03:43 +0000523 * @v_count: q_vectors allocated on adapter, used for ring interleaving
Jeff Kirsher8af3c332012-02-18 07:08:14 +0000524 * @v_idx: index of vector in adapter struct
Alexander Duyckd0bfcdf2012-03-28 08:03:43 +0000525 * @txr_count: total number of Tx rings to allocate
526 * @txr_idx: index of first Tx ring to allocate
527 * @rxr_count: total number of Rx rings to allocate
528 * @rxr_idx: index of first Rx ring to allocate
Jeff Kirsher8af3c332012-02-18 07:08:14 +0000529 *
530 * We allocate one q_vector. If allocation fails we return -ENOMEM.
531 **/
Alexander Duyckd0bfcdf2012-03-28 08:03:43 +0000532static int ixgbe_alloc_q_vector(struct ixgbe_adapter *adapter,
533 int v_count, int v_idx,
Jeff Kirsher8af3c332012-02-18 07:08:14 +0000534 int txr_count, int txr_idx,
535 int rxr_count, int rxr_idx)
536{
537 struct ixgbe_q_vector *q_vector;
538 struct ixgbe_ring *ring;
539 int node = -1;
540 int cpu = -1;
541 int ring_count, size;
542
543 ring_count = txr_count + rxr_count;
544 size = sizeof(struct ixgbe_q_vector) +
545 (sizeof(struct ixgbe_ring) * ring_count);
546
547 /* customize cpu for Flow Director mapping */
548 if (adapter->flags & IXGBE_FLAG_FDIR_HASH_CAPABLE) {
549 if (cpu_online(v_idx)) {
550 cpu = v_idx;
551 node = cpu_to_node(cpu);
552 }
553 }
554
555 /* allocate q_vector and rings */
556 q_vector = kzalloc_node(size, GFP_KERNEL, node);
557 if (!q_vector)
558 q_vector = kzalloc(size, GFP_KERNEL);
559 if (!q_vector)
560 return -ENOMEM;
561
562 /* setup affinity mask and node */
563 if (cpu != -1)
564 cpumask_set_cpu(cpu, &q_vector->affinity_mask);
565 else
566 cpumask_copy(&q_vector->affinity_mask, cpu_online_mask);
567 q_vector->numa_node = node;
568
569 /* initialize NAPI */
570 netif_napi_add(adapter->netdev, &q_vector->napi,
571 ixgbe_poll, 64);
572
573 /* tie q_vector and adapter together */
574 adapter->q_vector[v_idx] = q_vector;
575 q_vector->adapter = adapter;
576 q_vector->v_idx = v_idx;
577
578 /* initialize work limits */
579 q_vector->tx.work_limit = adapter->tx_work_limit;
580
581 /* initialize pointer to rings */
582 ring = q_vector->ring;
583
584 while (txr_count) {
585 /* assign generic ring traits */
586 ring->dev = &adapter->pdev->dev;
587 ring->netdev = adapter->netdev;
588
589 /* configure backlink on ring */
590 ring->q_vector = q_vector;
591
592 /* update q_vector Tx values */
593 ixgbe_add_ring(ring, &q_vector->tx);
594
595 /* apply Tx specific ring traits */
596 ring->count = adapter->tx_ring_count;
597 ring->queue_index = txr_idx;
598
599 /* assign ring to adapter */
600 adapter->tx_ring[txr_idx] = ring;
601
602 /* update count and index */
603 txr_count--;
Alexander Duyckd0bfcdf2012-03-28 08:03:43 +0000604 txr_idx += v_count;
Jeff Kirsher8af3c332012-02-18 07:08:14 +0000605
606 /* push pointer to next ring */
607 ring++;
608 }
609
610 while (rxr_count) {
611 /* assign generic ring traits */
612 ring->dev = &adapter->pdev->dev;
613 ring->netdev = adapter->netdev;
614
615 /* configure backlink on ring */
616 ring->q_vector = q_vector;
617
618 /* update q_vector Rx values */
619 ixgbe_add_ring(ring, &q_vector->rx);
620
621 /*
622 * 82599 errata, UDP frames with a 0 checksum
623 * can be marked as checksum errors.
624 */
625 if (adapter->hw.mac.type == ixgbe_mac_82599EB)
626 set_bit(__IXGBE_RX_CSUM_UDP_ZERO_ERR, &ring->state);
627
Alexander Duyckb2db4972012-04-07 04:57:29 +0000628#ifdef IXGBE_FCOE
629 if (adapter->netdev->features & NETIF_F_FCOE_MTU) {
630 struct ixgbe_ring_feature *f;
631 f = &adapter->ring_feature[RING_F_FCOE];
Alexander Duycke4b317e2012-05-05 05:30:53 +0000632 if ((rxr_idx >= f->offset) &&
633 (rxr_idx < f->offset + f->indices))
Alexander Duyck57efd442012-06-25 21:54:46 +0000634 set_bit(__IXGBE_RX_FCOE, &ring->state);
Alexander Duyckb2db4972012-04-07 04:57:29 +0000635 }
636
637#endif /* IXGBE_FCOE */
Jeff Kirsher8af3c332012-02-18 07:08:14 +0000638 /* apply Rx specific ring traits */
639 ring->count = adapter->rx_ring_count;
640 ring->queue_index = rxr_idx;
641
642 /* assign ring to adapter */
643 adapter->rx_ring[rxr_idx] = ring;
644
645 /* update count and index */
646 rxr_count--;
Alexander Duyckd0bfcdf2012-03-28 08:03:43 +0000647 rxr_idx += v_count;
Jeff Kirsher8af3c332012-02-18 07:08:14 +0000648
649 /* push pointer to next ring */
650 ring++;
651 }
652
653 return 0;
654}
655
656/**
657 * ixgbe_free_q_vector - Free memory allocated for specific interrupt vector
658 * @adapter: board private structure to initialize
659 * @v_idx: Index of vector to be freed
660 *
661 * This function frees the memory allocated to the q_vector. In addition if
662 * NAPI is enabled it will delete any references to the NAPI struct prior
663 * to freeing the q_vector.
664 **/
665static void ixgbe_free_q_vector(struct ixgbe_adapter *adapter, int v_idx)
666{
667 struct ixgbe_q_vector *q_vector = adapter->q_vector[v_idx];
668 struct ixgbe_ring *ring;
669
670 ixgbe_for_each_ring(ring, q_vector->tx)
671 adapter->tx_ring[ring->queue_index] = NULL;
672
673 ixgbe_for_each_ring(ring, q_vector->rx)
674 adapter->rx_ring[ring->queue_index] = NULL;
675
676 adapter->q_vector[v_idx] = NULL;
677 netif_napi_del(&q_vector->napi);
678
679 /*
680 * ixgbe_get_stats64() might access the rings on this vector,
681 * we must wait a grace period before freeing it.
682 */
683 kfree_rcu(q_vector, rcu);
684}
685
686/**
687 * ixgbe_alloc_q_vectors - Allocate memory for interrupt vectors
688 * @adapter: board private structure to initialize
689 *
690 * We allocate one q_vector per queue interrupt. If allocation fails we
691 * return -ENOMEM.
692 **/
693static int ixgbe_alloc_q_vectors(struct ixgbe_adapter *adapter)
694{
Alexander Duyck49c7ffb2012-05-05 05:30:43 +0000695 int q_vectors = adapter->num_q_vectors;
Jeff Kirsher8af3c332012-02-18 07:08:14 +0000696 int rxr_remaining = adapter->num_rx_queues;
697 int txr_remaining = adapter->num_tx_queues;
698 int rxr_idx = 0, txr_idx = 0, v_idx = 0;
699 int err;
700
701 /* only one q_vector if MSI-X is disabled. */
702 if (!(adapter->flags & IXGBE_FLAG_MSIX_ENABLED))
703 q_vectors = 1;
704
705 if (q_vectors >= (rxr_remaining + txr_remaining)) {
Alexander Duyckd0bfcdf2012-03-28 08:03:43 +0000706 for (; rxr_remaining; v_idx++) {
707 err = ixgbe_alloc_q_vector(adapter, q_vectors, v_idx,
708 0, 0, 1, rxr_idx);
Jeff Kirsher8af3c332012-02-18 07:08:14 +0000709
710 if (err)
711 goto err_out;
712
713 /* update counts and index */
Alexander Duyckd0bfcdf2012-03-28 08:03:43 +0000714 rxr_remaining--;
715 rxr_idx++;
Jeff Kirsher8af3c332012-02-18 07:08:14 +0000716 }
717 }
718
Alexander Duyckd0bfcdf2012-03-28 08:03:43 +0000719 for (; v_idx < q_vectors; v_idx++) {
720 int rqpv = DIV_ROUND_UP(rxr_remaining, q_vectors - v_idx);
721 int tqpv = DIV_ROUND_UP(txr_remaining, q_vectors - v_idx);
722 err = ixgbe_alloc_q_vector(adapter, q_vectors, v_idx,
Jeff Kirsher8af3c332012-02-18 07:08:14 +0000723 tqpv, txr_idx,
724 rqpv, rxr_idx);
725
726 if (err)
727 goto err_out;
728
729 /* update counts and index */
730 rxr_remaining -= rqpv;
Jeff Kirsher8af3c332012-02-18 07:08:14 +0000731 txr_remaining -= tqpv;
Alexander Duyckd0bfcdf2012-03-28 08:03:43 +0000732 rxr_idx++;
733 txr_idx++;
Jeff Kirsher8af3c332012-02-18 07:08:14 +0000734 }
735
736 return 0;
737
738err_out:
Alexander Duyck49c7ffb2012-05-05 05:30:43 +0000739 adapter->num_tx_queues = 0;
740 adapter->num_rx_queues = 0;
741 adapter->num_q_vectors = 0;
742
743 while (v_idx--)
Jeff Kirsher8af3c332012-02-18 07:08:14 +0000744 ixgbe_free_q_vector(adapter, v_idx);
Jeff Kirsher8af3c332012-02-18 07:08:14 +0000745
746 return -ENOMEM;
747}
748
749/**
750 * ixgbe_free_q_vectors - Free memory allocated for interrupt vectors
751 * @adapter: board private structure to initialize
752 *
753 * This function frees the memory allocated to the q_vectors. In addition if
754 * NAPI is enabled it will delete any references to the NAPI struct prior
755 * to freeing the q_vector.
756 **/
757static void ixgbe_free_q_vectors(struct ixgbe_adapter *adapter)
758{
Alexander Duyck49c7ffb2012-05-05 05:30:43 +0000759 int v_idx = adapter->num_q_vectors;
Jeff Kirsher8af3c332012-02-18 07:08:14 +0000760
Alexander Duyck49c7ffb2012-05-05 05:30:43 +0000761 adapter->num_tx_queues = 0;
762 adapter->num_rx_queues = 0;
763 adapter->num_q_vectors = 0;
Jeff Kirsher8af3c332012-02-18 07:08:14 +0000764
Alexander Duyck49c7ffb2012-05-05 05:30:43 +0000765 while (v_idx--)
Jeff Kirsher8af3c332012-02-18 07:08:14 +0000766 ixgbe_free_q_vector(adapter, v_idx);
767}
768
769static void ixgbe_reset_interrupt_capability(struct ixgbe_adapter *adapter)
770{
771 if (adapter->flags & IXGBE_FLAG_MSIX_ENABLED) {
772 adapter->flags &= ~IXGBE_FLAG_MSIX_ENABLED;
773 pci_disable_msix(adapter->pdev);
774 kfree(adapter->msix_entries);
775 adapter->msix_entries = NULL;
776 } else if (adapter->flags & IXGBE_FLAG_MSI_ENABLED) {
777 adapter->flags &= ~IXGBE_FLAG_MSI_ENABLED;
778 pci_disable_msi(adapter->pdev);
779 }
780}
781
782/**
783 * ixgbe_set_interrupt_capability - set MSI-X or MSI if supported
784 * @adapter: board private structure to initialize
785 *
786 * Attempt to configure the interrupts using the best available
787 * capabilities of the hardware and the kernel.
788 **/
789static int ixgbe_set_interrupt_capability(struct ixgbe_adapter *adapter)
790{
791 struct ixgbe_hw *hw = &adapter->hw;
792 int err = 0;
793 int vector, v_budget;
794
795 /*
796 * It's easy to be greedy for MSI-X vectors, but it really
797 * doesn't do us much good if we have a lot more vectors
798 * than CPU's. So let's be conservative and only ask for
799 * (roughly) the same number of vectors as there are CPU's.
800 * The default is to use pairs of vectors.
801 */
802 v_budget = max(adapter->num_rx_queues, adapter->num_tx_queues);
803 v_budget = min_t(int, v_budget, num_online_cpus());
804 v_budget += NON_Q_VECTORS;
805
806 /*
807 * At the same time, hardware can only support a maximum of
808 * hw.mac->max_msix_vectors vectors. With features
809 * such as RSS and VMDq, we can easily surpass the number of Rx and Tx
810 * descriptor queues supported by our device. Thus, we cap it off in
811 * those rare cases where the cpu count also exceeds our vector limit.
812 */
813 v_budget = min_t(int, v_budget, hw->mac.max_msix_vectors);
814
815 /* A failure in MSI-X entry allocation isn't fatal, but it does
816 * mean we disable MSI-X capabilities of the adapter. */
817 adapter->msix_entries = kcalloc(v_budget,
818 sizeof(struct msix_entry), GFP_KERNEL);
819 if (adapter->msix_entries) {
820 for (vector = 0; vector < v_budget; vector++)
821 adapter->msix_entries[vector].entry = vector;
822
823 ixgbe_acquire_msix_vectors(adapter, v_budget);
824
825 if (adapter->flags & IXGBE_FLAG_MSIX_ENABLED)
826 goto out;
827 }
828
829 adapter->flags &= ~IXGBE_FLAG_DCB_ENABLED;
830 adapter->flags &= ~IXGBE_FLAG_RSS_ENABLED;
831 if (adapter->flags & IXGBE_FLAG_FDIR_HASH_CAPABLE) {
832 e_err(probe,
833 "ATR is not supported while multiple "
834 "queues are disabled. Disabling Flow Director\n");
835 }
836 adapter->flags &= ~IXGBE_FLAG_FDIR_HASH_CAPABLE;
837 adapter->atr_sample_rate = 0;
838 if (adapter->flags & IXGBE_FLAG_SRIOV_ENABLED)
839 ixgbe_disable_sriov(adapter);
840
841 err = ixgbe_set_num_queues(adapter);
842 if (err)
843 return err;
844
Alexander Duyck49c7ffb2012-05-05 05:30:43 +0000845 adapter->num_q_vectors = 1;
846
Jeff Kirsher8af3c332012-02-18 07:08:14 +0000847 err = pci_enable_msi(adapter->pdev);
848 if (!err) {
849 adapter->flags |= IXGBE_FLAG_MSI_ENABLED;
850 } else {
851 netif_printk(adapter, hw, KERN_DEBUG, adapter->netdev,
852 "Unable to allocate MSI interrupt, "
853 "falling back to legacy. Error: %d\n", err);
854 /* reset err */
855 err = 0;
856 }
857
858out:
859 return err;
860}
861
862/**
863 * ixgbe_init_interrupt_scheme - Determine proper interrupt scheme
864 * @adapter: board private structure to initialize
865 *
866 * We determine which interrupt scheme to use based on...
867 * - Kernel support (MSI, MSI-X)
868 * - which can be user-defined (via MODULE_PARAM)
869 * - Hardware queue count (num_*_queues)
870 * - defined by miscellaneous hardware support/features (RSS, etc.)
871 **/
872int ixgbe_init_interrupt_scheme(struct ixgbe_adapter *adapter)
873{
874 int err;
875
876 /* Number of supported queues */
877 err = ixgbe_set_num_queues(adapter);
878 if (err)
879 return err;
880
881 err = ixgbe_set_interrupt_capability(adapter);
882 if (err) {
883 e_dev_err("Unable to setup interrupt capabilities\n");
884 goto err_set_interrupt;
885 }
886
887 err = ixgbe_alloc_q_vectors(adapter);
888 if (err) {
889 e_dev_err("Unable to allocate memory for queue vectors\n");
890 goto err_alloc_q_vectors;
891 }
892
893 ixgbe_cache_ring_register(adapter);
894
895 e_dev_info("Multiqueue %s: Rx Queue count = %u, Tx Queue count = %u\n",
896 (adapter->num_rx_queues > 1) ? "Enabled" : "Disabled",
897 adapter->num_rx_queues, adapter->num_tx_queues);
898
899 set_bit(__IXGBE_DOWN, &adapter->state);
900
901 return 0;
902
903err_alloc_q_vectors:
904 ixgbe_reset_interrupt_capability(adapter);
905err_set_interrupt:
906 return err;
907}
908
909/**
910 * ixgbe_clear_interrupt_scheme - Clear the current interrupt scheme settings
911 * @adapter: board private structure to clear interrupt scheme on
912 *
913 * We go through and clear interrupt specific resources and reset the structure
914 * to pre-load conditions
915 **/
916void ixgbe_clear_interrupt_scheme(struct ixgbe_adapter *adapter)
917{
918 adapter->num_tx_queues = 0;
919 adapter->num_rx_queues = 0;
920
921 ixgbe_free_q_vectors(adapter);
922 ixgbe_reset_interrupt_capability(adapter);
923}
924
925void ixgbe_tx_ctxtdesc(struct ixgbe_ring *tx_ring, u32 vlan_macip_lens,
926 u32 fcoe_sof_eof, u32 type_tucmd, u32 mss_l4len_idx)
927{
928 struct ixgbe_adv_tx_context_desc *context_desc;
929 u16 i = tx_ring->next_to_use;
930
931 context_desc = IXGBE_TX_CTXTDESC(tx_ring, i);
932
933 i++;
934 tx_ring->next_to_use = (i < tx_ring->count) ? i : 0;
935
936 /* set bits to identify this as an advanced context descriptor */
937 type_tucmd |= IXGBE_TXD_CMD_DEXT | IXGBE_ADVTXD_DTYP_CTXT;
938
939 context_desc->vlan_macip_lens = cpu_to_le32(vlan_macip_lens);
940 context_desc->seqnum_seed = cpu_to_le32(fcoe_sof_eof);
941 context_desc->type_tucmd_mlhl = cpu_to_le32(type_tucmd);
942 context_desc->mss_l4len_idx = cpu_to_le32(mss_l4len_idx);
943}
944