/*
 * Copyright (c) 2007 Mellanox Technologies. All rights reserved.
 *
 * This software is available to you under a choice of one of two
 * licenses.  You may choose to be licensed under the terms of the GNU
 * General Public License (GPL) Version 2, available from the file
 * COPYING in the main directory of this source tree, or the
 * OpenIB.org BSD license below:
 *
 *     Redistribution and use in source and binary forms, with or
 *     without modification, are permitted provided that the following
 *     conditions are met:
 *
 *      - Redistributions of source code must retain the above
 *        copyright notice, this list of conditions and the following
 *        disclaimer.
 *
 *      - Redistributions in binary form must reproduce the above
 *        copyright notice, this list of conditions and the following
 *        disclaimer in the documentation and/or other materials
 *        provided with the distribution.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 *
 */
33
34#ifndef _MLX4_EN_H_
35#define _MLX4_EN_H_
36
37#include <linux/compiler.h>
38#include <linux/list.h>
39#include <linux/mutex.h>
40#include <linux/netdevice.h>
41#include <linux/inet_lro.h>
42
43#include <linux/mlx4/device.h>
44#include <linux/mlx4/qp.h>
45#include <linux/mlx4/cq.h>
46#include <linux/mlx4/srq.h>
47#include <linux/mlx4/doorbell.h>
48
49#include "en_port.h"
50
/* Driver identification strings. */
#define DRV_NAME	"mlx4_en"
#define DRV_VERSION	"1.4.0"
#define DRV_RELDATE	"Sep 2008"

/* netif message-level mask made of the LINK and IFDOWN classes. */
#define MLX4_EN_MSG_LEVEL	(NETIF_MSG_LINK | NETIF_MSG_IFDOWN)
57
/*
 * Logging helpers.  Every message is prefixed with DRV_NAME and with the
 * name of the device reached through mdev->pdev->dev.
 *
 * mlx4_dbg() prints at KERN_DEBUG, and only when the NETIF_MSG_<mlevel>
 * bit is set in priv->msg_enable.  Its body is wrapped in
 * do { } while (0) so the macro expands to exactly one statement; a bare
 * "if" would silently capture the "else" branch of a caller's if/else.
 *
 * The priv/mdev arguments are parenthesized so any pointer expression can
 * be passed.  Note that mlx4_dbg() evaluates priv more than once.
 */
#define mlx4_dbg(mlevel, priv, format, arg...) \
	do { \
		if (NETIF_MSG_##mlevel & (priv)->msg_enable) \
			printk(KERN_DEBUG "%s %s: " format , DRV_NAME ,\
				(dev_name(&(priv)->mdev->pdev->dev)) , ## arg); \
	} while (0)

#define mlx4_err(mdev, format, arg...) \
	printk(KERN_ERR "%s %s: " format , DRV_NAME ,\
		(dev_name(&(mdev)->pdev->dev)) , ## arg)
#define mlx4_info(mdev, format, arg...) \
	printk(KERN_INFO "%s %s: " format , DRV_NAME ,\
		(dev_name(&(mdev)->pdev->dev)) , ## arg)
#define mlx4_warn(mdev, format, arg...) \
	printk(KERN_WARNING "%s %s: " format , DRV_NAME ,\
		(dev_name(&(mdev)->pdev->dev)) , ## arg)
/*
 * Device constants
 */

#define MLX4_EN_PAGE_SHIFT	12
#define MLX4_EN_PAGE_SIZE	(1 << MLX4_EN_PAGE_SHIFT)	/* 4096 */
#define MAX_TX_RINGS		16
#define MAX_RX_RINGS		16
#define MAX_RSS_MAP_SIZE	64
#define RSS_FACTOR		2
#define TXBB_SIZE		64
#define HEADROOM		(2048 / TXBB_SIZE + 1)		/* 33 */
#define MAX_LSO_HDR_SIZE	92
#define STAMP_STRIDE		64
#define STAMP_DWORDS		(STAMP_STRIDE / 4)		/* 16 */
#define STAMP_SHIFT		31
#define STAMP_VAL		0x7fffffff
#define STATS_DELAY		(HZ / 4)

/* Typical TSO descriptor with 16 gather entries is 352 bytes... */
#define MAX_DESC_SIZE		512
#define MAX_DESC_TXBBS		(MAX_DESC_SIZE / TXBB_SIZE)	/* 8 */
96
/*
 * OS related constants and tunables
 */

#define MLX4_EN_WATCHDOG_TIMEOUT	(15 * HZ)

/* Allocation size is PAGE_SIZE shifted left by the allocation order. */
#define MLX4_EN_ALLOC_ORDER	2
#define MLX4_EN_ALLOC_SIZE	(PAGE_SIZE << MLX4_EN_ALLOC_ORDER)

#define MLX4_EN_MAX_LRO_DESCRIPTORS	32
107
108/* Receive fragment sizes; we use at most 4 fragments (for 9600 byte MTU
109 * and 4K allocations) */
110enum {
111 FRAG_SZ0 = 512 - NET_IP_ALIGN,
112 FRAG_SZ1 = 1024,
113 FRAG_SZ2 = 4096,
114 FRAG_SZ3 = MLX4_EN_ALLOC_SIZE
115};
116#define MLX4_EN_MAX_RX_FRAGS 4
117
/* Minimum ring size for our page-allocation scheme to work */
#define MLX4_EN_MIN_RX_SIZE	(MLX4_EN_ALLOC_SIZE / SMP_CACHE_BYTES)
#define MLX4_EN_MIN_TX_SIZE	(4096 / TXBB_SIZE)

#define MLX4_EN_TX_RING_NUM		9
#define MLX4_EN_DEF_TX_RING_SIZE	1024
#define MLX4_EN_DEF_RX_RING_SIZE	1024

/* Target number of bytes to coalesce with interrupt moderation */
#define MLX4_EN_RX_COAL_TARGET	0x20000
#define MLX4_EN_RX_COAL_TIME	0x10

#define MLX4_EN_TX_COAL_PKTS	5
#define MLX4_EN_TX_COAL_TIME	0x80

#define MLX4_EN_RX_RATE_LOW		400000
#define MLX4_EN_RX_COAL_TIME_LOW	0
#define MLX4_EN_RX_RATE_HIGH		450000
#define MLX4_EN_RX_COAL_TIME_HIGH	128
#define MLX4_EN_RX_SIZE_THRESH		1024
#define MLX4_EN_RX_RATE_THRESH		(1000000 / MLX4_EN_RX_COAL_TIME_HIGH)
#define MLX4_EN_SAMPLE_INTERVAL		0

#define MLX4_EN_AUTO_CONF	0xffff

#define MLX4_EN_DEF_RX_PAUSE	1
#define MLX4_EN_DEF_TX_PAUSE	1

/* Interval between successive polls in the Tx routine when polling is used
   instead of interrupts (in per-core Tx rings) - should be power of 2 */
#define MLX4_EN_TX_POLL_MODER	16
#define MLX4_EN_TX_POLL_TIMEOUT	(HZ / 4)

#define ETH_LLC_SNAP_SIZE	8

#define SMALL_PACKET_SIZE	(256 - NET_IP_ALIGN)
#define HEADER_COPY_SIZE	(128 - NET_IP_ALIGN)

#define MLX4_EN_MIN_MTU		46
#define ETH_BCAST		0xffffffffffffULL
158
/*
 * Optional performance counters.  With MLX4_EN_PERF_STAT defined the macros
 * update/read the given counter; otherwise the update macros expand to empty
 * statements and the getters evaluate to 0.
 */
#ifdef MLX4_EN_PERF_STAT
/* Number of samples to 'average' */
#define AVG_SIZE			128
#define AVG_FACTOR			1024
#define NUM_PERF_STATS			NUM_PERF_COUNTERS

#define INC_PERF_COUNTER(cnt)		(++(cnt))
#define ADD_PERF_COUNTER(cnt, add)	((cnt) += (add))
/* Running average over AVG_SIZE samples, kept scaled by AVG_FACTOR. */
#define AVG_PERF_COUNTER(cnt, sample) \
	((cnt) = ((cnt) * (AVG_SIZE - 1) + (sample) * AVG_FACTOR) / AVG_SIZE)
#define GET_PERF_COUNTER(cnt)		(cnt)
#define GET_AVG_PERF_COUNTER(cnt)	((cnt) / AVG_FACTOR)

#else

#define NUM_PERF_STATS			0
#define INC_PERF_COUNTER(cnt)		do {} while (0)
#define ADD_PERF_COUNTER(cnt, add)	do {} while (0)
#define AVG_PERF_COUNTER(cnt, sample)	do {} while (0)
#define GET_PERF_COUNTER(cnt)		(0)
#define GET_AVG_PERF_COUNTER(cnt)	(0)
#endif /* MLX4_EN_PERF_STAT */
181
/*
 * Configurables
 */

/* Direction served by a completion queue (see mlx4_en_cq::is_tx). */
enum cq_type {
	RX = 0,
	TX = 1,
};
190
191
/*
 * Useful macros
 */
/* log2 of x after rounding x up to the next power of two. */
#define ROUNDUP_LOG2(x)		ilog2(roundup_pow_of_two(x))
/* True when x and y have the same truth value. */
#define XNOR(x, y)		(!(x) == !(y))
/*
 * True for the all-ones (48-bit) and all-zero MAC values.  The argument is
 * parenthesized so that expressions such as ILLEGAL_MAC(a & b) compare the
 * whole expression; it is evaluated twice, so avoid side effects.
 */
#define ILLEGAL_MAC(addr)	((addr) == 0xffffffffffffULL || (addr) == 0x0)
198
199
200struct mlx4_en_tx_info {
201 struct sk_buff *skb;
202 u32 nr_txbb;
203 u8 linear;
204 u8 data_offset;
Yevgeny Petrilin41efea52009-01-08 10:57:15 -0800205 u8 inl;
Yevgeny Petrilinc27a02c2008-10-22 15:47:49 -0700206};
207
208
#define MLX4_EN_BIT_DESC_OWN	0x80000000
/* Sizes of the WQE control and data segments. */
#define CTRL_SIZE	sizeof(struct mlx4_wqe_ctrl_seg)
#define MLX4_EN_MEMTYPE_PAD	0x100
#define DS_SIZE		sizeof(struct mlx4_wqe_data_seg)
213
214
215struct mlx4_en_tx_desc {
216 struct mlx4_wqe_ctrl_seg ctrl;
217 union {
218 struct mlx4_wqe_data_seg data; /* at least one data segment */
219 struct mlx4_wqe_lso_seg lso;
220 struct mlx4_wqe_inline_seg inl;
221 };
222};
223
#define MLX4_EN_USE_SRQ	0x01000000
225
226struct mlx4_en_rx_alloc {
227 struct page *page;
228 u16 offset;
229};
230
231struct mlx4_en_tx_ring {
232 struct mlx4_hwq_resources wqres;
233 u32 size ; /* number of TXBBs */
234 u32 size_mask;
235 u16 stride;
236 u16 cqn; /* index of port CQ associated with this ring */
237 u32 prod;
238 u32 cons;
239 u32 buf_size;
240 u32 doorbell_qpn;
241 void *buf;
242 u16 poll_cnt;
243 int blocked;
244 struct mlx4_en_tx_info *tx_info;
245 u8 *bounce_buf;
246 u32 last_nr_txbb;
247 struct mlx4_qp qp;
248 struct mlx4_qp_context context;
249 int qpn;
250 enum mlx4_qp_state qp_state;
251 struct mlx4_srq dummy;
252 unsigned long bytes;
253 unsigned long packets;
254 spinlock_t comp_lock;
255};
256
257struct mlx4_en_rx_desc {
258 struct mlx4_wqe_srq_next_seg next;
259 /* actual number of entries depends on rx ring stride */
260 struct mlx4_wqe_data_seg data[0];
261};
262
263struct mlx4_en_rx_ring {
264 struct mlx4_srq srq;
265 struct mlx4_hwq_resources wqres;
266 struct mlx4_en_rx_alloc page_alloc[MLX4_EN_MAX_RX_FRAGS];
267 struct net_lro_mgr lro;
268 u32 size ; /* number of Rx descs*/
269 u32 actual_size;
270 u32 size_mask;
271 u16 stride;
272 u16 log_stride;
273 u16 cqn; /* index of port CQ associated with this ring */
274 u32 prod;
275 u32 cons;
276 u32 buf_size;
277 int need_refill;
278 int full;
279 void *buf;
280 void *rx_info;
281 unsigned long bytes;
282 unsigned long packets;
283};
284
285
286static inline int mlx4_en_can_lro(__be16 status)
287{
288 return (status & cpu_to_be16(MLX4_CQE_STATUS_IPV4 |
289 MLX4_CQE_STATUS_IPV4F |
290 MLX4_CQE_STATUS_IPV6 |
291 MLX4_CQE_STATUS_IPV4OPT |
292 MLX4_CQE_STATUS_TCP |
293 MLX4_CQE_STATUS_UDP |
294 MLX4_CQE_STATUS_IPOK)) ==
295 cpu_to_be16(MLX4_CQE_STATUS_IPV4 |
296 MLX4_CQE_STATUS_IPOK |
297 MLX4_CQE_STATUS_TCP);
298}
299
300struct mlx4_en_cq {
301 struct mlx4_cq mcq;
302 struct mlx4_hwq_resources wqres;
303 int ring;
304 spinlock_t lock;
305 struct net_device *dev;
306 struct napi_struct napi;
307 /* Per-core Tx cq processing support */
308 struct timer_list timer;
309 int size;
310 int buf_size;
311 unsigned vector;
312 enum cq_type is_tx;
313 u16 moder_time;
314 u16 moder_cnt;
Yevgeny Petrilinc27a02c2008-10-22 15:47:49 -0700315 struct mlx4_cqe *buf;
316#define MLX4_EN_OPCODE_ERROR 0x1e
317};
318
319struct mlx4_en_port_profile {
320 u32 flags;
321 u32 tx_ring_num;
322 u32 rx_ring_num;
323 u32 tx_ring_size;
324 u32 rx_ring_size;
Yevgeny Petrilind53b93f2008-11-05 04:48:36 +0000325 u8 rx_pause;
326 u8 rx_ppp;
327 u8 tx_pause;
328 u8 tx_ppp;
Yevgeny Petrilinc27a02c2008-10-22 15:47:49 -0700329};
330
331struct mlx4_en_profile {
332 int rss_xor;
333 int num_lro;
334 u8 rss_mask;
335 u32 active_ports;
336 u32 small_pkt_int;
Yevgeny Petrilinc27a02c2008-10-22 15:47:49 -0700337 u8 no_reset;
338 struct mlx4_en_port_profile prof[MLX4_MAX_PORTS + 1];
339};
340
341struct mlx4_en_dev {
342 struct mlx4_dev *dev;
343 struct pci_dev *pdev;
344 struct mutex state_lock;
345 struct net_device *pndev[MLX4_MAX_PORTS + 1];
346 u32 port_cnt;
347 bool device_up;
348 struct mlx4_en_profile profile;
349 u32 LSO_support;
350 struct workqueue_struct *workqueue;
351 struct device *dma_device;
352 void __iomem *uar_map;
353 struct mlx4_uar priv_uar;
354 struct mlx4_mr mr;
355 u32 priv_pdn;
356 spinlock_t uar_lock;
357};
358
359
360struct mlx4_en_rss_map {
361 int size;
362 int base_qpn;
363 u16 map[MAX_RSS_MAP_SIZE];
364 struct mlx4_qp qps[MAX_RSS_MAP_SIZE];
365 enum mlx4_qp_state state[MAX_RSS_MAP_SIZE];
366 struct mlx4_qp indir_qp;
367 enum mlx4_qp_state indir_state;
368};
369
370struct mlx4_en_rss_context {
371 __be32 base_qpn;
372 __be32 default_qpn;
373 u16 reserved;
374 u8 hash_fn;
375 u8 flags;
376 __be32 rss_key[10];
377};
378
/* Packet counters: one broadcast counter plus eight Rx and eight Tx
 * per-priority counters.  NUM_PKT_STATS must equal the total number of
 * unsigned long counters in the struct (1 + 8 + 8). */
struct mlx4_en_pkt_stats {
	unsigned long broadcast;
	unsigned long rx_prio[8];
	unsigned long tx_prio[8];
#define NUM_PKT_STATS		17
};
385
/* Software-maintained port counters.  NUM_PORT_STATS must equal the number
 * of unsigned long members below. */
struct mlx4_en_port_stats {
	unsigned long lro_aggregated;
	unsigned long lro_flushed;
	unsigned long lro_no_desc;
	unsigned long tso_packets;
	unsigned long queue_stopped;
	unsigned long wake_queue;
	unsigned long tx_timeout;
	unsigned long rx_alloc_failed;
	unsigned long rx_chksum_good;
	unsigned long rx_chksum_none;
	unsigned long tx_chksum_offload;
#define NUM_PORT_STATS		11
};
400
401struct mlx4_en_perf_stats {
402 u32 tx_poll;
403 u64 tx_pktsz_avg;
404 u32 inflight_avg;
405 u16 tx_coal_avg;
406 u16 rx_coal_avg;
407 u32 napi_quota;
408#define NUM_PERF_COUNTERS 6
409};
410
411struct mlx4_en_frag_info {
412 u16 frag_size;
413 u16 frag_prefix_size;
414 u16 frag_stride;
415 u16 frag_align;
416 u16 last_offset;
417
418};
419
420struct mlx4_en_priv {
421 struct mlx4_en_dev *mdev;
422 struct mlx4_en_port_profile *prof;
423 struct net_device *dev;
424 struct vlan_group *vlgrp;
425 struct net_device_stats stats;
426 struct net_device_stats ret_stats;
427 spinlock_t stats_lock;
428
429 unsigned long last_moder_packets;
430 unsigned long last_moder_tx_packets;
431 unsigned long last_moder_bytes;
432 unsigned long last_moder_jiffies;
433 int last_moder_time;
434 u16 rx_usecs;
435 u16 rx_frames;
436 u16 tx_usecs;
437 u16 tx_frames;
438 u32 pkt_rate_low;
439 u16 rx_usecs_low;
440 u32 pkt_rate_high;
441 u16 rx_usecs_high;
442 u16 sample_interval;
443 u16 adaptive_rx_coal;
444 u32 msg_enable;
445
446 struct mlx4_hwq_resources res;
447 int link_state;
448 int last_link_state;
449 bool port_up;
450 int port;
451 int registered;
452 int allocated;
453 int stride;
454 int rx_csum;
455 u64 mac;
456 int mac_index;
457 unsigned max_mtu;
458 int base_qpn;
459
460 struct mlx4_en_rss_map rss_map;
461 u16 tx_prio_map[8];
462 u32 flags;
463#define MLX4_EN_FLAG_PROMISC 0x1
464 u32 tx_ring_num;
465 u32 rx_ring_num;
466 u32 rx_skb_size;
467 struct mlx4_en_frag_info frag_info[MLX4_EN_MAX_RX_FRAGS];
468 u16 num_frags;
469 u16 log_rx_info;
470
471 struct mlx4_en_tx_ring tx_ring[MAX_TX_RINGS];
472 struct mlx4_en_rx_ring rx_ring[MAX_RX_RINGS];
473 struct mlx4_en_cq tx_cq[MAX_TX_RINGS];
474 struct mlx4_en_cq rx_cq[MAX_RX_RINGS];
475 struct work_struct mcast_task;
476 struct work_struct mac_task;
477 struct delayed_work refill_task;
478 struct work_struct watchdog_task;
479 struct work_struct linkstate_task;
480 struct delayed_work stats_task;
481 struct mlx4_en_perf_stats pstats;
482 struct mlx4_en_pkt_stats pkstats;
483 struct mlx4_en_port_stats port_stats;
484 struct dev_mc_list *mc_list;
485 struct mlx4_en_stat_out_mbox hw_stats;
486};
487
488
/* Net device, port, resource and profile entry points (defined in the
 * driver's .c files). */
void mlx4_en_destroy_netdev(struct net_device *dev);
int mlx4_en_init_netdev(struct mlx4_en_dev *mdev, int port,
			struct mlx4_en_port_profile *prof);

int mlx4_en_start_port(struct net_device *dev);
void mlx4_en_stop_port(struct net_device *dev);

void mlx4_en_free_resources(struct mlx4_en_priv *priv);
int mlx4_en_alloc_resources(struct mlx4_en_priv *priv);

int mlx4_en_get_profile(struct mlx4_en_dev *mdev);
500
501int mlx4_en_create_cq(struct mlx4_en_priv *priv, struct mlx4_en_cq *cq,
502 int entries, int ring, enum cq_type mode);
503void mlx4_en_destroy_cq(struct mlx4_en_priv *priv, struct mlx4_en_cq *cq);
504int mlx4_en_activate_cq(struct mlx4_en_priv *priv, struct mlx4_en_cq *cq);
505void mlx4_en_deactivate_cq(struct mlx4_en_priv *priv, struct mlx4_en_cq *cq);
506int mlx4_en_set_cq_moder(struct mlx4_en_priv *priv, struct mlx4_en_cq *cq);
507int mlx4_en_arm_cq(struct mlx4_en_priv *priv, struct mlx4_en_cq *cq);
508
509void mlx4_en_poll_tx_cq(unsigned long data);
510void mlx4_en_tx_irq(struct mlx4_cq *mcq);
511int mlx4_en_xmit(struct sk_buff *skb, struct net_device *dev);
512
513int mlx4_en_create_tx_ring(struct mlx4_en_priv *priv, struct mlx4_en_tx_ring *ring,
514 u32 size, u16 stride);
515void mlx4_en_destroy_tx_ring(struct mlx4_en_priv *priv, struct mlx4_en_tx_ring *ring);
516int mlx4_en_activate_tx_ring(struct mlx4_en_priv *priv,
517 struct mlx4_en_tx_ring *ring,
518 int cq, int srqn);
519void mlx4_en_deactivate_tx_ring(struct mlx4_en_priv *priv,
520 struct mlx4_en_tx_ring *ring);
521
522int mlx4_en_create_rx_ring(struct mlx4_en_priv *priv,
523 struct mlx4_en_rx_ring *ring,
524 u32 size, u16 stride);
525void mlx4_en_destroy_rx_ring(struct mlx4_en_priv *priv,
526 struct mlx4_en_rx_ring *ring);
527int mlx4_en_activate_rx_rings(struct mlx4_en_priv *priv);
528void mlx4_en_deactivate_rx_ring(struct mlx4_en_priv *priv,
529 struct mlx4_en_rx_ring *ring);
530int mlx4_en_process_rx_cq(struct net_device *dev,
531 struct mlx4_en_cq *cq,
532 int budget);
533int mlx4_en_poll_rx_cq(struct napi_struct *napi, int budget);
534void mlx4_en_fill_qp_context(struct mlx4_en_priv *priv, int size, int stride,
535 int is_tx, int rss, int qpn, int cqn, int srqn,
536 struct mlx4_qp_context *context);
537int mlx4_en_map_buffer(struct mlx4_buf *buf);
538void mlx4_en_unmap_buffer(struct mlx4_buf *buf);
539
540void mlx4_en_calc_rx_buf(struct net_device *dev);
541void mlx4_en_set_default_rss_map(struct mlx4_en_priv *priv,
542 struct mlx4_en_rss_map *rss_map,
543 int num_entries, int num_rings);
544void mlx4_en_set_prio_map(struct mlx4_en_priv *priv, u16 *prio_map, u32 ring_num);
545int mlx4_en_config_rss_steer(struct mlx4_en_priv *priv);
546void mlx4_en_release_rss_steer(struct mlx4_en_priv *priv);
547int mlx4_en_free_tx_buf(struct net_device *dev, struct mlx4_en_tx_ring *ring);
548void mlx4_en_rx_refill(struct work_struct *work);
549void mlx4_en_rx_irq(struct mlx4_cq *mcq);
550
551int mlx4_SET_MCAST_FLTR(struct mlx4_dev *dev, u8 port, u64 mac, u64 clear, u8 mode);
552int mlx4_SET_VLAN_FLTR(struct mlx4_dev *dev, u8 port, struct vlan_group *grp);
553int mlx4_SET_PORT_general(struct mlx4_dev *dev, u8 port, int mtu,
554 u8 pptx, u8 pfctx, u8 pprx, u8 pfcrx);
555int mlx4_SET_PORT_qpn_calc(struct mlx4_dev *dev, u8 port, u32 base_qpn,
556 u8 promisc);
557
558int mlx4_en_DUMP_ETH_STATS(struct mlx4_en_dev *mdev, u8 port, u8 reset);
559
/*
 * Globals
 */
/* ethtool operations table; declared here, defined in a .c file. */
extern const struct ethtool_ops mlx4_en_ethtool_ops;
564#endif