Blame - drivers/net/ethernet/qlogic/qede/qede_fp.c - kernel/msm-5.4

blob: c61cfcfbbd56ef29ea7d09154af2d732e32fc5dd [file] [log] [blame]

Mintz, Yuval	cdda926	2017-01-01 13:57:01 +0200	[diff] [blame]	1	/* QLogic qede NIC Driver
				2	* Copyright (c) 2015-2017 QLogic Corporation
				3	*
				4	* This software is available to you under a choice of one of two
				5	* licenses. You may choose to be licensed under the terms of the GNU
				6	* General Public License (GPL) Version 2, available from the file
				7	* COPYING in the main directory of this source tree, or the
				8	* OpenIB.org BSD license below:
				9	*
				10	* Redistribution and use in source and binary forms, with or
				11	* without modification, are permitted provided that the following
				12	* conditions are met:
				13	*
				14	* - Redistributions of source code must retain the above
				15	* copyright notice, this list of conditions and the following
				16	* disclaimer.
				17	*
				18	* - Redistributions in binary form must reproduce the above
				19	* copyright notice, this list of conditions and the following
				20	* disclaimer in the documentation and /or other materials
				21	* provided with the distribution.
				22	*
				23	* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
				24	* EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
				25	* MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
				26	* NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
				27	* BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
				28	* ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
				29	* CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
				30	* SOFTWARE.
				31	*/
				32	#include <linux/netdevice.h>
				33	#include <linux/etherdevice.h>
				34	#include <linux/skbuff.h>
Daniel Borkmann	a67edbf	2017-01-25 02:28:18 +0100	[diff] [blame]	35	#include <linux/bpf_trace.h>
Mintz, Yuval	cdda926	2017-01-01 13:57:01 +0200	[diff] [blame]	36	#include <net/udp_tunnel.h>
				37	#include <linux/ip.h>
				38	#include <net/ipv6.h>
				39	#include <net/tcp.h>
				40	#include <linux/if_ether.h>
				41	#include <linux/if_vlan.h>
				42	#include <net/ip6_checksum.h>
Sudarsana Reddy Kalluru	4c55215	2017-02-15 10:24:11 +0200	[diff] [blame]	43	#include "qede_ptp.h"
Mintz, Yuval	cdda926	2017-01-01 13:57:01 +0200	[diff] [blame]	44
				45	#include <linux/qed/qed_if.h>
				46	#include "qede.h"
				47	/*********************************
				48	* Content also used by slowpath *
				49	*********************************/
				50
Mintz, Yuval	e3eef7e	2017-01-01 13:57:04 +0200	[diff] [blame]	51	int qede_alloc_rx_buffer(struct qede_rx_queue *rxq, bool allow_lazy)
Mintz, Yuval	cdda926	2017-01-01 13:57:01 +0200	[diff] [blame]	52	{
				53	struct sw_rx_data *sw_rx_data;
				54	struct eth_rx_bd *rx_bd;
				55	dma_addr_t mapping;
				56	struct page *data;
				57
Mintz, Yuval	e3eef7e	2017-01-01 13:57:04 +0200	[diff] [blame]	58	/* In case lazy-allocation is allowed, postpone allocation until the
				59	* end of the NAPI run. We'd still need to make sure the Rx ring has
				60	* sufficient buffers to guarantee an additional Rx interrupt.
				61	*/
				62	if (allow_lazy && likely(rxq->filled_buffers > 12)) {
				63	rxq->filled_buffers--;
				64	return 0;
				65	}
				66
Mintz, Yuval	cdda926	2017-01-01 13:57:01 +0200	[diff] [blame]	67	data = alloc_pages(GFP_ATOMIC, 0);
				68	if (unlikely(!data))
				69	return -ENOMEM;
				70
				71	/* Map the entire page as it would be used
				72	* for multiple RX buffer segment size mapping.
				73	*/
				74	mapping = dma_map_page(rxq->dev, data, 0,
				75	PAGE_SIZE, rxq->data_direction);
				76	if (unlikely(dma_mapping_error(rxq->dev, mapping))) {
				77	__free_page(data);
				78	return -ENOMEM;
				79	}
				80
				81	sw_rx_data = &rxq->sw_rx_ring[rxq->sw_rx_prod & NUM_RX_BDS_MAX];
				82	sw_rx_data->page_offset = 0;
				83	sw_rx_data->data = data;
				84	sw_rx_data->mapping = mapping;
				85
				86	/* Advance PROD and get BD pointer */
				87	rx_bd = (struct eth_rx_bd *)qed_chain_produce(&rxq->rx_bd_ring);
				88	WARN_ON(!rx_bd);
				89	rx_bd->addr.hi = cpu_to_le32(upper_32_bits(mapping));
				90	rx_bd->addr.lo = cpu_to_le32(lower_32_bits(mapping));
				91
				92	rxq->sw_rx_prod++;
Mintz, Yuval	e3eef7e	2017-01-01 13:57:04 +0200	[diff] [blame]	93	rxq->filled_buffers++;
Mintz, Yuval	cdda926	2017-01-01 13:57:01 +0200	[diff] [blame]	94
				95	return 0;
				96	}
				97
				98	/* Unmap the data and free skb */
				99	int qede_free_tx_pkt(struct qede_dev edev, struct qede_tx_queue txq, int *len)
				100	{
				101	u16 idx = txq->sw_tx_cons & NUM_TX_BDS_MAX;
				102	struct sk_buff *skb = txq->sw_tx_ring.skbs[idx].skb;
				103	struct eth_tx_1st_bd *first_bd;
				104	struct eth_tx_bd *tx_data_bd;
				105	int bds_consumed = 0;
				106	int nbds;
				107	bool data_split = txq->sw_tx_ring.skbs[idx].flags & QEDE_TSO_SPLIT_BD;
				108	int i, split_bd_len = 0;
				109
				110	if (unlikely(!skb)) {
				111	DP_ERR(edev,
				112	"skb is null for txq idx=%d txq->sw_tx_cons=%d txq->sw_tx_prod=%d\n",
				113	idx, txq->sw_tx_cons, txq->sw_tx_prod);
				114	return -1;
				115	}
				116
				117	*len = skb->len;
				118
				119	first_bd = (struct eth_tx_1st_bd *)qed_chain_consume(&txq->tx_pbl);
				120
				121	bds_consumed++;
				122
				123	nbds = first_bd->data.nbds;
				124
				125	if (data_split) {
				126	struct eth_tx_bd split = (struct eth_tx_bd )
				127	qed_chain_consume(&txq->tx_pbl);
				128	split_bd_len = BD_UNMAP_LEN(split);
				129	bds_consumed++;
				130	}
				131	dma_unmap_single(&edev->pdev->dev, BD_UNMAP_ADDR(first_bd),
				132	BD_UNMAP_LEN(first_bd) + split_bd_len, DMA_TO_DEVICE);
				133
				134	/* Unmap the data of the skb frags */
				135	for (i = 0; i < skb_shinfo(skb)->nr_frags; i++, bds_consumed++) {
				136	tx_data_bd = (struct eth_tx_bd *)
				137	qed_chain_consume(&txq->tx_pbl);
				138	dma_unmap_page(&edev->pdev->dev, BD_UNMAP_ADDR(tx_data_bd),
				139	BD_UNMAP_LEN(tx_data_bd), DMA_TO_DEVICE);
				140	}
				141
				142	while (bds_consumed++ < nbds)
				143	qed_chain_consume(&txq->tx_pbl);
				144
				145	/* Free skb */
				146	dev_kfree_skb_any(skb);
				147	txq->sw_tx_ring.skbs[idx].skb = NULL;
				148	txq->sw_tx_ring.skbs[idx].flags = 0;
				149
				150	return 0;
				151	}
				152
				153	/* Unmap the data and free skb when mapping failed during start_xmit */
				154	static void qede_free_failed_tx_pkt(struct qede_tx_queue *txq,
				155	struct eth_tx_1st_bd *first_bd,
				156	int nbd, bool data_split)
				157	{
				158	u16 idx = txq->sw_tx_prod & NUM_TX_BDS_MAX;
				159	struct sk_buff *skb = txq->sw_tx_ring.skbs[idx].skb;
				160	struct eth_tx_bd *tx_data_bd;
				161	int i, split_bd_len = 0;
				162
				163	/* Return prod to its position before this skb was handled */
				164	qed_chain_set_prod(&txq->tx_pbl,
				165	le16_to_cpu(txq->tx_db.data.bd_prod), first_bd);
				166
				167	first_bd = (struct eth_tx_1st_bd *)qed_chain_produce(&txq->tx_pbl);
				168
				169	if (data_split) {
				170	struct eth_tx_bd split = (struct eth_tx_bd )
				171	qed_chain_produce(&txq->tx_pbl);
				172	split_bd_len = BD_UNMAP_LEN(split);
				173	nbd--;
				174	}
				175
				176	dma_unmap_single(txq->dev, BD_UNMAP_ADDR(first_bd),
				177	BD_UNMAP_LEN(first_bd) + split_bd_len, DMA_TO_DEVICE);
				178
				179	/* Unmap the data of the skb frags */
				180	for (i = 0; i < nbd; i++) {
				181	tx_data_bd = (struct eth_tx_bd *)
				182	qed_chain_produce(&txq->tx_pbl);
				183	if (tx_data_bd->nbytes)
				184	dma_unmap_page(txq->dev,
				185	BD_UNMAP_ADDR(tx_data_bd),
				186	BD_UNMAP_LEN(tx_data_bd), DMA_TO_DEVICE);
				187	}
				188
				189	/* Return again prod to its position before this skb was handled */
				190	qed_chain_set_prod(&txq->tx_pbl,
				191	le16_to_cpu(txq->tx_db.data.bd_prod), first_bd);
				192
				193	/* Free skb */
				194	dev_kfree_skb_any(skb);
				195	txq->sw_tx_ring.skbs[idx].skb = NULL;
				196	txq->sw_tx_ring.skbs[idx].flags = 0;
				197	}
				198
				199	static u32 qede_xmit_type(struct sk_buff skb, int ipv6_ext)
				200	{
				201	u32 rc = XMIT_L4_CSUM;
				202	__be16 l3_proto;
				203
				204	if (skb->ip_summed != CHECKSUM_PARTIAL)
				205	return XMIT_PLAIN;
				206
				207	l3_proto = vlan_get_protocol(skb);
				208	if (l3_proto == htons(ETH_P_IPV6) &&
				209	(ipv6_hdr(skb)->nexthdr == NEXTHDR_IPV6))
				210	*ipv6_ext = 1;
				211
				212	if (skb->encapsulation) {
				213	rc \|= XMIT_ENC;
				214	if (skb_is_gso(skb)) {
				215	unsigned short gso_type = skb_shinfo(skb)->gso_type;
				216
				217	if ((gso_type & SKB_GSO_UDP_TUNNEL_CSUM) \|\|
				218	(gso_type & SKB_GSO_GRE_CSUM))
				219	rc \|= XMIT_ENC_GSO_L4_CSUM;
				220
				221	rc \|= XMIT_LSO;
				222	return rc;
				223	}
				224	}
				225
				226	if (skb_is_gso(skb))
				227	rc \|= XMIT_LSO;
				228
				229	return rc;
				230	}
				231
				232	static void qede_set_params_for_ipv6_ext(struct sk_buff *skb,
				233	struct eth_tx_2nd_bd *second_bd,
				234	struct eth_tx_3rd_bd *third_bd)
				235	{
				236	u8 l4_proto;
				237	u16 bd2_bits1 = 0, bd2_bits2 = 0;
				238
				239	bd2_bits1 \|= (1 << ETH_TX_DATA_2ND_BD_IPV6_EXT_SHIFT);
				240
				241	bd2_bits2 \|= ((((u8 *)skb_transport_header(skb) - skb->data) >> 1) &
				242	ETH_TX_DATA_2ND_BD_L4_HDR_START_OFFSET_W_MASK)
				243	<< ETH_TX_DATA_2ND_BD_L4_HDR_START_OFFSET_W_SHIFT;
				244
				245	bd2_bits1 \|= (ETH_L4_PSEUDO_CSUM_CORRECT_LENGTH <<
				246	ETH_TX_DATA_2ND_BD_L4_PSEUDO_CSUM_MODE_SHIFT);
				247
				248	if (vlan_get_protocol(skb) == htons(ETH_P_IPV6))
				249	l4_proto = ipv6_hdr(skb)->nexthdr;
				250	else
				251	l4_proto = ip_hdr(skb)->protocol;
				252
				253	if (l4_proto == IPPROTO_UDP)
				254	bd2_bits1 \|= 1 << ETH_TX_DATA_2ND_BD_L4_UDP_SHIFT;
				255
				256	if (third_bd)
				257	third_bd->data.bitfields \|=
				258	cpu_to_le16(((tcp_hdrlen(skb) / 4) &
				259	ETH_TX_DATA_3RD_BD_TCP_HDR_LEN_DW_MASK) <<
				260	ETH_TX_DATA_3RD_BD_TCP_HDR_LEN_DW_SHIFT);
				261
				262	second_bd->data.bitfields1 = cpu_to_le16(bd2_bits1);
				263	second_bd->data.bitfields2 = cpu_to_le16(bd2_bits2);
				264	}
				265
				266	static int map_frag_to_bd(struct qede_tx_queue *txq,
				267	skb_frag_t frag, struct eth_tx_bd bd)
				268	{
				269	dma_addr_t mapping;
				270
				271	/* Map skb non-linear frag data for DMA */
				272	mapping = skb_frag_dma_map(txq->dev, frag, 0,
				273	skb_frag_size(frag), DMA_TO_DEVICE);
				274	if (unlikely(dma_mapping_error(txq->dev, mapping)))
				275	return -ENOMEM;
				276
				277	/* Setup the data pointer of the frag data */
				278	BD_SET_UNMAP_ADDR_LEN(bd, mapping, skb_frag_size(frag));
				279
				280	return 0;
				281	}
				282
				283	static u16 qede_get_skb_hlen(struct sk_buff *skb, bool is_encap_pkt)
				284	{
				285	if (is_encap_pkt)
				286	return (skb_inner_transport_header(skb) +
				287	inner_tcp_hdrlen(skb) - skb->data);
				288	else
				289	return (skb_transport_header(skb) +
				290	tcp_hdrlen(skb) - skb->data);
				291	}
				292
				293	/* +2 for 1st BD for headers and 2nd BD for headlen (if required) */
				294	#if ((MAX_SKB_FRAGS + 2) > ETH_TX_MAX_BDS_PER_NON_LSO_PACKET)
				295	static bool qede_pkt_req_lin(struct sk_buff *skb, u8 xmit_type)
				296	{
				297	int allowed_frags = ETH_TX_MAX_BDS_PER_NON_LSO_PACKET - 1;
				298
				299	if (xmit_type & XMIT_LSO) {
				300	int hlen;
				301
				302	hlen = qede_get_skb_hlen(skb, xmit_type & XMIT_ENC);
				303
				304	/* linear payload would require its own BD */
				305	if (skb_headlen(skb) > hlen)
				306	allowed_frags--;
				307	}
				308
				309	return (skb_shinfo(skb)->nr_frags > allowed_frags);
				310	}
				311	#endif
				312
				313	static inline void qede_update_tx_producer(struct qede_tx_queue *txq)
				314	{
				315	/* wmb makes sure that the BDs data is updated before updating the
				316	* producer, otherwise FW may read old data from the BDs.
				317	*/
				318	wmb();
				319	barrier();
				320	writel(txq->tx_db.raw, txq->doorbell_addr);
				321
				322	/* mmiowb is needed to synchronize doorbell writes from more than one
				323	* processor. It guarantees that the write arrives to the device before
				324	* the queue lock is released and another start_xmit is called (possibly
				325	* on another CPU). Without this barrier, the next doorbell can bypass
				326	* this doorbell. This is applicable to IA64/Altix systems.
				327	*/
				328	mmiowb();
				329	}
				330
				331	static int qede_xdp_xmit(struct qede_dev edev, struct qede_fastpath fp,
				332	struct sw_rx_data *metadata, u16 padding, u16 length)
				333	{
				334	struct qede_tx_queue *txq = fp->xdp_tx;
				335	u16 idx = txq->sw_tx_prod & NUM_TX_BDS_MAX;
				336	struct eth_tx_1st_bd *first_bd;
				337
				338	if (!qed_chain_get_elem_left(&txq->tx_pbl)) {
				339	txq->stopped_cnt++;
				340	return -ENOMEM;
				341	}
				342
				343	first_bd = (struct eth_tx_1st_bd *)qed_chain_produce(&txq->tx_pbl);
				344
				345	memset(first_bd, 0, sizeof(*first_bd));
				346	first_bd->data.bd_flags.bitfields =
				347	BIT(ETH_TX_1ST_BD_FLAGS_START_BD_SHIFT);
				348	first_bd->data.bitfields \|=
				349	(length & ETH_TX_DATA_1ST_BD_PKT_LEN_MASK) <<
				350	ETH_TX_DATA_1ST_BD_PKT_LEN_SHIFT;
				351	first_bd->data.nbds = 1;
				352
				353	/* We can safely ignore the offset, as it's 0 for XDP */
				354	BD_SET_UNMAP_ADDR_LEN(first_bd, metadata->mapping + padding, length);
				355
				356	/* Synchronize the buffer back to device, as program [probably]
				357	* has changed it.
				358	*/
				359	dma_sync_single_for_device(&edev->pdev->dev,
				360	metadata->mapping + padding,
				361	length, PCI_DMA_TODEVICE);
				362
Mintz, Yuval	89e1afc	2017-04-07 11:04:58 +0300	[diff] [blame^]	363	txq->sw_tx_ring.xdp[idx].page = metadata->data;
				364	txq->sw_tx_ring.xdp[idx].mapping = metadata->mapping;
Mintz, Yuval	cdda926	2017-01-01 13:57:01 +0200	[diff] [blame]	365	txq->sw_tx_prod++;
				366
				367	/* Mark the fastpath for future XDP doorbell */
				368	fp->xdp_xmit = 1;
				369
				370	return 0;
				371	}
				372
				373	int qede_txq_has_work(struct qede_tx_queue *txq)
				374	{
				375	u16 hw_bd_cons;
				376
				377	/* Tell compiler that consumer and producer can change */
				378	barrier();
				379	hw_bd_cons = le16_to_cpu(*txq->hw_cons_ptr);
				380	if (qed_chain_get_cons_idx(&txq->tx_pbl) == hw_bd_cons + 1)
				381	return 0;
				382
				383	return hw_bd_cons != qed_chain_get_cons_idx(&txq->tx_pbl);
				384	}
				385
				386	static void qede_xdp_tx_int(struct qede_dev edev, struct qede_tx_queue txq)
				387	{
Mintz, Yuval	89e1afc	2017-04-07 11:04:58 +0300	[diff] [blame^]	388	u16 hw_bd_cons, idx;
Mintz, Yuval	cdda926	2017-01-01 13:57:01 +0200	[diff] [blame]	389
				390	hw_bd_cons = le16_to_cpu(*txq->hw_cons_ptr);
				391	barrier();
				392
				393	while (hw_bd_cons != qed_chain_get_cons_idx(&txq->tx_pbl)) {
Mintz, Yuval	89e1afc	2017-04-07 11:04:58 +0300	[diff] [blame^]	394	qed_chain_consume(&txq->tx_pbl);
				395	idx = txq->sw_tx_cons & NUM_TX_BDS_MAX;
Mintz, Yuval	cdda926	2017-01-01 13:57:01 +0200	[diff] [blame]	396
Mintz, Yuval	89e1afc	2017-04-07 11:04:58 +0300	[diff] [blame^]	397	dma_unmap_page(&edev->pdev->dev,
				398	txq->sw_tx_ring.xdp[idx].mapping,
				399	PAGE_SIZE, DMA_BIDIRECTIONAL);
				400	__free_page(txq->sw_tx_ring.xdp[idx].page);
Mintz, Yuval	cdda926	2017-01-01 13:57:01 +0200	[diff] [blame]	401
				402	txq->sw_tx_cons++;
				403	txq->xmit_pkts++;
				404	}
				405	}
				406
				407	static int qede_tx_int(struct qede_dev edev, struct qede_tx_queue txq)
				408	{
				409	struct netdev_queue *netdev_txq;
				410	u16 hw_bd_cons;
				411	unsigned int pkts_compl = 0, bytes_compl = 0;
				412	int rc;
				413
				414	netdev_txq = netdev_get_tx_queue(edev->ndev, txq->index);
				415
				416	hw_bd_cons = le16_to_cpu(*txq->hw_cons_ptr);
				417	barrier();
				418
				419	while (hw_bd_cons != qed_chain_get_cons_idx(&txq->tx_pbl)) {
				420	int len = 0;
				421
				422	rc = qede_free_tx_pkt(edev, txq, &len);
				423	if (rc) {
				424	DP_NOTICE(edev, "hw_bd_cons = %d, chain_cons=%d\n",
				425	hw_bd_cons,
				426	qed_chain_get_cons_idx(&txq->tx_pbl));
				427	break;
				428	}
				429
				430	bytes_compl += len;
				431	pkts_compl++;
				432	txq->sw_tx_cons++;
				433	txq->xmit_pkts++;
				434	}
				435
				436	netdev_tx_completed_queue(netdev_txq, pkts_compl, bytes_compl);
				437
				438	/* Need to make the tx_bd_cons update visible to start_xmit()
				439	* before checking for netif_tx_queue_stopped(). Without the
				440	* memory barrier, there is a small possibility that
				441	* start_xmit() will miss it and cause the queue to be stopped
				442	* forever.
				443	* On the other hand we need an rmb() here to ensure the proper
				444	* ordering of bit testing in the following
				445	* netif_tx_queue_stopped(txq) call.
				446	*/
				447	smp_mb();
				448
				449	if (unlikely(netif_tx_queue_stopped(netdev_txq))) {
				450	/* Taking tx_lock is needed to prevent reenabling the queue
				451	* while it's empty. This could have happen if rx_action() gets
				452	* suspended in qede_tx_int() after the condition before
				453	* netif_tx_wake_queue(), while tx_action (qede_start_xmit()):
				454	*
				455	* stops the queue->sees fresh tx_bd_cons->releases the queue->
				456	* sends some packets consuming the whole queue again->
				457	* stops the queue
				458	*/
				459
				460	__netif_tx_lock(netdev_txq, smp_processor_id());
				461
				462	if ((netif_tx_queue_stopped(netdev_txq)) &&
				463	(edev->state == QEDE_STATE_OPEN) &&
				464	(qed_chain_get_elem_left(&txq->tx_pbl)
				465	>= (MAX_SKB_FRAGS + 1))) {
				466	netif_tx_wake_queue(netdev_txq);
				467	DP_VERBOSE(edev, NETIF_MSG_TX_DONE,
				468	"Wake queue was called\n");
				469	}
				470
				471	__netif_tx_unlock(netdev_txq);
				472	}
				473
				474	return 0;
				475	}
				476
				477	bool qede_has_rx_work(struct qede_rx_queue *rxq)
				478	{
				479	u16 hw_comp_cons, sw_comp_cons;
				480
				481	/* Tell compiler that status block fields can change */
				482	barrier();
				483
				484	hw_comp_cons = le16_to_cpu(*rxq->hw_cons_ptr);
				485	sw_comp_cons = qed_chain_get_cons_idx(&rxq->rx_comp_ring);
				486
				487	return hw_comp_cons != sw_comp_cons;
				488	}
				489
				490	static inline void qede_rx_bd_ring_consume(struct qede_rx_queue *rxq)
				491	{
				492	qed_chain_consume(&rxq->rx_bd_ring);
				493	rxq->sw_rx_cons++;
				494	}
				495
				496	/* This function reuses the buffer(from an offset) from
				497	* consumer index to producer index in the bd ring
				498	*/
				499	static inline void qede_reuse_page(struct qede_rx_queue *rxq,
				500	struct sw_rx_data *curr_cons)
				501	{
				502	struct eth_rx_bd *rx_bd_prod = qed_chain_produce(&rxq->rx_bd_ring);
				503	struct sw_rx_data *curr_prod;
				504	dma_addr_t new_mapping;
				505
				506	curr_prod = &rxq->sw_rx_ring[rxq->sw_rx_prod & NUM_RX_BDS_MAX];
				507	curr_prod = curr_cons;
				508
				509	new_mapping = curr_prod->mapping + curr_prod->page_offset;
				510
				511	rx_bd_prod->addr.hi = cpu_to_le32(upper_32_bits(new_mapping));
				512	rx_bd_prod->addr.lo = cpu_to_le32(lower_32_bits(new_mapping));
				513
				514	rxq->sw_rx_prod++;
				515	curr_cons->data = NULL;
				516	}
				517
				518	/* In case of allocation failures reuse buffers
				519	* from consumer index to produce buffers for firmware
				520	*/
				521	void qede_recycle_rx_bd_ring(struct qede_rx_queue *rxq, u8 count)
				522	{
				523	struct sw_rx_data *curr_cons;
				524
				525	for (; count > 0; count--) {
				526	curr_cons = &rxq->sw_rx_ring[rxq->sw_rx_cons & NUM_RX_BDS_MAX];
				527	qede_reuse_page(rxq, curr_cons);
				528	qede_rx_bd_ring_consume(rxq);
				529	}
				530	}
				531
				532	static inline int qede_realloc_rx_buffer(struct qede_rx_queue *rxq,
				533	struct sw_rx_data *curr_cons)
				534	{
				535	/* Move to the next segment in the page */
				536	curr_cons->page_offset += rxq->rx_buf_seg_size;
				537
				538	if (curr_cons->page_offset == PAGE_SIZE) {
Mintz, Yuval	e3eef7e	2017-01-01 13:57:04 +0200	[diff] [blame]	539	if (unlikely(qede_alloc_rx_buffer(rxq, true))) {
Mintz, Yuval	cdda926	2017-01-01 13:57:01 +0200	[diff] [blame]	540	/* Since we failed to allocate new buffer
				541	* current buffer can be used again.
				542	*/
				543	curr_cons->page_offset -= rxq->rx_buf_seg_size;
				544
				545	return -ENOMEM;
				546	}
				547
				548	dma_unmap_page(rxq->dev, curr_cons->mapping,
				549	PAGE_SIZE, rxq->data_direction);
				550	} else {
				551	/* Increment refcount of the page as we don't want
				552	* network stack to take the ownership of the page
				553	* which can be recycled multiple times by the driver.
				554	*/
				555	page_ref_inc(curr_cons->data);
				556	qede_reuse_page(rxq, curr_cons);
				557	}
				558
				559	return 0;
				560	}
				561
				562	void qede_update_rx_prod(struct qede_dev edev, struct qede_rx_queue rxq)
				563	{
				564	u16 bd_prod = qed_chain_get_prod_idx(&rxq->rx_bd_ring);
				565	u16 cqe_prod = qed_chain_get_prod_idx(&rxq->rx_comp_ring);
				566	struct eth_rx_prod_data rx_prods = {0};
				567
				568	/* Update producers */
				569	rx_prods.bd_prod = cpu_to_le16(bd_prod);
				570	rx_prods.cqe_prod = cpu_to_le16(cqe_prod);
				571
				572	/* Make sure that the BD and SGE data is updated before updating the
				573	* producers since FW might read the BD/SGE right after the producer
				574	* is updated.
				575	*/
				576	wmb();
				577
				578	internal_ram_wr(rxq->hw_rxq_prod_addr, sizeof(rx_prods),
				579	(u32 *)&rx_prods);
				580
				581	/* mmiowb is needed to synchronize doorbell writes from more than one
				582	* processor. It guarantees that the write arrives to the device before
				583	* the napi lock is released and another qede_poll is called (possibly
				584	* on another CPU). Without this barrier, the next doorbell can bypass
				585	* this doorbell. This is applicable to IA64/Altix systems.
				586	*/
				587	mmiowb();
				588	}
				589
				590	static void qede_get_rxhash(struct sk_buff *skb, u8 bitfields, __le32 rss_hash)
				591	{
				592	enum pkt_hash_types hash_type = PKT_HASH_TYPE_NONE;
				593	enum rss_hash_type htype;
				594	u32 hash = 0;
				595
				596	htype = GET_FIELD(bitfields, ETH_FAST_PATH_RX_REG_CQE_RSS_HASH_TYPE);
				597	if (htype) {
				598	hash_type = ((htype == RSS_HASH_TYPE_IPV4) \|\|
				599	(htype == RSS_HASH_TYPE_IPV6)) ?
				600	PKT_HASH_TYPE_L3 : PKT_HASH_TYPE_L4;
				601	hash = le32_to_cpu(rss_hash);
				602	}
				603	skb_set_hash(skb, hash, hash_type);
				604	}
				605
				606	static void qede_set_skb_csum(struct sk_buff *skb, u8 csum_flag)
				607	{
				608	skb_checksum_none_assert(skb);
				609
				610	if (csum_flag & QEDE_CSUM_UNNECESSARY)
				611	skb->ip_summed = CHECKSUM_UNNECESSARY;
				612
Manish Chopra	7ca547b	2017-01-01 13:57:05 +0200	[diff] [blame]	613	if (csum_flag & QEDE_TUNN_CSUM_UNNECESSARY) {
Mintz, Yuval	cdda926	2017-01-01 13:57:01 +0200	[diff] [blame]	614	skb->csum_level = 1;
Manish Chopra	7ca547b	2017-01-01 13:57:05 +0200	[diff] [blame]	615	skb->encapsulation = 1;
				616	}
Mintz, Yuval	cdda926	2017-01-01 13:57:01 +0200	[diff] [blame]	617	}
				618
				619	static inline void qede_skb_receive(struct qede_dev *edev,
				620	struct qede_fastpath *fp,
				621	struct qede_rx_queue *rxq,
				622	struct sk_buff *skb, u16 vlan_tag)
				623	{
				624	if (vlan_tag)
				625	__vlan_hwaccel_put_tag(skb, htons(ETH_P_8021Q), vlan_tag);
				626
				627	napi_gro_receive(&fp->napi, skb);
Mintz, Yuval	cdda926	2017-01-01 13:57:01 +0200	[diff] [blame]	628	}
				629
				630	static void qede_set_gro_params(struct qede_dev *edev,
				631	struct sk_buff *skb,
				632	struct eth_fast_path_rx_tpa_start_cqe *cqe)
				633	{
				634	u16 parsing_flags = le16_to_cpu(cqe->pars_flags.flags);
				635
				636	if (((parsing_flags >> PARSING_AND_ERR_FLAGS_L3TYPE_SHIFT) &
				637	PARSING_AND_ERR_FLAGS_L3TYPE_MASK) == 2)
				638	skb_shinfo(skb)->gso_type = SKB_GSO_TCPV6;
				639	else
				640	skb_shinfo(skb)->gso_type = SKB_GSO_TCPV4;
				641
				642	skb_shinfo(skb)->gso_size = __le16_to_cpu(cqe->len_on_first_bd) -
				643	cqe->header_len;
				644	}
				645
				646	static int qede_fill_frag_skb(struct qede_dev *edev,
				647	struct qede_rx_queue *rxq,
				648	u8 tpa_agg_index, u16 len_on_bd)
				649	{
				650	struct sw_rx_data *current_bd = &rxq->sw_rx_ring[rxq->sw_rx_cons &
				651	NUM_RX_BDS_MAX];
				652	struct qede_agg_info *tpa_info = &rxq->tpa_info[tpa_agg_index];
				653	struct sk_buff *skb = tpa_info->skb;
				654
				655	if (unlikely(tpa_info->state != QEDE_AGG_STATE_START))
				656	goto out;
				657
				658	/* Add one frag and update the appropriate fields in the skb */
				659	skb_fill_page_desc(skb, tpa_info->frag_id++,
				660	current_bd->data, current_bd->page_offset,
				661	len_on_bd);
				662
				663	if (unlikely(qede_realloc_rx_buffer(rxq, current_bd))) {
				664	/* Incr page ref count to reuse on allocation failure
				665	* so that it doesn't get freed while freeing SKB.
				666	*/
				667	page_ref_inc(current_bd->data);
				668	goto out;
				669	}
				670
				671	qed_chain_consume(&rxq->rx_bd_ring);
				672	rxq->sw_rx_cons++;
				673
				674	skb->data_len += len_on_bd;
				675	skb->truesize += rxq->rx_buf_seg_size;
				676	skb->len += len_on_bd;
				677
				678	return 0;
				679
				680	out:
				681	tpa_info->state = QEDE_AGG_STATE_ERROR;
				682	qede_recycle_rx_bd_ring(rxq, 1);
				683
				684	return -ENOMEM;
				685	}
				686
				687	static bool qede_tunn_exist(u16 flag)
				688	{
				689	return !!(flag & (PARSING_AND_ERR_FLAGS_TUNNELEXIST_MASK <<
				690	PARSING_AND_ERR_FLAGS_TUNNELEXIST_SHIFT));
				691	}
				692
				693	static u8 qede_check_tunn_csum(u16 flag)
				694	{
				695	u16 csum_flag = 0;
				696	u8 tcsum = 0;
				697
				698	if (flag & (PARSING_AND_ERR_FLAGS_TUNNELL4CHKSMWASCALCULATED_MASK <<
				699	PARSING_AND_ERR_FLAGS_TUNNELL4CHKSMWASCALCULATED_SHIFT))
				700	csum_flag \|= PARSING_AND_ERR_FLAGS_TUNNELL4CHKSMERROR_MASK <<
				701	PARSING_AND_ERR_FLAGS_TUNNELL4CHKSMERROR_SHIFT;
				702
				703	if (flag & (PARSING_AND_ERR_FLAGS_L4CHKSMWASCALCULATED_MASK <<
				704	PARSING_AND_ERR_FLAGS_L4CHKSMWASCALCULATED_SHIFT)) {
				705	csum_flag \|= PARSING_AND_ERR_FLAGS_L4CHKSMERROR_MASK <<
				706	PARSING_AND_ERR_FLAGS_L4CHKSMERROR_SHIFT;
				707	tcsum = QEDE_TUNN_CSUM_UNNECESSARY;
				708	}
				709
				710	csum_flag \|= PARSING_AND_ERR_FLAGS_TUNNELIPHDRERROR_MASK <<
				711	PARSING_AND_ERR_FLAGS_TUNNELIPHDRERROR_SHIFT \|
				712	PARSING_AND_ERR_FLAGS_IPHDRERROR_MASK <<
				713	PARSING_AND_ERR_FLAGS_IPHDRERROR_SHIFT;
				714
				715	if (csum_flag & flag)
				716	return QEDE_CSUM_ERROR;
				717
				718	return QEDE_CSUM_UNNECESSARY \| tcsum;
				719	}
				720
				721	static void qede_tpa_start(struct qede_dev *edev,
				722	struct qede_rx_queue *rxq,
				723	struct eth_fast_path_rx_tpa_start_cqe *cqe)
				724	{
				725	struct qede_agg_info *tpa_info = &rxq->tpa_info[cqe->tpa_agg_index];
				726	struct eth_rx_bd *rx_bd_cons = qed_chain_consume(&rxq->rx_bd_ring);
				727	struct eth_rx_bd *rx_bd_prod = qed_chain_produce(&rxq->rx_bd_ring);
				728	struct sw_rx_data *replace_buf = &tpa_info->buffer;
				729	dma_addr_t mapping = tpa_info->buffer_mapping;
				730	struct sw_rx_data *sw_rx_data_cons;
				731	struct sw_rx_data *sw_rx_data_prod;
				732
				733	sw_rx_data_cons = &rxq->sw_rx_ring[rxq->sw_rx_cons & NUM_RX_BDS_MAX];
				734	sw_rx_data_prod = &rxq->sw_rx_ring[rxq->sw_rx_prod & NUM_RX_BDS_MAX];
				735
				736	/* Use pre-allocated replacement buffer - we can't release the agg.
				737	* start until its over and we don't want to risk allocation failing
				738	* here, so re-allocate when aggregation will be over.
				739	*/
				740	sw_rx_data_prod->mapping = replace_buf->mapping;
				741
				742	sw_rx_data_prod->data = replace_buf->data;
				743	rx_bd_prod->addr.hi = cpu_to_le32(upper_32_bits(mapping));
				744	rx_bd_prod->addr.lo = cpu_to_le32(lower_32_bits(mapping));
				745	sw_rx_data_prod->page_offset = replace_buf->page_offset;
				746
				747	rxq->sw_rx_prod++;
				748
				749	/* move partial skb from cons to pool (don't unmap yet)
				750	* save mapping, incase we drop the packet later on.
				751	*/
				752	tpa_info->buffer = *sw_rx_data_cons;
				753	mapping = HILO_U64(le32_to_cpu(rx_bd_cons->addr.hi),
				754	le32_to_cpu(rx_bd_cons->addr.lo));
				755
				756	tpa_info->buffer_mapping = mapping;
				757	rxq->sw_rx_cons++;
				758
				759	/* set tpa state to start only if we are able to allocate skb
				760	* for this aggregation, otherwise mark as error and aggregation will
				761	* be dropped
				762	*/
				763	tpa_info->skb = netdev_alloc_skb(edev->ndev,
				764	le16_to_cpu(cqe->len_on_first_bd));
				765	if (unlikely(!tpa_info->skb)) {
				766	DP_NOTICE(edev, "Failed to allocate SKB for gro\n");
				767	tpa_info->state = QEDE_AGG_STATE_ERROR;
				768	goto cons_buf;
				769	}
				770
				771	/* Start filling in the aggregation info */
				772	skb_put(tpa_info->skb, le16_to_cpu(cqe->len_on_first_bd));
				773	tpa_info->frag_id = 0;
				774	tpa_info->state = QEDE_AGG_STATE_START;
				775
				776	/* Store some information from first CQE */
				777	tpa_info->start_cqe_placement_offset = cqe->placement_offset;
				778	tpa_info->start_cqe_bd_len = le16_to_cpu(cqe->len_on_first_bd);
				779	if ((le16_to_cpu(cqe->pars_flags.flags) >>
				780	PARSING_AND_ERR_FLAGS_TAG8021QEXIST_SHIFT) &
				781	PARSING_AND_ERR_FLAGS_TAG8021QEXIST_MASK)
				782	tpa_info->vlan_tag = le16_to_cpu(cqe->vlan_tag);
				783	else
				784	tpa_info->vlan_tag = 0;
				785
				786	qede_get_rxhash(tpa_info->skb, cqe->bitfields, cqe->rss_hash);
				787
				788	/* This is needed in order to enable forwarding support */
				789	qede_set_gro_params(edev, tpa_info->skb, cqe);
				790
				791	cons_buf: /* We still need to handle bd_len_list to consume buffers */
				792	if (likely(cqe->ext_bd_len_list[0]))
				793	qede_fill_frag_skb(edev, rxq, cqe->tpa_agg_index,
				794	le16_to_cpu(cqe->ext_bd_len_list[0]));
				795
				796	if (unlikely(cqe->ext_bd_len_list[1])) {
				797	DP_ERR(edev,
				798	"Unlikely - got a TPA aggregation with more than one ext_bd_len_list entry in the TPA start\n");
				799	tpa_info->state = QEDE_AGG_STATE_ERROR;
				800	}
				801	}
				802
				803	#ifdef CONFIG_INET
				804	static void qede_gro_ip_csum(struct sk_buff *skb)
				805	{
				806	const struct iphdr *iph = ip_hdr(skb);
				807	struct tcphdr *th;
				808
				809	skb_set_transport_header(skb, sizeof(struct iphdr));
				810	th = tcp_hdr(skb);
				811
				812	th->check = ~tcp_v4_check(skb->len - skb_transport_offset(skb),
				813	iph->saddr, iph->daddr, 0);
				814
				815	tcp_gro_complete(skb);
				816	}
				817
				818	static void qede_gro_ipv6_csum(struct sk_buff *skb)
				819	{
				820	struct ipv6hdr *iph = ipv6_hdr(skb);
				821	struct tcphdr *th;
				822
				823	skb_set_transport_header(skb, sizeof(struct ipv6hdr));
				824	th = tcp_hdr(skb);
				825
				826	th->check = ~tcp_v6_check(skb->len - skb_transport_offset(skb),
				827	&iph->saddr, &iph->daddr, 0);
				828	tcp_gro_complete(skb);
				829	}
				830	#endif
				831
				832	static void qede_gro_receive(struct qede_dev *edev,
				833	struct qede_fastpath *fp,
				834	struct sk_buff *skb,
				835	u16 vlan_tag)
				836	{
				837	/* FW can send a single MTU sized packet from gro flow
				838	* due to aggregation timeout/last segment etc. which
				839	* is not expected to be a gro packet. If a skb has zero
				840	* frags then simply push it in the stack as non gso skb.
				841	*/
				842	if (unlikely(!skb->data_len)) {
				843	skb_shinfo(skb)->gso_type = 0;
				844	skb_shinfo(skb)->gso_size = 0;
				845	goto send_skb;
				846	}
				847
				848	#ifdef CONFIG_INET
				849	if (skb_shinfo(skb)->gso_size) {
				850	skb_reset_network_header(skb);
				851
				852	switch (skb->protocol) {
				853	case htons(ETH_P_IP):
				854	qede_gro_ip_csum(skb);
				855	break;
				856	case htons(ETH_P_IPV6):
				857	qede_gro_ipv6_csum(skb);
				858	break;
				859	default:
				860	DP_ERR(edev,
				861	"Error: FW GRO supports only IPv4/IPv6, not 0x%04x\n",
				862	ntohs(skb->protocol));
				863	}
				864	}
				865	#endif
				866
				867	send_skb:
				868	skb_record_rx_queue(skb, fp->rxq->rxq_id);
				869	qede_skb_receive(edev, fp, fp->rxq, skb, vlan_tag);
				870	}
				871
				872	static inline void qede_tpa_cont(struct qede_dev *edev,
				873	struct qede_rx_queue *rxq,
				874	struct eth_fast_path_rx_tpa_cont_cqe *cqe)
				875	{
				876	int i;
				877
				878	for (i = 0; cqe->len_list[i]; i++)
				879	qede_fill_frag_skb(edev, rxq, cqe->tpa_agg_index,
				880	le16_to_cpu(cqe->len_list[i]));
				881
				882	if (unlikely(i > 1))
				883	DP_ERR(edev,
				884	"Strange - TPA cont with more than a single len_list entry\n");
				885	}
				886
Mintz, Yuval	10a0176	2017-04-07 11:04:57 +0300	[diff] [blame]	887	static int qede_tpa_end(struct qede_dev *edev,
				888	struct qede_fastpath *fp,
				889	struct eth_fast_path_rx_tpa_end_cqe *cqe)
Mintz, Yuval	cdda926	2017-01-01 13:57:01 +0200	[diff] [blame]	890	{
				891	struct qede_rx_queue *rxq = fp->rxq;
				892	struct qede_agg_info *tpa_info;
				893	struct sk_buff *skb;
				894	int i;
				895
				896	tpa_info = &rxq->tpa_info[cqe->tpa_agg_index];
				897	skb = tpa_info->skb;
				898
				899	for (i = 0; cqe->len_list[i]; i++)
				900	qede_fill_frag_skb(edev, rxq, cqe->tpa_agg_index,
				901	le16_to_cpu(cqe->len_list[i]));
				902	if (unlikely(i > 1))
				903	DP_ERR(edev,
				904	"Strange - TPA emd with more than a single len_list entry\n");
				905
				906	if (unlikely(tpa_info->state != QEDE_AGG_STATE_START))
				907	goto err;
				908
				909	/* Sanity */
				910	if (unlikely(cqe->num_of_bds != tpa_info->frag_id + 1))
				911	DP_ERR(edev,
				912	"Strange - TPA had %02x BDs, but SKB has only %d frags\n",
				913	cqe->num_of_bds, tpa_info->frag_id);
				914	if (unlikely(skb->len != le16_to_cpu(cqe->total_packet_len)))
				915	DP_ERR(edev,
				916	"Strange - total packet len [cqe] is %4x but SKB has len %04x\n",
				917	le16_to_cpu(cqe->total_packet_len), skb->len);
				918
				919	memcpy(skb->data,
				920	page_address(tpa_info->buffer.data) +
				921	tpa_info->start_cqe_placement_offset +
				922	tpa_info->buffer.page_offset, tpa_info->start_cqe_bd_len);
				923
				924	/* Finalize the SKB */
				925	skb->protocol = eth_type_trans(skb, edev->ndev);
				926	skb->ip_summed = CHECKSUM_UNNECESSARY;
				927
				928	/* tcp_gro_complete() will copy NAPI_GRO_CB(skb)->count
				929	* to skb_shinfo(skb)->gso_segs
				930	*/
				931	NAPI_GRO_CB(skb)->count = le16_to_cpu(cqe->num_of_coalesced_segs);
				932
				933	qede_gro_receive(edev, fp, skb, tpa_info->vlan_tag);
				934
				935	tpa_info->state = QEDE_AGG_STATE_NONE;
				936
Mintz, Yuval	10a0176	2017-04-07 11:04:57 +0300	[diff] [blame]	937	return 1;
Mintz, Yuval	cdda926	2017-01-01 13:57:01 +0200	[diff] [blame]	938	err:
				939	tpa_info->state = QEDE_AGG_STATE_NONE;
				940	dev_kfree_skb_any(tpa_info->skb);
				941	tpa_info->skb = NULL;
Mintz, Yuval	10a0176	2017-04-07 11:04:57 +0300	[diff] [blame]	942	return 0;
Mintz, Yuval	cdda926	2017-01-01 13:57:01 +0200	[diff] [blame]	943	}
				944
				945	static u8 qede_check_notunn_csum(u16 flag)
				946	{
				947	u16 csum_flag = 0;
				948	u8 csum = 0;
				949
				950	if (flag & (PARSING_AND_ERR_FLAGS_L4CHKSMWASCALCULATED_MASK <<
				951	PARSING_AND_ERR_FLAGS_L4CHKSMWASCALCULATED_SHIFT)) {
				952	csum_flag \|= PARSING_AND_ERR_FLAGS_L4CHKSMERROR_MASK <<
				953	PARSING_AND_ERR_FLAGS_L4CHKSMERROR_SHIFT;
				954	csum = QEDE_CSUM_UNNECESSARY;
				955	}
				956
				957	csum_flag \|= PARSING_AND_ERR_FLAGS_IPHDRERROR_MASK <<
				958	PARSING_AND_ERR_FLAGS_IPHDRERROR_SHIFT;
				959
				960	if (csum_flag & flag)
				961	return QEDE_CSUM_ERROR;
				962
				963	return csum;
				964	}
				965
				966	static u8 qede_check_csum(u16 flag)
				967	{
				968	if (!qede_tunn_exist(flag))
				969	return qede_check_notunn_csum(flag);
				970	else
				971	return qede_check_tunn_csum(flag);
				972	}
				973
				974	static bool qede_pkt_is_ip_fragmented(struct eth_fast_path_rx_reg_cqe *cqe,
				975	u16 flag)
				976	{
				977	u8 tun_pars_flg = cqe->tunnel_pars_flags.flags;
				978
				979	if ((tun_pars_flg & (ETH_TUNNEL_PARSING_FLAGS_IPV4_FRAGMENT_MASK <<
				980	ETH_TUNNEL_PARSING_FLAGS_IPV4_FRAGMENT_SHIFT)) \|\|
				981	(flag & (PARSING_AND_ERR_FLAGS_IPV4FRAG_MASK <<
				982	PARSING_AND_ERR_FLAGS_IPV4FRAG_SHIFT)))
				983	return true;
				984
				985	return false;
				986	}
				987
				988	/* Return true iff packet is to be passed to stack */
				989	static bool qede_rx_xdp(struct qede_dev *edev,
				990	struct qede_fastpath *fp,
				991	struct qede_rx_queue *rxq,
				992	struct bpf_prog *prog,
				993	struct sw_rx_data *bd,
				994	struct eth_fast_path_rx_reg_cqe *cqe)
				995	{
				996	u16 len = le16_to_cpu(cqe->len_on_first_bd);
				997	struct xdp_buff xdp;
				998	enum xdp_action act;
				999
				1000	xdp.data = page_address(bd->data) + cqe->placement_offset;
				1001	xdp.data_end = xdp.data + len;
				1002
				1003	/* Queues always have a full reset currently, so for the time
				1004	* being until there's atomic program replace just mark read
				1005	* side for map helpers.
				1006	*/
				1007	rcu_read_lock();
				1008	act = bpf_prog_run_xdp(prog, &xdp);
				1009	rcu_read_unlock();
				1010
				1011	if (act == XDP_PASS)
				1012	return true;
				1013
				1014	/* Count number of packets not to be passed to stack */
				1015	rxq->xdp_no_pass++;
				1016
				1017	switch (act) {
				1018	case XDP_TX:
				1019	/* We need the replacement buffer before transmit. */
Mintz, Yuval	e3eef7e	2017-01-01 13:57:04 +0200	[diff] [blame]	1020	if (qede_alloc_rx_buffer(rxq, true)) {
Mintz, Yuval	cdda926	2017-01-01 13:57:01 +0200	[diff] [blame]	1021	qede_recycle_rx_bd_ring(rxq, 1);
Daniel Borkmann	a67edbf	2017-01-25 02:28:18 +0100	[diff] [blame]	1022	trace_xdp_exception(edev->ndev, prog, act);
Mintz, Yuval	cdda926	2017-01-01 13:57:01 +0200	[diff] [blame]	1023	return false;
				1024	}
				1025
				1026	/* Now if there's a transmission problem, we'd still have to
				1027	* throw current buffer, as replacement was already allocated.
				1028	*/
				1029	if (qede_xdp_xmit(edev, fp, bd, cqe->placement_offset, len)) {
				1030	dma_unmap_page(rxq->dev, bd->mapping,
				1031	PAGE_SIZE, DMA_BIDIRECTIONAL);
				1032	__free_page(bd->data);
Daniel Borkmann	a67edbf	2017-01-25 02:28:18 +0100	[diff] [blame]	1033	trace_xdp_exception(edev->ndev, prog, act);
Mintz, Yuval	cdda926	2017-01-01 13:57:01 +0200	[diff] [blame]	1034	}
				1035
				1036	/* Regardless, we've consumed an Rx BD */
				1037	qede_rx_bd_ring_consume(rxq);
				1038	return false;
				1039
				1040	default:
				1041	bpf_warn_invalid_xdp_action(act);
				1042	case XDP_ABORTED:
Daniel Borkmann	a67edbf	2017-01-25 02:28:18 +0100	[diff] [blame]	1043	trace_xdp_exception(edev->ndev, prog, act);
Mintz, Yuval	cdda926	2017-01-01 13:57:01 +0200	[diff] [blame]	1044	case XDP_DROP:
				1045	qede_recycle_rx_bd_ring(rxq, cqe->bd_num);
				1046	}
				1047
				1048	return false;
				1049	}
				1050
				1051	static struct sk_buff qede_rx_allocate_skb(struct qede_dev edev,
				1052	struct qede_rx_queue *rxq,
				1053	struct sw_rx_data *bd, u16 len,
				1054	u16 pad)
				1055	{
				1056	unsigned int offset = bd->page_offset;
				1057	struct skb_frag_struct *frag;
				1058	struct page *page = bd->data;
				1059	unsigned int pull_len;
				1060	struct sk_buff *skb;
				1061	unsigned char *va;
				1062
				1063	/* Allocate a new SKB with a sufficient large header len */
				1064	skb = netdev_alloc_skb(edev->ndev, QEDE_RX_HDR_SIZE);
				1065	if (unlikely(!skb))
				1066	return NULL;
				1067
				1068	/* Copy data into SKB - if it's small, we can simply copy it and
				1069	* re-use the already allcoated & mapped memory.
				1070	*/
				1071	if (len + pad <= edev->rx_copybreak) {
				1072	memcpy(skb_put(skb, len),
				1073	page_address(page) + pad + offset, len);
				1074	qede_reuse_page(rxq, bd);
				1075	goto out;
				1076	}
				1077
				1078	frag = &skb_shinfo(skb)->frags[0];
				1079
				1080	skb_add_rx_frag(skb, skb_shinfo(skb)->nr_frags,
				1081	page, pad + offset, len, rxq->rx_buf_seg_size);
				1082
				1083	va = skb_frag_address(frag);
				1084	pull_len = eth_get_headlen(va, QEDE_RX_HDR_SIZE);
				1085
				1086	/* Align the pull_len to optimize memcpy */
				1087	memcpy(skb->data, va, ALIGN(pull_len, sizeof(long)));
				1088
				1089	/* Correct the skb & frag sizes offset after the pull */
				1090	skb_frag_size_sub(frag, pull_len);
				1091	frag->page_offset += pull_len;
				1092	skb->data_len -= pull_len;
				1093	skb->tail += pull_len;
				1094
				1095	if (unlikely(qede_realloc_rx_buffer(rxq, bd))) {
				1096	/* Incr page ref count to reuse on allocation failure so
				1097	* that it doesn't get freed while freeing SKB [as its
				1098	* already mapped there].
				1099	*/
				1100	page_ref_inc(page);
				1101	dev_kfree_skb_any(skb);
				1102	return NULL;
				1103	}
				1104
				1105	out:
				1106	/* We've consumed the first BD and prepared an SKB */
				1107	qede_rx_bd_ring_consume(rxq);
				1108	return skb;
				1109	}
				1110
				1111	static int qede_rx_build_jumbo(struct qede_dev *edev,
				1112	struct qede_rx_queue *rxq,
				1113	struct sk_buff *skb,
				1114	struct eth_fast_path_rx_reg_cqe *cqe,
				1115	u16 first_bd_len)
				1116	{
				1117	u16 pkt_len = le16_to_cpu(cqe->pkt_len);
				1118	struct sw_rx_data *bd;
				1119	u16 bd_cons_idx;
				1120	u8 num_frags;
				1121
				1122	pkt_len -= first_bd_len;
				1123
				1124	/* We've already used one BD for the SKB. Now take care of the rest */
				1125	for (num_frags = cqe->bd_num - 1; num_frags > 0; num_frags--) {
				1126	u16 cur_size = pkt_len > rxq->rx_buf_size ? rxq->rx_buf_size :
				1127	pkt_len;
				1128
				1129	if (unlikely(!cur_size)) {
				1130	DP_ERR(edev,
				1131	"Still got %d BDs for mapping jumbo, but length became 0\n",
				1132	num_frags);
				1133	goto out;
				1134	}
				1135
				1136	/* We need a replacement buffer for each BD */
Mintz, Yuval	e3eef7e	2017-01-01 13:57:04 +0200	[diff] [blame]	1137	if (unlikely(qede_alloc_rx_buffer(rxq, true)))
Mintz, Yuval	cdda926	2017-01-01 13:57:01 +0200	[diff] [blame]	1138	goto out;
				1139
				1140	/* Now that we've allocated the replacement buffer,
				1141	* we can safely consume the next BD and map it to the SKB.
				1142	*/
				1143	bd_cons_idx = rxq->sw_rx_cons & NUM_RX_BDS_MAX;
				1144	bd = &rxq->sw_rx_ring[bd_cons_idx];
				1145	qede_rx_bd_ring_consume(rxq);
				1146
				1147	dma_unmap_page(rxq->dev, bd->mapping,
				1148	PAGE_SIZE, DMA_FROM_DEVICE);
				1149
				1150	skb_fill_page_desc(skb, skb_shinfo(skb)->nr_frags++,
				1151	bd->data, 0, cur_size);
				1152
				1153	skb->truesize += PAGE_SIZE;
				1154	skb->data_len += cur_size;
				1155	skb->len += cur_size;
				1156	pkt_len -= cur_size;
				1157	}
				1158
				1159	if (unlikely(pkt_len))
				1160	DP_ERR(edev,
				1161	"Mapped all BDs of jumbo, but still have %d bytes\n",
				1162	pkt_len);
				1163
				1164	out:
				1165	return num_frags;
				1166	}
				1167
				1168	static int qede_rx_process_tpa_cqe(struct qede_dev *edev,
				1169	struct qede_fastpath *fp,
				1170	struct qede_rx_queue *rxq,
				1171	union eth_rx_cqe *cqe,
				1172	enum eth_rx_cqe_type type)
				1173	{
				1174	switch (type) {
				1175	case ETH_RX_CQE_TYPE_TPA_START:
				1176	qede_tpa_start(edev, rxq, &cqe->fast_path_tpa_start);
				1177	return 0;
				1178	case ETH_RX_CQE_TYPE_TPA_CONT:
				1179	qede_tpa_cont(edev, rxq, &cqe->fast_path_tpa_cont);
				1180	return 0;
				1181	case ETH_RX_CQE_TYPE_TPA_END:
Mintz, Yuval	10a0176	2017-04-07 11:04:57 +0300	[diff] [blame]	1182	return qede_tpa_end(edev, fp, &cqe->fast_path_tpa_end);
Mintz, Yuval	cdda926	2017-01-01 13:57:01 +0200	[diff] [blame]	1183	default:
				1184	return 0;
				1185	}
				1186	}
				1187
				1188	static int qede_rx_process_cqe(struct qede_dev *edev,
				1189	struct qede_fastpath *fp,
				1190	struct qede_rx_queue *rxq)
				1191	{
				1192	struct bpf_prog *xdp_prog = READ_ONCE(rxq->xdp_prog);
				1193	struct eth_fast_path_rx_reg_cqe *fp_cqe;
				1194	u16 len, pad, bd_cons_idx, parse_flag;
				1195	enum eth_rx_cqe_type cqe_type;
				1196	union eth_rx_cqe *cqe;
				1197	struct sw_rx_data *bd;
				1198	struct sk_buff *skb;
				1199	__le16 flags;
				1200	u8 csum_flag;
				1201
				1202	/* Get the CQE from the completion ring */
				1203	cqe = (union eth_rx_cqe *)qed_chain_consume(&rxq->rx_comp_ring);
				1204	cqe_type = cqe->fast_path_regular.type;
				1205
				1206	/* Process an unlikely slowpath event */
				1207	if (unlikely(cqe_type == ETH_RX_CQE_TYPE_SLOW_PATH)) {
				1208	struct eth_slow_path_rx_cqe *sp_cqe;
				1209
				1210	sp_cqe = (struct eth_slow_path_rx_cqe *)cqe;
				1211	edev->ops->eth_cqe_completion(edev->cdev, fp->id, sp_cqe);
				1212	return 0;
				1213	}
				1214
				1215	/* Handle TPA cqes */
				1216	if (cqe_type != ETH_RX_CQE_TYPE_REGULAR)
				1217	return qede_rx_process_tpa_cqe(edev, fp, rxq, cqe, cqe_type);
				1218
				1219	/* Get the data from the SW ring; Consume it only after it's evident
				1220	* we wouldn't recycle it.
				1221	*/
				1222	bd_cons_idx = rxq->sw_rx_cons & NUM_RX_BDS_MAX;
				1223	bd = &rxq->sw_rx_ring[bd_cons_idx];
				1224
				1225	fp_cqe = &cqe->fast_path_regular;
				1226	len = le16_to_cpu(fp_cqe->len_on_first_bd);
				1227	pad = fp_cqe->placement_offset;
				1228
				1229	/* Run eBPF program if one is attached */
				1230	if (xdp_prog)
				1231	if (!qede_rx_xdp(edev, fp, rxq, xdp_prog, bd, fp_cqe))
Mintz, Yuval	10a0176	2017-04-07 11:04:57 +0300	[diff] [blame]	1232	return 0;
Mintz, Yuval	cdda926	2017-01-01 13:57:01 +0200	[diff] [blame]	1233
				1234	/* If this is an error packet then drop it */
				1235	flags = cqe->fast_path_regular.pars_flags.flags;
				1236	parse_flag = le16_to_cpu(flags);
				1237
				1238	csum_flag = qede_check_csum(parse_flag);
				1239	if (unlikely(csum_flag == QEDE_CSUM_ERROR)) {
				1240	if (qede_pkt_is_ip_fragmented(fp_cqe, parse_flag)) {
				1241	rxq->rx_ip_frags++;
				1242	} else {
				1243	DP_NOTICE(edev,
				1244	"CQE has error, flags = %x, dropping incoming packet\n",
				1245	parse_flag);
				1246	rxq->rx_hw_errors++;
				1247	qede_recycle_rx_bd_ring(rxq, fp_cqe->bd_num);
				1248	return 0;
				1249	}
				1250	}
				1251
				1252	/* Basic validation passed; Need to prepare an SKB. This would also
				1253	* guarantee to finally consume the first BD upon success.
				1254	*/
				1255	skb = qede_rx_allocate_skb(edev, rxq, bd, len, pad);
				1256	if (!skb) {
				1257	rxq->rx_alloc_errors++;
				1258	qede_recycle_rx_bd_ring(rxq, fp_cqe->bd_num);
				1259	return 0;
				1260	}
				1261
				1262	/* In case of Jumbo packet, several PAGE_SIZEd buffers will be pointed
				1263	* by a single cqe.
				1264	*/
				1265	if (fp_cqe->bd_num > 1) {
				1266	u16 unmapped_frags = qede_rx_build_jumbo(edev, rxq, skb,
				1267	fp_cqe, len);
				1268
				1269	if (unlikely(unmapped_frags > 0)) {
				1270	qede_recycle_rx_bd_ring(rxq, unmapped_frags);
				1271	dev_kfree_skb_any(skb);
				1272	return 0;
				1273	}
				1274	}
				1275
				1276	/* The SKB contains all the data. Now prepare meta-magic */
				1277	skb->protocol = eth_type_trans(skb, edev->ndev);
				1278	qede_get_rxhash(skb, fp_cqe->bitfields, fp_cqe->rss_hash);
				1279	qede_set_skb_csum(skb, csum_flag);
				1280	skb_record_rx_queue(skb, rxq->rxq_id);
Sudarsana Reddy Kalluru	4c55215	2017-02-15 10:24:11 +0200	[diff] [blame]	1281	qede_ptp_record_rx_ts(edev, cqe, skb);
Mintz, Yuval	cdda926	2017-01-01 13:57:01 +0200	[diff] [blame]	1282
				1283	/* SKB is prepared - pass it to stack */
				1284	qede_skb_receive(edev, fp, rxq, skb, le16_to_cpu(fp_cqe->vlan_tag));
				1285
				1286	return 1;
				1287	}
				1288
				1289	static int qede_rx_int(struct qede_fastpath *fp, int budget)
				1290	{
				1291	struct qede_rx_queue *rxq = fp->rxq;
				1292	struct qede_dev *edev = fp->edev;
Mintz, Yuval	10a0176	2017-04-07 11:04:57 +0300	[diff] [blame]	1293	int work_done = 0, rcv_pkts = 0;
Mintz, Yuval	cdda926	2017-01-01 13:57:01 +0200	[diff] [blame]	1294	u16 hw_comp_cons, sw_comp_cons;
Mintz, Yuval	cdda926	2017-01-01 13:57:01 +0200	[diff] [blame]	1295
				1296	hw_comp_cons = le16_to_cpu(*rxq->hw_cons_ptr);
				1297	sw_comp_cons = qed_chain_get_cons_idx(&rxq->rx_comp_ring);
				1298
				1299	/* Memory barrier to prevent the CPU from doing speculative reads of CQE
				1300	* / BD in the while-loop before reading hw_comp_cons. If the CQE is
				1301	* read before it is written by FW, then FW writes CQE and SB, and then
				1302	* the CPU reads the hw_comp_cons, it will use an old CQE.
				1303	*/
				1304	rmb();
				1305
				1306	/* Loop to complete all indicated BDs */
				1307	while ((sw_comp_cons != hw_comp_cons) && (work_done < budget)) {
Mintz, Yuval	10a0176	2017-04-07 11:04:57 +0300	[diff] [blame]	1308	rcv_pkts += qede_rx_process_cqe(edev, fp, rxq);
Mintz, Yuval	cdda926	2017-01-01 13:57:01 +0200	[diff] [blame]	1309	qed_chain_recycle_consumed(&rxq->rx_comp_ring);
				1310	sw_comp_cons = qed_chain_get_cons_idx(&rxq->rx_comp_ring);
				1311	work_done++;
				1312	}
				1313
Mintz, Yuval	10a0176	2017-04-07 11:04:57 +0300	[diff] [blame]	1314	rxq->rcv_pkts += rcv_pkts;
				1315
Mintz, Yuval	e3eef7e	2017-01-01 13:57:04 +0200	[diff] [blame]	1316	/* Allocate replacement buffers */
				1317	while (rxq->num_rx_buffers - rxq->filled_buffers)
				1318	if (qede_alloc_rx_buffer(rxq, false))
				1319	break;
				1320
Mintz, Yuval	cdda926	2017-01-01 13:57:01 +0200	[diff] [blame]	1321	/* Update producers */
				1322	qede_update_rx_prod(edev, rxq);
				1323
				1324	return work_done;
				1325	}
				1326
				1327	static bool qede_poll_is_more_work(struct qede_fastpath *fp)
				1328	{
				1329	qed_sb_update_sb_idx(fp->sb_info);
				1330
				1331	/* _has__work() reads the status block, thus we need to ensure that
				1332	* status block indices have been actually read (qed_sb_update_sb_idx)
				1333	* prior to this check (_has__work) so that we won't write the
				1334	* "newer" value of the status block to HW (if there was a DMA right
				1335	* after qede_has_rx_work and if there is no rmb, the memory reading
				1336	* (qed_sb_update_sb_idx) may be postponed to right before *_ack_sb).
				1337	* In this case there will never be another interrupt until there is
				1338	* another update of the status block, while there is still unhandled
				1339	* work.
				1340	*/
				1341	rmb();
				1342
				1343	if (likely(fp->type & QEDE_FASTPATH_RX))
				1344	if (qede_has_rx_work(fp->rxq))
				1345	return true;
				1346
				1347	if (fp->type & QEDE_FASTPATH_XDP)
				1348	if (qede_txq_has_work(fp->xdp_tx))
				1349	return true;
				1350
				1351	if (likely(fp->type & QEDE_FASTPATH_TX))
				1352	if (qede_txq_has_work(fp->txq))
				1353	return true;
				1354
				1355	return false;
				1356	}
				1357
				1358	/*********************
				1359	* NDO & API related *
				1360	*********************/
				1361	int qede_poll(struct napi_struct *napi, int budget)
				1362	{
				1363	struct qede_fastpath *fp = container_of(napi, struct qede_fastpath,
				1364	napi);
				1365	struct qede_dev *edev = fp->edev;
				1366	int rx_work_done = 0;
				1367
				1368	if (likely(fp->type & QEDE_FASTPATH_TX) && qede_txq_has_work(fp->txq))
				1369	qede_tx_int(edev, fp->txq);
				1370
				1371	if ((fp->type & QEDE_FASTPATH_XDP) && qede_txq_has_work(fp->xdp_tx))
				1372	qede_xdp_tx_int(edev, fp->xdp_tx);
				1373
				1374	rx_work_done = (likely(fp->type & QEDE_FASTPATH_RX) &&
				1375	qede_has_rx_work(fp->rxq)) ?
				1376	qede_rx_int(fp, budget) : 0;
				1377	if (rx_work_done < budget) {
				1378	if (!qede_poll_is_more_work(fp)) {
Eric Dumazet	6ad2016	2017-01-30 08:22:01 -0800	[diff] [blame]	1379	napi_complete_done(napi, rx_work_done);
Mintz, Yuval	cdda926	2017-01-01 13:57:01 +0200	[diff] [blame]	1380
				1381	/* Update and reenable interrupts */
				1382	qed_sb_ack(fp->sb_info, IGU_INT_ENABLE, 1);
				1383	} else {
				1384	rx_work_done = budget;
				1385	}
				1386	}
				1387
				1388	if (fp->xdp_xmit) {
				1389	u16 xdp_prod = qed_chain_get_prod_idx(&fp->xdp_tx->tx_pbl);
				1390
				1391	fp->xdp_xmit = 0;
				1392	fp->xdp_tx->tx_db.data.bd_prod = cpu_to_le16(xdp_prod);
				1393	qede_update_tx_producer(fp->xdp_tx);
				1394	}
				1395
				1396	return rx_work_done;
				1397	}
				1398
				1399	irqreturn_t qede_msix_fp_int(int irq, void *fp_cookie)
				1400	{
				1401	struct qede_fastpath *fp = fp_cookie;
				1402
				1403	qed_sb_ack(fp->sb_info, IGU_INT_DISABLE, 0 /do not update/);
				1404
				1405	napi_schedule_irqoff(&fp->napi);
				1406	return IRQ_HANDLED;
				1407	}
				1408
				1409	/* Main transmit function */
				1410	netdev_tx_t qede_start_xmit(struct sk_buff skb, struct net_device ndev)
				1411	{
				1412	struct qede_dev *edev = netdev_priv(ndev);
				1413	struct netdev_queue *netdev_txq;
				1414	struct qede_tx_queue *txq;
				1415	struct eth_tx_1st_bd *first_bd;
				1416	struct eth_tx_2nd_bd *second_bd = NULL;
				1417	struct eth_tx_3rd_bd *third_bd = NULL;
				1418	struct eth_tx_bd *tx_data_bd = NULL;
				1419	u16 txq_index;
				1420	u8 nbd = 0;
				1421	dma_addr_t mapping;
				1422	int rc, frag_idx = 0, ipv6_ext = 0;
				1423	u8 xmit_type;
				1424	u16 idx;
				1425	u16 hlen;
				1426	bool data_split = false;
				1427
				1428	/* Get tx-queue context and netdev index */
				1429	txq_index = skb_get_queue_mapping(skb);
				1430	WARN_ON(txq_index >= QEDE_TSS_COUNT(edev));
				1431	txq = edev->fp_array[edev->fp_num_rx + txq_index].txq;
				1432	netdev_txq = netdev_get_tx_queue(ndev, txq_index);
				1433
				1434	WARN_ON(qed_chain_get_elem_left(&txq->tx_pbl) < (MAX_SKB_FRAGS + 1));
				1435
				1436	xmit_type = qede_xmit_type(skb, &ipv6_ext);
				1437
				1438	#if ((MAX_SKB_FRAGS + 2) > ETH_TX_MAX_BDS_PER_NON_LSO_PACKET)
				1439	if (qede_pkt_req_lin(skb, xmit_type)) {
				1440	if (skb_linearize(skb)) {
				1441	DP_NOTICE(edev,
				1442	"SKB linearization failed - silently dropping this SKB\n");
				1443	dev_kfree_skb_any(skb);
				1444	return NETDEV_TX_OK;
				1445	}
				1446	}
				1447	#endif
				1448
				1449	/* Fill the entry in the SW ring and the BDs in the FW ring */
				1450	idx = txq->sw_tx_prod & NUM_TX_BDS_MAX;
				1451	txq->sw_tx_ring.skbs[idx].skb = skb;
				1452	first_bd = (struct eth_tx_1st_bd *)
				1453	qed_chain_produce(&txq->tx_pbl);
				1454	memset(first_bd, 0, sizeof(*first_bd));
				1455	first_bd->data.bd_flags.bitfields =
				1456	1 << ETH_TX_1ST_BD_FLAGS_START_BD_SHIFT;
				1457
Sudarsana Reddy Kalluru	4c55215	2017-02-15 10:24:11 +0200	[diff] [blame]	1458	if (unlikely(skb_shinfo(skb)->tx_flags & SKBTX_HW_TSTAMP))
				1459	qede_ptp_tx_ts(edev, skb);
				1460
Mintz, Yuval	cdda926	2017-01-01 13:57:01 +0200	[diff] [blame]	1461	/* Map skb linear data for DMA and set in the first BD */
				1462	mapping = dma_map_single(txq->dev, skb->data,
				1463	skb_headlen(skb), DMA_TO_DEVICE);
				1464	if (unlikely(dma_mapping_error(txq->dev, mapping))) {
				1465	DP_NOTICE(edev, "SKB mapping failed\n");
				1466	qede_free_failed_tx_pkt(txq, first_bd, 0, false);
				1467	qede_update_tx_producer(txq);
				1468	return NETDEV_TX_OK;
				1469	}
				1470	nbd++;
				1471	BD_SET_UNMAP_ADDR_LEN(first_bd, mapping, skb_headlen(skb));
				1472
				1473	/* In case there is IPv6 with extension headers or LSO we need 2nd and
				1474	* 3rd BDs.
				1475	*/
				1476	if (unlikely((xmit_type & XMIT_LSO) \| ipv6_ext)) {
				1477	second_bd = (struct eth_tx_2nd_bd *)
				1478	qed_chain_produce(&txq->tx_pbl);
				1479	memset(second_bd, 0, sizeof(*second_bd));
				1480
				1481	nbd++;
				1482	third_bd = (struct eth_tx_3rd_bd *)
				1483	qed_chain_produce(&txq->tx_pbl);
				1484	memset(third_bd, 0, sizeof(*third_bd));
				1485
				1486	nbd++;
				1487	/* We need to fill in additional data in second_bd... */
				1488	tx_data_bd = (struct eth_tx_bd *)second_bd;
				1489	}
				1490
				1491	if (skb_vlan_tag_present(skb)) {
				1492	first_bd->data.vlan = cpu_to_le16(skb_vlan_tag_get(skb));
				1493	first_bd->data.bd_flags.bitfields \|=
				1494	1 << ETH_TX_1ST_BD_FLAGS_VLAN_INSERTION_SHIFT;
				1495	}
				1496
				1497	/* Fill the parsing flags & params according to the requested offload */
				1498	if (xmit_type & XMIT_L4_CSUM) {
				1499	/* We don't re-calculate IP checksum as it is already done by
				1500	* the upper stack
				1501	*/
				1502	first_bd->data.bd_flags.bitfields \|=
				1503	1 << ETH_TX_1ST_BD_FLAGS_L4_CSUM_SHIFT;
				1504
				1505	if (xmit_type & XMIT_ENC) {
				1506	first_bd->data.bd_flags.bitfields \|=
				1507	1 << ETH_TX_1ST_BD_FLAGS_IP_CSUM_SHIFT;
				1508	first_bd->data.bitfields \|=
				1509	1 << ETH_TX_DATA_1ST_BD_TUNN_FLAG_SHIFT;
				1510	}
				1511
				1512	/* Legacy FW had flipped behavior in regard to this bit -
				1513	* I.e., needed to set to prevent FW from touching encapsulated
				1514	* packets when it didn't need to.
				1515	*/
				1516	if (unlikely(txq->is_legacy))
				1517	first_bd->data.bitfields ^=
				1518	1 << ETH_TX_DATA_1ST_BD_TUNN_FLAG_SHIFT;
				1519
				1520	/* If the packet is IPv6 with extension header, indicate that
				1521	* to FW and pass few params, since the device cracker doesn't
				1522	* support parsing IPv6 with extension header/s.
				1523	*/
				1524	if (unlikely(ipv6_ext))
				1525	qede_set_params_for_ipv6_ext(skb, second_bd, third_bd);
				1526	}
				1527
				1528	if (xmit_type & XMIT_LSO) {
				1529	first_bd->data.bd_flags.bitfields \|=
				1530	(1 << ETH_TX_1ST_BD_FLAGS_LSO_SHIFT);
				1531	third_bd->data.lso_mss =
				1532	cpu_to_le16(skb_shinfo(skb)->gso_size);
				1533
				1534	if (unlikely(xmit_type & XMIT_ENC)) {
				1535	first_bd->data.bd_flags.bitfields \|=
				1536	1 << ETH_TX_1ST_BD_FLAGS_TUNN_IP_CSUM_SHIFT;
				1537
				1538	if (xmit_type & XMIT_ENC_GSO_L4_CSUM) {
				1539	u8 tmp = ETH_TX_1ST_BD_FLAGS_TUNN_L4_CSUM_SHIFT;
				1540
				1541	first_bd->data.bd_flags.bitfields \|= 1 << tmp;
				1542	}
				1543	hlen = qede_get_skb_hlen(skb, true);
				1544	} else {
				1545	first_bd->data.bd_flags.bitfields \|=
				1546	1 << ETH_TX_1ST_BD_FLAGS_IP_CSUM_SHIFT;
				1547	hlen = qede_get_skb_hlen(skb, false);
				1548	}
				1549
				1550	/* @@@TBD - if will not be removed need to check */
				1551	third_bd->data.bitfields \|=
				1552	cpu_to_le16(1 << ETH_TX_DATA_3RD_BD_HDR_NBD_SHIFT);
				1553
				1554	/* Make life easier for FW guys who can't deal with header and
				1555	* data on same BD. If we need to split, use the second bd...
				1556	*/
				1557	if (unlikely(skb_headlen(skb) > hlen)) {
				1558	DP_VERBOSE(edev, NETIF_MSG_TX_QUEUED,
				1559	"TSO split header size is %d (%x:%x)\n",
				1560	first_bd->nbytes, first_bd->addr.hi,
				1561	first_bd->addr.lo);
				1562
				1563	mapping = HILO_U64(le32_to_cpu(first_bd->addr.hi),
				1564	le32_to_cpu(first_bd->addr.lo)) +
				1565	hlen;
				1566
				1567	BD_SET_UNMAP_ADDR_LEN(tx_data_bd, mapping,
				1568	le16_to_cpu(first_bd->nbytes) -
				1569	hlen);
				1570
				1571	/* this marks the BD as one that has no
				1572	* individual mapping
				1573	*/
				1574	txq->sw_tx_ring.skbs[idx].flags \|= QEDE_TSO_SPLIT_BD;
				1575
				1576	first_bd->nbytes = cpu_to_le16(hlen);
				1577
				1578	tx_data_bd = (struct eth_tx_bd *)third_bd;
				1579	data_split = true;
				1580	}
				1581	} else {
				1582	first_bd->data.bitfields \|=
				1583	(skb->len & ETH_TX_DATA_1ST_BD_PKT_LEN_MASK) <<
				1584	ETH_TX_DATA_1ST_BD_PKT_LEN_SHIFT;
				1585	}
				1586
				1587	/* Handle fragmented skb */
				1588	/* special handle for frags inside 2nd and 3rd bds.. */
				1589	while (tx_data_bd && frag_idx < skb_shinfo(skb)->nr_frags) {
				1590	rc = map_frag_to_bd(txq,
				1591	&skb_shinfo(skb)->frags[frag_idx],
				1592	tx_data_bd);
				1593	if (rc) {
				1594	qede_free_failed_tx_pkt(txq, first_bd, nbd, data_split);
				1595	qede_update_tx_producer(txq);
				1596	return NETDEV_TX_OK;
				1597	}
				1598
				1599	if (tx_data_bd == (struct eth_tx_bd *)second_bd)
				1600	tx_data_bd = (struct eth_tx_bd *)third_bd;
				1601	else
				1602	tx_data_bd = NULL;
				1603
				1604	frag_idx++;
				1605	}
				1606
				1607	/* map last frags into 4th, 5th .... */
				1608	for (; frag_idx < skb_shinfo(skb)->nr_frags; frag_idx++, nbd++) {
				1609	tx_data_bd = (struct eth_tx_bd *)
				1610	qed_chain_produce(&txq->tx_pbl);
				1611
				1612	memset(tx_data_bd, 0, sizeof(*tx_data_bd));
				1613
				1614	rc = map_frag_to_bd(txq,
				1615	&skb_shinfo(skb)->frags[frag_idx],
				1616	tx_data_bd);
				1617	if (rc) {
				1618	qede_free_failed_tx_pkt(txq, first_bd, nbd, data_split);
				1619	qede_update_tx_producer(txq);
				1620	return NETDEV_TX_OK;
				1621	}
				1622	}
				1623
				1624	/* update the first BD with the actual num BDs */
				1625	first_bd->data.nbds = nbd;
				1626
				1627	netdev_tx_sent_queue(netdev_txq, skb->len);
				1628
				1629	skb_tx_timestamp(skb);
				1630
				1631	/* Advance packet producer only before sending the packet since mapping
				1632	* of pages may fail.
				1633	*/
				1634	txq->sw_tx_prod++;
				1635
				1636	/* 'next page' entries are counted in the producer value */
				1637	txq->tx_db.data.bd_prod =
				1638	cpu_to_le16(qed_chain_get_prod_idx(&txq->tx_pbl));
				1639
				1640	if (!skb->xmit_more \|\| netif_xmit_stopped(netdev_txq))
				1641	qede_update_tx_producer(txq);
				1642
				1643	if (unlikely(qed_chain_get_elem_left(&txq->tx_pbl)
				1644	< (MAX_SKB_FRAGS + 1))) {
				1645	if (skb->xmit_more)
				1646	qede_update_tx_producer(txq);
				1647
				1648	netif_tx_stop_queue(netdev_txq);
				1649	txq->stopped_cnt++;
				1650	DP_VERBOSE(edev, NETIF_MSG_TX_QUEUED,
				1651	"Stop queue was called\n");
				1652	/* paired memory barrier is in qede_tx_int(), we have to keep
				1653	* ordering of set_bit() in netif_tx_stop_queue() and read of
				1654	* fp->bd_tx_cons
				1655	*/
				1656	smp_mb();
				1657
				1658	if ((qed_chain_get_elem_left(&txq->tx_pbl) >=
				1659	(MAX_SKB_FRAGS + 1)) &&
				1660	(edev->state == QEDE_STATE_OPEN)) {
				1661	netif_tx_wake_queue(netdev_txq);
				1662	DP_VERBOSE(edev, NETIF_MSG_TX_QUEUED,
				1663	"Wake queue was called\n");
				1664	}
				1665	}
				1666
				1667	return NETDEV_TX_OK;
				1668	}
				1669
				1670	/* 8B udp header + 8B base tunnel header + 32B option length */
				1671	#define QEDE_MAX_TUN_HDR_LEN 48
				1672
				1673	netdev_features_t qede_features_check(struct sk_buff *skb,
				1674	struct net_device *dev,
				1675	netdev_features_t features)
				1676	{
				1677	if (skb->encapsulation) {
				1678	u8 l4_proto = 0;
				1679
				1680	switch (vlan_get_protocol(skb)) {
				1681	case htons(ETH_P_IP):
				1682	l4_proto = ip_hdr(skb)->protocol;
				1683	break;
				1684	case htons(ETH_P_IPV6):
				1685	l4_proto = ipv6_hdr(skb)->nexthdr;
				1686	break;
				1687	default:
				1688	return features;
				1689	}
				1690
				1691	/* Disable offloads for geneve tunnels, as HW can't parse
				1692	* the geneve header which has option length greater than 32B.
				1693	*/
				1694	if ((l4_proto == IPPROTO_UDP) &&
				1695	((skb_inner_mac_header(skb) -
				1696	skb_transport_header(skb)) > QEDE_MAX_TUN_HDR_LEN))
				1697	return features & ~(NETIF_F_CSUM_MASK \|
				1698	NETIF_F_GSO_MASK);
				1699	}
				1700
				1701	return features;
				1702	}