Diffstat (limited to 'drivers/net/ethernet/pensando/ionic/ionic_txrx.c')
-rw-r--r--	drivers/net/ethernet/pensando/ionic/ionic_txrx.c	882
1 file changed, 493 insertions, 389 deletions
diff --git a/drivers/net/ethernet/pensando/ionic/ionic_txrx.c b/drivers/net/ethernet/pensando/ionic/ionic_txrx.c
index 162a1ff1e9d2..08934888575c 100644
--- a/drivers/net/ethernet/pensando/ionic/ionic_txrx.c
+++ b/drivers/net/ethernet/pensando/ionic/ionic_txrx.c
@@ -10,14 +10,6 @@
 #include "ionic_lif.h"
 #include "ionic_txrx.h"
 
-static void ionic_rx_clean(struct ionic_queue *q,
-			   struct ionic_desc_info *desc_info,
-			   struct ionic_cq_info *cq_info,
-			   void *cb_arg);
-
-static bool ionic_rx_service(struct ionic_cq *cq, struct ionic_cq_info *cq_info);
-
-static bool ionic_tx_service(struct ionic_cq *cq, struct ionic_cq_info *cq_info);
 
 static inline void ionic_txq_post(struct ionic_queue *q, bool ring_dbell,
 				  ionic_desc_cb cb_func, void *cb_arg)
@@ -40,72 +32,149 @@ static inline struct netdev_queue *q_to_ndq(struct ionic_queue *q)
 	return netdev_get_tx_queue(q->lif->netdev, q->index);
 }
 
-static struct sk_buff *ionic_rx_skb_alloc(struct ionic_queue *q,
-					  unsigned int len, bool frags)
+static void ionic_rx_buf_reset(struct ionic_buf_info *buf_info)
+{
+	buf_info->page = NULL;
+	buf_info->page_offset = 0;
+	buf_info->dma_addr = 0;
+}
+
+static int ionic_rx_page_alloc(struct ionic_queue *q,
+			       struct ionic_buf_info *buf_info)
 {
-	struct ionic_lif *lif = q->lif;
+	struct net_device *netdev = q->lif->netdev;
 	struct ionic_rx_stats *stats;
-	struct net_device *netdev;
-	struct sk_buff *skb;
+	struct device *dev;
 
-	netdev = lif->netdev;
-	stats = &q->lif->rxqstats[q->index];
+	dev = q->dev;
+	stats = q_to_rx_stats(q);
 
-	if (frags)
-		skb = napi_get_frags(&q_to_qcq(q)->napi);
-	else
-		skb = netdev_alloc_skb_ip_align(netdev, len);
+	if (unlikely(!buf_info)) {
+		net_err_ratelimited("%s: %s invalid buf_info in alloc\n",
+				    netdev->name, q->name);
+		return -EINVAL;
+	}
 
-	if (unlikely(!skb)) {
-		net_warn_ratelimited("%s: SKB alloc failed on %s!\n",
-				     netdev->name, q->name);
+	buf_info->page = alloc_pages(IONIC_PAGE_GFP_MASK, 0);
+	if (unlikely(!buf_info->page)) {
+		net_err_ratelimited("%s: %s page alloc failed\n",
+				    netdev->name, q->name);
 		stats->alloc_err++;
-		return NULL;
+		return -ENOMEM;
 	}
+	buf_info->page_offset = 0;
 
-	return skb;
+	buf_info->dma_addr = dma_map_page(dev, buf_info->page, buf_info->page_offset,
+					  IONIC_PAGE_SIZE, DMA_FROM_DEVICE);
+	if (unlikely(dma_mapping_error(dev, buf_info->dma_addr))) {
+		__free_pages(buf_info->page, 0);
+		ionic_rx_buf_reset(buf_info);
+		net_err_ratelimited("%s: %s dma map failed\n",
+				    netdev->name, q->name);
+		stats->dma_map_err++;
+		return -EIO;
+	}
+
+	return 0;
+}
+
+static void ionic_rx_page_free(struct ionic_queue *q,
+			       struct ionic_buf_info *buf_info)
+{
+	struct net_device *netdev = q->lif->netdev;
+	struct device *dev = q->dev;
+
+	if (unlikely(!buf_info)) {
+		net_err_ratelimited("%s: %s invalid buf_info in free\n",
+				    netdev->name, q->name);
+		return;
+	}
+
+	if (!buf_info->page)
+		return;
+
+	dma_unmap_page(dev, buf_info->dma_addr, IONIC_PAGE_SIZE, DMA_FROM_DEVICE);
+	__free_pages(buf_info->page, 0);
+	ionic_rx_buf_reset(buf_info);
+}
+
+static bool ionic_rx_buf_recycle(struct ionic_queue *q,
+				 struct ionic_buf_info *buf_info, u32 used)
+{
+	u32 size;
+
+	/* don't re-use pages allocated in low-mem condition */
+	if (page_is_pfmemalloc(buf_info->page))
+		return false;
+
+	/* don't re-use buffers from non-local numa nodes */
+	if (page_to_nid(buf_info->page) != numa_mem_id())
+		return false;
+
+	size = ALIGN(used, IONIC_PAGE_SPLIT_SZ);
+	buf_info->page_offset += size;
+	if (buf_info->page_offset >= IONIC_PAGE_SIZE)
+		return false;
+
+	get_page(buf_info->page);
+
+	return true;
 }
 
 static struct sk_buff *ionic_rx_frags(struct ionic_queue *q,
 				      struct ionic_desc_info *desc_info,
-				      struct ionic_cq_info *cq_info)
+				      struct ionic_rxq_comp *comp)
 {
-	struct ionic_rxq_comp *comp = cq_info->cq_desc;
-	struct device *dev = q->lif->ionic->dev;
-	struct ionic_page_info *page_info;
+	struct net_device *netdev = q->lif->netdev;
+	struct ionic_buf_info *buf_info;
+	struct ionic_rx_stats *stats;
+	struct device *dev = q->dev;
 	struct sk_buff *skb;
 	unsigned int i;
 	u16 frag_len;
 	u16 len;
 
-	page_info = &desc_info->pages[0];
+	stats = q_to_rx_stats(q);
+
+	buf_info = &desc_info->bufs[0];
 	len = le16_to_cpu(comp->len);
 
-	prefetch(page_address(page_info->page) + NET_IP_ALIGN);
+	prefetch(buf_info->page);
 
-	skb = ionic_rx_skb_alloc(q, len, true);
-	if (unlikely(!skb))
+	skb = napi_get_frags(&q_to_qcq(q)->napi);
+	if (unlikely(!skb)) {
+		net_warn_ratelimited("%s: SKB alloc failed on %s!\n",
+				     netdev->name, q->name);
+		stats->alloc_err++;
 		return NULL;
+	}
 
 	i = comp->num_sg_elems + 1;
 	do {
-		if (unlikely(!page_info->page)) {
-			struct napi_struct *napi = &q_to_qcq(q)->napi;
-
-			napi->skb = NULL;
+		if (unlikely(!buf_info->page)) {
 			dev_kfree_skb(skb);
 			return NULL;
 		}
 
-		frag_len = min(len, (u16)PAGE_SIZE);
+		frag_len = min_t(u16, len, IONIC_PAGE_SIZE - buf_info->page_offset);
 		len -= frag_len;
 
-		dma_unmap_page(dev, dma_unmap_addr(page_info, dma_addr),
-			       PAGE_SIZE, DMA_FROM_DEVICE);
+		dma_sync_single_for_cpu(dev,
					buf_info->dma_addr + buf_info->page_offset,
+					frag_len, DMA_FROM_DEVICE);
+
 		skb_add_rx_frag(skb, skb_shinfo(skb)->nr_frags,
-				page_info->page, 0, frag_len, PAGE_SIZE);
-		page_info->page = NULL;
-		page_info++;
+				buf_info->page, buf_info->page_offset, frag_len,
+				IONIC_PAGE_SIZE);
+
+		if (!ionic_rx_buf_recycle(q, buf_info, frag_len)) {
+			dma_unmap_page(dev, buf_info->dma_addr,
+				       IONIC_PAGE_SIZE, DMA_FROM_DEVICE);
+			ionic_rx_buf_reset(buf_info);
+		}
+
+		buf_info++;
+
 		i--;
 	} while (i > 0);
 
@@ -114,30 +183,37 @@ static struct sk_buff *ionic_rx_frags(struct ionic_queue *q,
 
 static struct sk_buff *ionic_rx_copybreak(struct ionic_queue *q,
 					  struct ionic_desc_info *desc_info,
-					  struct ionic_cq_info *cq_info)
+					  struct ionic_rxq_comp *comp)
 {
-	struct ionic_rxq_comp *comp = cq_info->cq_desc;
-	struct device *dev = q->lif->ionic->dev;
-	struct ionic_page_info *page_info;
+	struct net_device *netdev = q->lif->netdev;
+	struct ionic_buf_info *buf_info;
+	struct ionic_rx_stats *stats;
+	struct device *dev = q->dev;
 	struct sk_buff *skb;
 	u16 len;
 
-	page_info = &desc_info->pages[0];
+	stats = q_to_rx_stats(q);
+
+	buf_info = &desc_info->bufs[0];
 	len = le16_to_cpu(comp->len);
 
-	skb = ionic_rx_skb_alloc(q, len, false);
-	if (unlikely(!skb))
+	skb = napi_alloc_skb(&q_to_qcq(q)->napi, len);
+	if (unlikely(!skb)) {
+		net_warn_ratelimited("%s: SKB alloc failed on %s!\n",
+				     netdev->name, q->name);
+		stats->alloc_err++;
 		return NULL;
+	}
 
-	if (unlikely(!page_info->page)) {
+	if (unlikely(!buf_info->page)) {
 		dev_kfree_skb(skb);
 		return NULL;
 	}
 
-	dma_sync_single_for_cpu(dev, dma_unmap_addr(page_info, dma_addr),
+	dma_sync_single_for_cpu(dev, buf_info->dma_addr + buf_info->page_offset,
 				len, DMA_FROM_DEVICE);
-	skb_copy_to_linear_data(skb, page_address(page_info->page), len);
-	dma_sync_single_for_device(dev, dma_unmap_addr(page_info, dma_addr),
+	skb_copy_to_linear_data(skb, page_address(buf_info->page) + buf_info->page_offset, len);
+	dma_sync_single_for_device(dev, buf_info->dma_addr + buf_info->page_offset,
 				   len, DMA_FROM_DEVICE);
 
 	skb_put(skb, len);
@@ -151,14 +227,15 @@ static void ionic_rx_clean(struct ionic_queue *q,
 			   struct ionic_cq_info *cq_info,
 			   void *cb_arg)
 {
-	struct ionic_rxq_comp *comp = cq_info->cq_desc;
+	struct net_device *netdev = q->lif->netdev;
 	struct ionic_qcq *qcq = q_to_qcq(q);
 	struct ionic_rx_stats *stats;
-	struct net_device *netdev;
+	struct ionic_rxq_comp *comp;
 	struct sk_buff *skb;
 
+	comp = cq_info->cq_desc + qcq->cq.desc_size - sizeof(*comp);
+
 	stats = q_to_rx_stats(q);
-	netdev = q->lif->netdev;
 
 	if (comp->status) {
 		stats->dropped++;
@@ -169,9 +246,9 @@ static void ionic_rx_clean(struct ionic_queue *q,
 	stats->bytes += le16_to_cpu(comp->len);
 
 	if (le16_to_cpu(comp->len) <= q->lif->rx_copybreak)
-		skb = ionic_rx_copybreak(q, desc_info, cq_info);
+		skb = ionic_rx_copybreak(q, desc_info, comp);
 	else
-		skb = ionic_rx_frags(q, desc_info, cq_info);
+		skb = ionic_rx_frags(q, desc_info, comp);
 
 	if (unlikely(!skb)) {
 		stats->dropped++;
@@ -219,17 +296,39 @@ static void ionic_rx_clean(struct ionic_queue *q,
 		stats->vlan_stripped++;
 	}
 
+	if (unlikely(q->features & IONIC_RXQ_F_HWSTAMP)) {
+		__le64 *cq_desc_hwstamp;
+		u64 hwstamp;
+
+		cq_desc_hwstamp =
+			cq_info->cq_desc +
+			qcq->cq.desc_size -
+			sizeof(struct ionic_rxq_comp) -
+			IONIC_HWSTAMP_CQ_NEGOFFSET;
+
+		hwstamp = le64_to_cpu(*cq_desc_hwstamp);
+
+		if (hwstamp != IONIC_HWSTAMP_INVALID) {
+			skb_hwtstamps(skb)->hwtstamp = ionic_lif_phc_ktime(q->lif, hwstamp);
+			stats->hwstamp_valid++;
+		} else {
+			stats->hwstamp_invalid++;
+		}
+	}
+
 	if (le16_to_cpu(comp->len) <= q->lif->rx_copybreak)
 		napi_gro_receive(&qcq->napi, skb);
 	else
 		napi_gro_frags(&qcq->napi);
 }
 
-static bool ionic_rx_service(struct ionic_cq *cq, struct ionic_cq_info *cq_info)
+bool ionic_rx_service(struct ionic_cq *cq, struct ionic_cq_info *cq_info)
 {
-	struct ionic_rxq_comp *comp = cq_info->cq_desc;
 	struct ionic_queue *q = cq->bound_q;
 	struct ionic_desc_info *desc_info;
+	struct ionic_rxq_comp *comp;
+
+	comp = cq_info->cq_desc + cq->desc_size - sizeof(*comp);
 
 	if (!color_match(comp->pkt_type_color, cq->done_color))
 		return false;
@@ -253,138 +352,75 @@ static bool ionic_rx_service(struct ionic_cq *cq, struct ionic_cq_info *cq_info)
 	return true;
 }
 
-static int ionic_rx_page_alloc(struct ionic_queue *q,
-			       struct ionic_page_info *page_info)
-{
-	struct ionic_lif *lif = q->lif;
-	struct ionic_rx_stats *stats;
-	struct net_device *netdev;
-	struct device *dev;
-
-	netdev = lif->netdev;
-	dev = lif->ionic->dev;
-	stats = q_to_rx_stats(q);
-
-	if (unlikely(!page_info)) {
-		net_err_ratelimited("%s: %s invalid page_info in alloc\n",
-				    netdev->name, q->name);
-		return -EINVAL;
-	}
-
-	page_info->page = dev_alloc_page();
-	if (unlikely(!page_info->page)) {
-		net_err_ratelimited("%s: %s page alloc failed\n",
-				    netdev->name, q->name);
-		stats->alloc_err++;
-		return -ENOMEM;
-	}
-
-	page_info->dma_addr = dma_map_page(dev, page_info->page, 0, PAGE_SIZE,
-					   DMA_FROM_DEVICE);
-	if (unlikely(dma_mapping_error(dev, page_info->dma_addr))) {
-		put_page(page_info->page);
-		page_info->dma_addr = 0;
-		page_info->page = NULL;
-		net_err_ratelimited("%s: %s dma map failed\n",
-				    netdev->name, q->name);
-		stats->dma_map_err++;
-		return -EIO;
-	}
-
-	return 0;
-}
-
-static void ionic_rx_page_free(struct ionic_queue *q,
-			       struct ionic_page_info *page_info)
-{
-	struct ionic_lif *lif = q->lif;
-	struct net_device *netdev;
-	struct device *dev;
-
-	netdev = lif->netdev;
-	dev = lif->ionic->dev;
-
-	if (unlikely(!page_info)) {
-		net_err_ratelimited("%s: %s invalid page_info in free\n",
-				    netdev->name, q->name);
-		return;
-	}
-
-	if (unlikely(!page_info->page)) {
-		net_err_ratelimited("%s: %s invalid page in free\n",
-				    netdev->name, q->name);
-		return;
-	}
-
-	dma_unmap_page(dev, page_info->dma_addr, PAGE_SIZE, DMA_FROM_DEVICE);
-
-	put_page(page_info->page);
-	page_info->dma_addr = 0;
-	page_info->page = NULL;
-}
-
 void ionic_rx_fill(struct ionic_queue *q)
 {
 	struct net_device *netdev = q->lif->netdev;
 	struct ionic_desc_info *desc_info;
-	struct ionic_page_info *page_info;
 	struct ionic_rxq_sg_desc *sg_desc;
 	struct ionic_rxq_sg_elem *sg_elem;
+	struct ionic_buf_info *buf_info;
 	struct ionic_rxq_desc *desc;
 	unsigned int remain_len;
-	unsigned int seg_len;
+	unsigned int frag_len;
 	unsigned int nfrags;
 	unsigned int i, j;
 	unsigned int len;
 
 	len = netdev->mtu + ETH_HLEN + VLAN_HLEN;
-	nfrags = round_up(len, PAGE_SIZE) / PAGE_SIZE;
 
 	for (i = ionic_q_space_avail(q); i; i--) {
+		nfrags = 0;
 		remain_len = len;
 		desc_info = &q->info[q->head_idx];
 		desc = desc_info->desc;
-		sg_desc = desc_info->sg_desc;
-		page_info = &desc_info->pages[0];
-
-		if (page_info->page) { /* recycle the buffer */
-			ionic_rxq_post(q, false, ionic_rx_clean, NULL);
-			continue;
-		}
+		buf_info = &desc_info->bufs[0];
 
-		/* fill main descriptor - pages[0] */
-		desc->opcode = (nfrags > 1) ? IONIC_RXQ_DESC_OPCODE_SG :
-					      IONIC_RXQ_DESC_OPCODE_SIMPLE;
-		desc_info->npages = nfrags;
-		if (unlikely(ionic_rx_page_alloc(q, page_info))) {
-			desc->addr = 0;
-			desc->len = 0;
-			return;
+		if (!buf_info->page) { /* alloc a new buffer? */
+			if (unlikely(ionic_rx_page_alloc(q, buf_info))) {
+				desc->addr = 0;
+				desc->len = 0;
+				return;
+			}
 		}
-		desc->addr = cpu_to_le64(page_info->dma_addr);
-		seg_len = min_t(unsigned int, PAGE_SIZE, len);
-		desc->len = cpu_to_le16(seg_len);
-		remain_len -= seg_len;
-		page_info++;
 
-		/* fill sg descriptors - pages[1..n] */
-		for (j = 0; j < nfrags - 1; j++) {
-			if (page_info->page) /* recycle the sg buffer */
-				continue;
+		/* fill main descriptor - buf[0] */
+		desc->addr = cpu_to_le64(buf_info->dma_addr + buf_info->page_offset);
+		frag_len = min_t(u16, len, IONIC_PAGE_SIZE - buf_info->page_offset);
+		desc->len = cpu_to_le16(frag_len);
+		remain_len -= frag_len;
+		buf_info++;
+		nfrags++;
 
+		/* fill sg descriptors - buf[1..n] */
+		sg_desc = desc_info->sg_desc;
+		for (j = 0; remain_len > 0 && j < q->max_sg_elems; j++) {
 			sg_elem = &sg_desc->elems[j];
-			if (unlikely(ionic_rx_page_alloc(q, page_info))) {
-				sg_elem->addr = 0;
-				sg_elem->len = 0;
-				return;
+			if (!buf_info->page) { /* alloc a new sg buffer? */
+				if (unlikely(ionic_rx_page_alloc(q, buf_info))) {
+					sg_elem->addr = 0;
+					sg_elem->len = 0;
+					return;
+				}
 			}
-			sg_elem->addr = cpu_to_le64(page_info->dma_addr);
-			seg_len = min_t(unsigned int, PAGE_SIZE, remain_len);
-			sg_elem->len = cpu_to_le16(seg_len);
-			remain_len -= seg_len;
-			page_info++;
+
+			sg_elem->addr = cpu_to_le64(buf_info->dma_addr + buf_info->page_offset);
+			frag_len = min_t(u16, remain_len, IONIC_PAGE_SIZE - buf_info->page_offset);
+			sg_elem->len = cpu_to_le16(frag_len);
+			remain_len -= frag_len;
+			buf_info++;
+			nfrags++;
 		}
 
+		/* clear end sg element as a sentinel */
+		if (j < q->max_sg_elems) {
+			sg_elem = &sg_desc->elems[j];
+			memset(sg_elem, 0, sizeof(*sg_elem));
+		}
+
+		desc->opcode = (nfrags > 1) ? IONIC_RXQ_DESC_OPCODE_SG :
+					      IONIC_RXQ_DESC_OPCODE_SIMPLE;
+		desc_info->nbufs = nfrags;
+
 		ionic_rxq_post(q, false, ionic_rx_clean, NULL);
 	}
 
@@ -395,21 +431,24 @@ void ionic_rx_fill(struct ionic_queue *q)
 void ionic_rx_empty(struct ionic_queue *q)
 {
 	struct ionic_desc_info *desc_info;
-	struct ionic_page_info *page_info;
+	struct ionic_buf_info *buf_info;
 	unsigned int i, j;
 
 	for (i = 0; i < q->num_descs; i++) {
 		desc_info = &q->info[i];
 		for (j = 0; j < IONIC_RX_MAX_SG_ELEMS + 1; j++) {
-			page_info = &desc_info->pages[j];
-			if (page_info->page)
-				ionic_rx_page_free(q, page_info);
+			buf_info = &desc_info->bufs[j];
+			if (buf_info->page)
+				ionic_rx_page_free(q, buf_info);
 		}
 
-		desc_info->npages = 0;
+		desc_info->nbufs = 0;
 		desc_info->cb = NULL;
 		desc_info->cb_arg = NULL;
 	}
+
+	q->head_idx = 0;
+	q->tail_idx = 0;
 }
 
 static void ionic_dim_update(struct ionic_qcq *qcq)
@@ -525,7 +564,7 @@ int ionic_txrx_napi(struct napi_struct *napi, int budget)
 	idev = &lif->ionic->idev;
 	txcq = &lif->txqcqs[qi]->cq;
 
-	tx_work_done = ionic_cq_service(txcq, lif->tx_budget,
+	tx_work_done = ionic_cq_service(txcq, IONIC_TX_BUDGET_DEFAULT,
 					ionic_tx_service, NULL, NULL);
 
 	rx_work_done = ionic_cq_service(rxcq, budget,
@@ -558,7 +597,7 @@ static dma_addr_t ionic_tx_map_single(struct ionic_queue *q,
 				      void *data, size_t len)
 {
 	struct ionic_tx_stats *stats = q_to_tx_stats(q);
-	struct device *dev = q->lif->ionic->dev;
+	struct device *dev = q->dev;
 	dma_addr_t dma_addr;
 
 	dma_addr = dma_map_single(dev, data, len, DMA_TO_DEVICE);
@@ -576,7 +615,7 @@ static dma_addr_t ionic_tx_map_frag(struct ionic_queue *q,
 				    size_t offset, size_t len)
 {
 	struct ionic_tx_stats *stats = q_to_tx_stats(q);
-	struct device *dev = q->lif->ionic->dev;
+	struct device *dev = q->dev;
 	dma_addr_t dma_addr;
 
 	dma_addr = skb_frag_dma_map(dev, frag, offset, len, DMA_TO_DEVICE);
@@ -588,62 +627,130 @@ static dma_addr_t ionic_tx_map_frag(struct ionic_queue *q,
 	return dma_addr;
 }
 
+static int ionic_tx_map_skb(struct ionic_queue *q, struct sk_buff *skb,
+			    struct ionic_desc_info *desc_info)
+{
+	struct ionic_buf_info *buf_info = desc_info->bufs;
+	struct ionic_tx_stats *stats = q_to_tx_stats(q);
+	struct device *dev = q->dev;
+	dma_addr_t dma_addr;
+	unsigned int nfrags;
+	skb_frag_t *frag;
+	int frag_idx;
+
+	dma_addr = ionic_tx_map_single(q, skb->data, skb_headlen(skb));
+	if (dma_mapping_error(dev, dma_addr)) {
+		stats->dma_map_err++;
+		return -EIO;
+	}
+	buf_info->dma_addr = dma_addr;
+	buf_info->len = skb_headlen(skb);
+	buf_info++;
+
+	frag = skb_shinfo(skb)->frags;
+	nfrags = skb_shinfo(skb)->nr_frags;
+	for (frag_idx = 0; frag_idx < nfrags; frag_idx++, frag++) {
+		dma_addr = ionic_tx_map_frag(q, frag, 0, skb_frag_size(frag));
+		if (dma_mapping_error(dev, dma_addr)) {
+			stats->dma_map_err++;
+			goto dma_fail;
+		}
+		buf_info->dma_addr = dma_addr;
+		buf_info->len = skb_frag_size(frag);
+		buf_info++;
+	}
+
+	desc_info->nbufs = 1 + nfrags;
+
+	return 0;
+
+dma_fail:
+	/* unwind the frag mappings and the head mapping */
+	while (frag_idx > 0) {
+		frag_idx--;
+		buf_info--;
+		dma_unmap_page(dev, buf_info->dma_addr,
+			       buf_info->len, DMA_TO_DEVICE);
+	}
+	dma_unmap_single(dev, buf_info->dma_addr, buf_info->len, DMA_TO_DEVICE);
+	return -EIO;
+}
+
 static void ionic_tx_clean(struct ionic_queue *q,
 			   struct ionic_desc_info *desc_info,
 			   struct ionic_cq_info *cq_info,
 			   void *cb_arg)
 {
-	struct ionic_txq_sg_desc *sg_desc = desc_info->sg_desc;
-	struct ionic_txq_sg_elem *elem = sg_desc->elems;
+	struct ionic_buf_info *buf_info = desc_info->bufs;
 	struct ionic_tx_stats *stats = q_to_tx_stats(q);
-	struct ionic_txq_desc *desc = desc_info->desc;
-	struct device *dev = q->lif->ionic->dev;
-	u8 opcode, flags, nsge;
-	u16 queue_index;
+	struct ionic_qcq *qcq = q_to_qcq(q);
+	struct sk_buff *skb = cb_arg;
+	struct device *dev = q->dev;
 	unsigned int i;
-	u64 addr;
+	u16 qi;
 
+	if (desc_info->nbufs) {
+		dma_unmap_single(dev, (dma_addr_t)buf_info->dma_addr,
+				 buf_info->len, DMA_TO_DEVICE);
+		buf_info++;
+		for (i = 1; i < desc_info->nbufs; i++, buf_info++)
+			dma_unmap_page(dev, (dma_addr_t)buf_info->dma_addr,
+				       buf_info->len, DMA_TO_DEVICE);
+	}
 
-	decode_txq_desc_cmd(le64_to_cpu(desc->cmd),
-			    &opcode, &flags, &nsge, &addr);
+	if (!skb)
+		return;
 
-	/* use unmap_single only if either this is not TSO,
-	 * or this is first descriptor of a TSO
-	 */
-	if (opcode != IONIC_TXQ_DESC_OPCODE_TSO ||
-	    flags & IONIC_TXQ_DESC_FLAG_TSO_SOT)
-		dma_unmap_single(dev, (dma_addr_t)addr,
-				 le16_to_cpu(desc->len), DMA_TO_DEVICE);
-	else
-		dma_unmap_page(dev, (dma_addr_t)addr,
-			       le16_to_cpu(desc->len), DMA_TO_DEVICE);
-
-	for (i = 0; i < nsge; i++, elem++)
-		dma_unmap_page(dev, (dma_addr_t)le64_to_cpu(elem->addr),
-			       le16_to_cpu(elem->len), DMA_TO_DEVICE);
-
-	if (cb_arg) {
-		struct sk_buff *skb = cb_arg;
-		u32 len = skb->len;
-
-		queue_index = skb_get_queue_mapping(skb);
-		if (unlikely(__netif_subqueue_stopped(q->lif->netdev,
-						      queue_index))) {
-			netif_wake_subqueue(q->lif->netdev, queue_index);
-			q->wake++;
+	qi = skb_get_queue_mapping(skb);
+
+	if (unlikely(q->features & IONIC_TXQ_F_HWSTAMP)) {
+		if (cq_info) {
+			struct skb_shared_hwtstamps hwts = {};
+			__le64 *cq_desc_hwstamp;
+			u64 hwstamp;
+
+			cq_desc_hwstamp =
+				cq_info->cq_desc +
+				qcq->cq.desc_size -
+				sizeof(struct ionic_txq_comp) -
+				IONIC_HWSTAMP_CQ_NEGOFFSET;
+
+			hwstamp = le64_to_cpu(*cq_desc_hwstamp);
+
+			if (hwstamp != IONIC_HWSTAMP_INVALID) {
+				hwts.hwtstamp = ionic_lif_phc_ktime(q->lif, hwstamp);
+
+				skb_shinfo(skb)->tx_flags |= SKBTX_IN_PROGRESS;
+				skb_tstamp_tx(skb, &hwts);
+
+				stats->hwstamp_valid++;
+			} else {
+				stats->hwstamp_invalid++;
+			}
 		}
-		dev_kfree_skb_any(skb);
-		stats->clean++;
-		netdev_tx_completed_queue(q_to_ndq(q), 1, len);
+
+	} else if (unlikely(__netif_subqueue_stopped(q->lif->netdev, qi))) {
+		netif_wake_subqueue(q->lif->netdev, qi);
+		q->wake++;
 	}
+
+	desc_info->bytes = skb->len;
+	stats->clean++;
+
+	dev_consume_skb_any(skb);
 }
 
-static bool ionic_tx_service(struct ionic_cq *cq, struct ionic_cq_info *cq_info)
+bool ionic_tx_service(struct ionic_cq *cq, struct ionic_cq_info *cq_info)
 {
-	struct ionic_txq_comp *comp = cq_info->cq_desc;
 	struct ionic_queue *q = cq->bound_q;
 	struct ionic_desc_info *desc_info;
+	struct ionic_txq_comp *comp;
+	int bytes = 0;
+	int pkts = 0;
 	u16 index;
 
+	comp = cq_info->cq_desc + cq->desc_size - sizeof(*comp);
+
 	if (!color_match(comp->color, cq->done_color))
 		return false;
 
@@ -652,13 +759,21 @@ static bool ionic_tx_service(struct ionic_cq *cq, struct ionic_cq_info *cq_info)
 	 */
 	do {
 		desc_info = &q->info[q->tail_idx];
+		desc_info->bytes = 0;
 		index = q->tail_idx;
 		q->tail_idx = (q->tail_idx + 1) & (q->num_descs - 1);
 		ionic_tx_clean(q, desc_info, cq_info, desc_info->cb_arg);
+		if (desc_info->cb_arg) {
+			pkts++;
+			bytes += desc_info->bytes;
+		}
 		desc_info->cb = NULL;
 		desc_info->cb_arg = NULL;
 	} while (index != le16_to_cpu(comp->comp_index));
 
+	if (pkts && bytes && !unlikely(q->features & IONIC_TXQ_F_HWSTAMP))
+		netdev_tx_completed_queue(q_to_ndq(q), pkts, bytes);
+
 	return true;
 }
 
@@ -677,15 +792,25 @@ void ionic_tx_flush(struct ionic_cq *cq)
 void ionic_tx_empty(struct ionic_queue *q)
 {
 	struct ionic_desc_info *desc_info;
+	int bytes = 0;
+	int pkts = 0;
 
 	/* walk the not completed tx entries, if any */
 	while (q->head_idx != q->tail_idx) {
 		desc_info = &q->info[q->tail_idx];
+		desc_info->bytes = 0;
 		q->tail_idx = (q->tail_idx + 1) & (q->num_descs - 1);
 		ionic_tx_clean(q, desc_info, NULL, desc_info->cb_arg);
+		if (desc_info->cb_arg) {
+			pkts++;
+			bytes += desc_info->bytes;
+		}
 		desc_info->cb = NULL;
 		desc_info->cb_arg = NULL;
 	}
+
+	if (pkts && bytes && !unlikely(q->features & IONIC_TXQ_F_HWSTAMP))
+		netdev_tx_completed_queue(q_to_ndq(q), pkts, bytes);
 }
 
 static int ionic_tx_tcp_inner_pseudo_csum(struct sk_buff *skb)
@@ -756,50 +881,34 @@ static void ionic_tx_tso_post(struct ionic_queue *q, struct ionic_txq_desc *desc
 	desc->hdr_len = cpu_to_le16(hdrlen);
 	desc->mss = cpu_to_le16(mss);
 
-	if (done) {
+	if (start) {
 		skb_tx_timestamp(skb);
-		netdev_tx_sent_queue(q_to_ndq(q), skb->len);
-		ionic_txq_post(q, !netdev_xmit_more(), ionic_tx_clean, skb);
+		if (!unlikely(q->features & IONIC_TXQ_F_HWSTAMP))
+			netdev_tx_sent_queue(q_to_ndq(q), skb->len);
+		ionic_txq_post(q, false, ionic_tx_clean, skb);
 	} else {
-		ionic_txq_post(q, false, ionic_tx_clean, NULL);
+		ionic_txq_post(q, done, NULL, NULL);
 	}
 }
 
-static struct ionic_txq_desc *ionic_tx_tso_next(struct ionic_queue *q,
-						struct ionic_txq_sg_elem **elem)
-{
-	struct ionic_txq_sg_desc *sg_desc = q->info[q->head_idx].txq_sg_desc;
-	struct ionic_txq_desc *desc = q->info[q->head_idx].txq_desc;
-
-	*elem = sg_desc->elems;
-	return desc;
-}
-
 static int ionic_tx_tso(struct ionic_queue *q, struct sk_buff *skb)
 {
 	struct ionic_tx_stats *stats = q_to_tx_stats(q);
-	struct ionic_desc_info *rewind_desc_info;
-	struct device *dev = q->lif->ionic->dev;
+	struct ionic_desc_info *desc_info;
+	struct ionic_buf_info *buf_info;
 	struct ionic_txq_sg_elem *elem;
 	struct ionic_txq_desc *desc;
-	unsigned int frag_left = 0;
-	unsigned int offset = 0;
-	u16 abort = q->head_idx;
-	unsigned int len_left;
+	unsigned int chunk_len;
+	unsigned int frag_rem;
+	unsigned int tso_rem;
+	unsigned int seg_rem;
 	dma_addr_t desc_addr;
+	dma_addr_t frag_addr;
 	unsigned int hdrlen;
-	unsigned int nfrags;
-	unsigned int seglen;
-	u64 total_bytes = 0;
-	u64 total_pkts = 0;
-	u16 rewind = abort;
-	unsigned int left;
 	unsigned int len;
 	unsigned int mss;
-	skb_frag_t *frag;
 	bool start, done;
 	bool outer_csum;
-	dma_addr_t addr;
 	bool has_vlan;
 	u16 desc_len;
 	u8 desc_nsge;
@@ -807,9 +916,14 @@ static int ionic_tx_tso(struct ionic_queue *q, struct sk_buff *skb)
 	bool encap;
 	int err;
 
+	desc_info = &q->info[q->head_idx];
+	buf_info = desc_info->bufs;
+
+	if (unlikely(ionic_tx_map_skb(q, skb, desc_info)))
+		return -EIO;
+
+	len = skb->len;
 	mss = skb_shinfo(skb)->gso_size;
-	nfrags = skb_shinfo(skb)->nr_frags;
-	len_left = skb->len - skb_headlen(skb);
 	outer_csum = (skb_shinfo(skb)->gso_type & SKB_GSO_GRE_CSUM) ||
 		     (skb_shinfo(skb)->gso_type & SKB_GSO_UDP_TUNNEL_CSUM);
 	has_vlan = !!skb_vlan_tag_present(skb);
@@ -834,125 +948,75 @@ static int ionic_tx_tso(struct ionic_queue *q, struct sk_buff *skb)
 	else
 		hdrlen = skb_transport_offset(skb) + tcp_hdrlen(skb);
 
-	seglen = hdrlen + mss;
-	left = skb_headlen(skb);
+	tso_rem = len;
+	seg_rem = min(tso_rem, hdrlen + mss);
 
-	desc = ionic_tx_tso_next(q, &elem);
-	start = true;
+	frag_addr = 0;
+	frag_rem = 0;
 
-	/* Chop skb->data up into desc segments */
+	start = true;
 
-	while (left > 0) {
-		len = min(seglen, left);
-		frag_left = seglen - len;
-		desc_addr = ionic_tx_map_single(q, skb->data + offset, len);
-		if (dma_mapping_error(dev, desc_addr))
-			goto err_out_abort;
-		desc_len = len;
+	while (tso_rem > 0) {
+		desc = NULL;
+		elem = NULL;
+		desc_addr = 0;
+		desc_len = 0;
 		desc_nsge = 0;
-		left -= len;
-		offset += len;
-		if (nfrags > 0 && frag_left > 0)
-			continue;
-		done = (nfrags == 0 && left == 0);
-		ionic_tx_tso_post(q, desc, skb,
-				  desc_addr, desc_nsge, desc_len,
-				  hdrlen, mss,
-				  outer_csum,
-				  vlan_tci, has_vlan,
-				  start, done);
-		total_pkts++;
-		total_bytes += start ? len : len + hdrlen;
-		desc = ionic_tx_tso_next(q, &elem);
-		start = false;
-		seglen = mss;
-	}
-
-	/* Chop skb frags into desc segments */
-
-	for (frag = skb_shinfo(skb)->frags; len_left; frag++) {
-		offset = 0;
-		left = skb_frag_size(frag);
-		len_left -= left;
-		nfrags--;
-		stats->frags++;
-
-		while (left > 0) {
-			if (frag_left > 0) {
-				len = min(frag_left, left);
-				frag_left -= len;
-				addr = ionic_tx_map_frag(q, frag, offset, len);
-				if (dma_mapping_error(dev, addr))
-					goto err_out_abort;
-				elem->addr = cpu_to_le64(addr);
-				elem->len = cpu_to_le16(len);
+		/* use fragments until we have enough to post a single descriptor */
+		while (seg_rem > 0) {
+			/* if the fragment is exhausted then move to the next one */
+			if (frag_rem == 0) {
+				/* grab the next fragment */
+				frag_addr = buf_info->dma_addr;
+				frag_rem = buf_info->len;
+				buf_info++;
+			}
+			chunk_len = min(frag_rem, seg_rem);
+			if (!desc) {
+				/* fill main descriptor */
+				desc = desc_info->txq_desc;
+				elem = desc_info->txq_sg_desc->elems;
+				desc_addr = frag_addr;
+				desc_len = chunk_len;
+			} else {
+				/* fill sg descriptor */
+				elem->addr = cpu_to_le64(frag_addr);
+				elem->len = cpu_to_le16(chunk_len);
 				elem++;
 				desc_nsge++;
-				left -= len;
-				offset += len;
-				if (nfrags > 0 && frag_left > 0)
-					continue;
-				done = (nfrags == 0 && left == 0);
-				ionic_tx_tso_post(q, desc, skb, desc_addr,
-						  desc_nsge, desc_len,
-						  hdrlen, mss, outer_csum,
-						  vlan_tci, has_vlan,
-						  start, done);
-				total_pkts++;
-				total_bytes += start ? len : len + hdrlen;
-				desc = ionic_tx_tso_next(q, &elem);
-				start = false;
-			} else {
-				len = min(mss, left);
-				frag_left = mss - len;
-				desc_addr = ionic_tx_map_frag(q, frag,
-							      offset, len);
-				if (dma_mapping_error(dev, desc_addr))
-					goto err_out_abort;
-				desc_len = len;
-				desc_nsge = 0;
-				left -= len;
-				offset += len;
-				if (nfrags > 0 && frag_left > 0)
-					continue;
-				done = (nfrags == 0 && left == 0);
-				ionic_tx_tso_post(q, desc, skb, desc_addr,
-						  desc_nsge, desc_len,
-						  hdrlen, mss, outer_csum,
-						  vlan_tci, has_vlan,
-						  start, done);
-				total_pkts++;
-				total_bytes += start ? len : len + hdrlen;
-				desc = ionic_tx_tso_next(q, &elem);
-				start = false;
 			}
+			frag_addr += chunk_len;
+			frag_rem -= chunk_len;
+			tso_rem -= chunk_len;
+			seg_rem -= chunk_len;
 		}
+		seg_rem = min(tso_rem, mss);
+		done = (tso_rem == 0);
+		/* post descriptor */
+		ionic_tx_tso_post(q, desc, skb,
+				  desc_addr, desc_nsge, desc_len,
+				  hdrlen, mss, outer_csum, vlan_tci, has_vlan,
+				  start, done);
+		start = false;
+		/* Buffer information is stored with the first tso descriptor */
+		desc_info = &q->info[q->head_idx];
+		desc_info->nbufs = 0;
 	}
 
-	stats->pkts += total_pkts;
-	stats->bytes += total_bytes;
+	stats->pkts += DIV_ROUND_UP(len - hdrlen, mss);
+	stats->bytes += len;
 	stats->tso++;
-	stats->tso_bytes += total_bytes;
+	stats->tso_bytes = len;
 
 	return 0;
-
-err_out_abort:
-	while (rewind != q->head_idx) {
-		rewind_desc_info = &q->info[rewind];
-		ionic_tx_clean(q, rewind_desc_info, NULL, NULL);
-		rewind = (rewind + 1) & (q->num_descs - 1);
-	}
-	q->head_idx = abort;
-
-	return -ENOMEM;
 }
 
-static int ionic_tx_calc_csum(struct ionic_queue *q, struct sk_buff *skb)
+static int ionic_tx_calc_csum(struct ionic_queue *q, struct sk_buff *skb,
+			      struct ionic_desc_info *desc_info)
 {
-	struct ionic_txq_desc *desc = q->info[q->head_idx].txq_desc;
+	struct ionic_txq_desc *desc = desc_info->txq_desc;
+	struct ionic_buf_info *buf_info = desc_info->bufs;
 	struct ionic_tx_stats *stats = q_to_tx_stats(q);
-	struct device *dev = q->lif->ionic->dev;
-	dma_addr_t dma_addr;
 	bool has_vlan;
 	u8 flags = 0;
 	bool encap;
@@ -961,23 +1025,22 @@ static int ionic_tx_calc_csum(struct ionic_queue *q, struct sk_buff *skb)
 	has_vlan = !!skb_vlan_tag_present(skb);
 	encap = skb->encapsulation;
 
-	dma_addr = ionic_tx_map_single(q, skb->data, skb_headlen(skb));
-	if (dma_mapping_error(dev, dma_addr))
-		return -ENOMEM;
-
 	flags |= has_vlan ? IONIC_TXQ_DESC_FLAG_VLAN : 0;
 	flags |= encap ? IONIC_TXQ_DESC_FLAG_ENCAP : 0;
 
 	cmd = encode_txq_desc_cmd(IONIC_TXQ_DESC_OPCODE_CSUM_PARTIAL,
-				  flags, skb_shinfo(skb)->nr_frags, dma_addr);
+				  flags, skb_shinfo(skb)->nr_frags,
+				  buf_info->dma_addr);
 	desc->cmd = cpu_to_le64(cmd);
-	desc->len = cpu_to_le16(skb_headlen(skb));
-	desc->csum_start = cpu_to_le16(skb_checksum_start_offset(skb));
-	desc->csum_offset = cpu_to_le16(skb->csum_offset);
+	desc->len = cpu_to_le16(buf_info->len);
 	if (has_vlan) {
 		desc->vlan_tci = cpu_to_le16(skb_vlan_tag_get(skb));
 		stats->vlan_inserted++;
+	} else {
+		desc->vlan_tci = 0;
 	}
+	desc->csum_start = cpu_to_le16(skb_checksum_start_offset(skb));
+	desc->csum_offset = cpu_to_le16(skb->csum_offset);
 
 	if (skb_csum_is_sctp(skb))
 		stats->crc32_csum++;
@@ -987,12 +1050,12 @@ static int ionic_tx_calc_csum(struct ionic_queue *q, struct sk_buff *skb)
 	return 0;
 }
 
-static int ionic_tx_calc_no_csum(struct ionic_queue *q, struct sk_buff *skb)
+static int ionic_tx_calc_no_csum(struct ionic_queue *q, struct sk_buff *skb,
+				 struct ionic_desc_info *desc_info)
 {
-	struct ionic_txq_desc *desc = q->info[q->head_idx].txq_desc;
+	struct ionic_txq_desc *desc = desc_info->txq_desc;
+	struct ionic_buf_info *buf_info = desc_info->bufs;
 	struct ionic_tx_stats *stats = q_to_tx_stats(q);
-	struct device *dev = q->lif->ionic->dev;
-	dma_addr_t dma_addr;
 	bool has_vlan;
 	u8 flags = 0;
 	bool encap;
@@ -1001,67 +1064,66 @@ static int ionic_tx_calc_no_csum(struct ionic_queue *q, struct sk_buff *skb)
 	has_vlan = !!skb_vlan_tag_present(skb);
 	encap = skb->encapsulation;
 
-	dma_addr = ionic_tx_map_single(q, skb->data, skb_headlen(skb));
-	if (dma_mapping_error(dev, dma_addr))
-		return -ENOMEM;
-
 	flags |= has_vlan ? IONIC_TXQ_DESC_FLAG_VLAN : 0;
 	flags |= encap ? IONIC_TXQ_DESC_FLAG_ENCAP : 0;
 
 	cmd = encode_txq_desc_cmd(IONIC_TXQ_DESC_OPCODE_CSUM_NONE,
-				  flags, skb_shinfo(skb)->nr_frags, dma_addr);
+				  flags, skb_shinfo(skb)->nr_frags,
+				  buf_info->dma_addr);
 	desc->cmd = cpu_to_le64(cmd);
-	desc->len = cpu_to_le16(skb_headlen(skb));
+	desc->len = cpu_to_le16(buf_info->len);
 	if (has_vlan) {
 		desc->vlan_tci = cpu_to_le16(skb_vlan_tag_get(skb));
 		stats->vlan_inserted++;
+	} else {
+		desc->vlan_tci = 0;
 	}
+	desc->csum_start = 0;
+	desc->csum_offset = 0;
 
 	stats->csum_none++;
 
 	return 0;
 }
 
-static int ionic_tx_skb_frags(struct ionic_queue *q, struct sk_buff *skb)
+static int ionic_tx_skb_frags(struct ionic_queue *q, struct sk_buff *skb,
+			      struct ionic_desc_info *desc_info)
 {
-	struct ionic_txq_sg_desc *sg_desc = q->info[q->head_idx].txq_sg_desc;
-	unsigned int len_left = skb->len - skb_headlen(skb);
+	struct ionic_txq_sg_desc *sg_desc = desc_info->txq_sg_desc;
+	struct ionic_buf_info *buf_info = &desc_info->bufs[1];
 	struct ionic_txq_sg_elem *elem = sg_desc->elems;
 	struct ionic_tx_stats *stats = q_to_tx_stats(q);
-	struct device *dev = q->lif->ionic->dev;
-	dma_addr_t dma_addr;
-	skb_frag_t *frag;
-	u16 len;
+	unsigned int i;
 
-	for (frag = skb_shinfo(skb)->frags; len_left; frag++, elem++) {
-		len = skb_frag_size(frag);
-		elem->len = cpu_to_le16(len);
-		dma_addr = ionic_tx_map_frag(q, frag, 0, len);
-		if (dma_mapping_error(dev, dma_addr))
-			return -ENOMEM;
-		elem->addr = cpu_to_le64(dma_addr);
-		len_left -= len;
-		stats->frags++;
+	for (i = 0; i < skb_shinfo(skb)->nr_frags; i++, buf_info++, elem++) {
+		elem->addr = cpu_to_le64(buf_info->dma_addr);
+		elem->len = cpu_to_le16(buf_info->len);
 	}
 
+	stats->frags += skb_shinfo(skb)->nr_frags;
+
 	return 0;
 }
 
 static int ionic_tx(struct ionic_queue *q, struct sk_buff *skb)
 {
+	struct ionic_desc_info *desc_info = &q->info[q->head_idx];
 	struct ionic_tx_stats *stats = q_to_tx_stats(q);
 	int err;
 
+	if (unlikely(ionic_tx_map_skb(q, skb, desc_info)))
+		return -EIO;
+
 	/* set up the initial descriptor */
 	if (skb->ip_summed == CHECKSUM_PARTIAL)
-		err = ionic_tx_calc_csum(q, skb);
+		err = ionic_tx_calc_csum(q, skb, desc_info);
 	else
-		err = ionic_tx_calc_no_csum(q, skb);
+		err = ionic_tx_calc_no_csum(q, skb, desc_info);
 	if (err)
 		return err;
 
 	/* add frags */
-	err = ionic_tx_skb_frags(q, skb);
+	err = ionic_tx_skb_frags(q, skb, desc_info);
 	if (err)
 		return err;
 
@@ -1069,7 +1131,8 @@ static int ionic_tx(struct ionic_queue *q, struct sk_buff *skb)
 	stats->pkts++;
 	stats->bytes += skb->len;
 
-	netdev_tx_sent_queue(q_to_ndq(q), skb->len);
+	if (!unlikely(q->features & IONIC_TXQ_F_HWSTAMP))
+		netdev_tx_sent_queue(q_to_ndq(q), skb->len);
 	ionic_txq_post(q, !netdev_xmit_more(), ionic_tx_clean, skb);
 
 	return 0;
@@ -1077,17 +1140,19 @@ static int ionic_tx(struct ionic_queue *q, struct sk_buff *skb)
 
 static int ionic_tx_descs_needed(struct ionic_queue *q, struct sk_buff *skb)
 {
-	int sg_elems = q->lif->qtype_info[IONIC_QTYPE_TXQ].max_sg_elems;
 	struct ionic_tx_stats *stats = q_to_tx_stats(q);
+	int ndescs;
 	int err;
 
-	/* If TSO, need roundup(skb->len/mss) descs */
+	/* Each desc is mss long max, so a descriptor for each gso_seg */
 	if (skb_is_gso(skb))
-		return (skb->len / skb_shinfo(skb)->gso_size) + 1;
+		ndescs = skb_shinfo(skb)->gso_segs;
+	else
+		ndescs = 1;
 
 	/* If non-TSO, just need 1 desc and nr_frags sg elems */
 	if (skb_shinfo(skb)->nr_frags <= q->max_sg_elems)
-		return 1;
+		return ndescs;
 
 	/* Too many frags, so linearize */
 	err = skb_linearize(skb);
@@ -1096,8 +1161,7 @@ static int ionic_tx_descs_needed(struct ionic_queue *q, struct sk_buff *skb)
 
 	stats->linearize++;
 
-	/* Need 1 desc and zero sg elems */
-	return 1;
+	return ndescs;
 }
 
 static int ionic_maybe_stop_tx(struct ionic_queue *q, int ndescs)
@@ -1120,6 +1184,42 @@ static int ionic_maybe_stop_tx(struct ionic_queue *q, int ndescs)
 	return stopped;
 }
 
+static netdev_tx_t ionic_start_hwstamp_xmit(struct sk_buff *skb,
+					    struct net_device *netdev)
+{
+	struct ionic_lif *lif = netdev_priv(netdev);
+	struct ionic_queue *q = &lif->hwstamp_txq->q;
+	int err, ndescs;
+
+	/* Does not stop/start txq, because we post to a separate tx queue
+	 * for timestamping, and if a packet can't be posted immediately to
+	 * the timestamping queue, it is dropped.
+	 */
+
+	ndescs = ionic_tx_descs_needed(q, skb);
+	if (unlikely(ndescs < 0))
+		goto err_out_drop;
+
+	if (unlikely(!ionic_q_has_space(q, ndescs)))
+		goto err_out_drop;
+
+	skb_shinfo(skb)->tx_flags |= SKBTX_HW_TSTAMP;
+	if (skb_is_gso(skb))
+		err = ionic_tx_tso(q, skb);
+	else
+		err = ionic_tx(q, skb);
+
+	if (err)
+		goto err_out_drop;
+
+	return NETDEV_TX_OK;
+
+err_out_drop:
+	q->drop++;
+	dev_kfree_skb(skb);
+	return NETDEV_TX_OK;
+}
+
 netdev_tx_t ionic_start_xmit(struct sk_buff *skb, struct net_device *netdev)
 {
 	u16 queue_index = skb_get_queue_mapping(skb);
@@ -1133,6 +1233,10 @@ netdev_tx_t ionic_start_xmit(struct sk_buff *skb, struct net_device *netdev)
 		return NETDEV_TX_OK;
 	}
 
+	if (unlikely(skb_shinfo(skb)->tx_flags & SKBTX_HW_TSTAMP))
+		if (lif->hwstamp_txq && lif->phc->ts_config_tx_mode)
+			return ionic_start_hwstamp_xmit(skb, netdev);
+
 	if (unlikely(queue_index >= lif->nxqs))
 		queue_index = 0;
 	q = &lif->txqcqs[queue_index]->q;
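The Rx side of this patch replaces one-shot full-page buffers with split pages that can be handed back to the ring. The short userspace sketch below models only the offset arithmetic of ionic_rx_buf_recycle(); the IONIC_PAGE_SIZE and IONIC_PAGE_SPLIT_SZ values are assumed for the demonstration, and the real driver additionally rejects pfmemalloc pages and pages from a remote NUMA node and takes a page reference on each recycle.

/* Illustrative sketch, not driver code: models the page-offset
 * arithmetic of ionic_rx_buf_recycle(). IONIC_PAGE_SIZE and
 * IONIC_PAGE_SPLIT_SZ are assumed values.
 */
#include <stdbool.h>
#include <stdint.h>
#include <stdio.h>

#define IONIC_PAGE_SIZE		4096u	/* assumed: one full page */
#define IONIC_PAGE_SPLIT_SZ	2048u	/* assumed: two buffers per page */
#define ALIGN_UP(x, a)		(((x) + (a) - 1) & ~((a) - 1))

/* Advance the offset past the space just used, rounded up to the split
 * size; the buffer stays reusable while the offset is inside the page.
 */
static bool recycle_rx_buf(uint32_t *page_offset, uint32_t used)
{
	*page_offset += ALIGN_UP(used, IONIC_PAGE_SPLIT_SZ);
	return *page_offset < IONIC_PAGE_SIZE;
}

int main(void)
{
	uint32_t off = 0;

	/* A 1500-byte frame consumes one 2048-byte half: still reusable. */
	printf("recycled: %d, offset now %u\n", recycle_rx_buf(&off, 1500), off);
	/* The second half is then consumed: unmap and free the page. */
	printf("recycled: %d, offset now %u\n", recycle_rx_buf(&off, 1500), off);
	return 0;
}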
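On the Tx side, the rewritten ionic_tx_tso() maps the whole skb once and then carves the premapped buffers into mss-sized segments with the tso_rem/seg_rem/frag_rem counters. The sketch below is a minimal userspace model of that inner loop; the fragment lengths, header length, and mss are made-up inputs, and only the descriptor-length/SG-element bookkeeping is reproduced.

/* Illustrative sketch, not driver code: models the segment-carving loop
 * of the rewritten ionic_tx_tso(). All input values are invented.
 */
#include <stdio.h>

#define MIN(a, b) ((a) < (b) ? (a) : (b))

int main(void)
{
	/* premapped buffer lengths: skb head followed by page fragments */
	unsigned int frags[] = { 200, 3000, 2800 };
	unsigned int nfrags = 3, hdrlen = 54, mss = 1448;
	unsigned int tso_rem = 0, seg_rem, frag_rem = 0, chunk_len;
	unsigned int fi = 0, nsge, desc_len, seg = 0;

	for (unsigned int i = 0; i < nfrags; i++)
		tso_rem += frags[i];

	/* the first segment also carries the headers */
	seg_rem = MIN(tso_rem, hdrlen + mss);
	while (tso_rem > 0) {
		desc_len = 0;
		nsge = 0;
		/* use fragments until the segment is filled */
		while (seg_rem > 0) {
			if (frag_rem == 0)		/* next premapped buffer */
				frag_rem = frags[fi++];
			chunk_len = MIN(frag_rem, seg_rem);
			if (desc_len == 0)
				desc_len = chunk_len;	/* main descriptor */
			else
				nsge++;			/* extra SG element */
			frag_rem -= chunk_len;
			tso_rem -= chunk_len;
			seg_rem -= chunk_len;
		}
		seg_rem = MIN(tso_rem, mss);
		printf("segment %u: desc_len=%u nsge=%u\n", seg++, desc_len, nsge);
	}
	return 0;
}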
