Hi Lorenzo, On Sat, Oct 05, 2019 at 10:44:36PM +0200, Lorenzo Bianconi wrote: > Refactor mvneta_rx_swbm code introducing mvneta_swbm_rx_frame and > mvneta_swbm_add_rx_fragment routines. Rely on build_skb in order to > allocate skb since the previous patch introduced buffer recycling using > the page_pool API > > Tested-by: Ilias Apalodimas <ilias.apalodi...@linaro.org> > Signed-off-by: Ilias Apalodimas <ilias.apalodi...@linaro.org> > Signed-off-by: Jesper Dangaard Brouer <bro...@redhat.com> > Signed-off-by: Lorenzo Bianconi <lore...@kernel.org> > --- > drivers/net/ethernet/marvell/mvneta.c | 198 ++++++++++++++------------ > 1 file changed, 104 insertions(+), 94 deletions(-) > > diff --git a/drivers/net/ethernet/marvell/mvneta.c > b/drivers/net/ethernet/marvell/mvneta.c > index 8beae0e1eda7..d775fcae9353 100644 > --- a/drivers/net/ethernet/marvell/mvneta.c > +++ b/drivers/net/ethernet/marvell/mvneta.c > @@ -323,6 +323,11 @@ > ETH_HLEN + ETH_FCS_LEN, \ > cache_line_size()) > > +#define MVNETA_SKB_PAD (SKB_DATA_ALIGN(sizeof(struct skb_shared_info) > + \ > + NET_SKB_PAD)) > +#define MVNETA_SKB_SIZE(len) (SKB_DATA_ALIGN(len) + MVNETA_SKB_PAD) > +#define MVNETA_MAX_RX_BUF_SIZE (PAGE_SIZE - MVNETA_SKB_PAD) > + > #define IS_TSO_HEADER(txq, addr) \ > ((addr >= txq->tso_hdrs_phys) && \ > (addr < txq->tso_hdrs_phys + txq->size * TSO_HEADER_SIZE)) > @@ -646,7 +651,6 @@ static int txq_number = 8; > static int rxq_def; > > static int rx_copybreak __read_mostly = 256; > -static int rx_header_size __read_mostly = 128; > > /* HW BM need that each port be identify by a unique ID */ > static int global_port_id; > @@ -1941,30 +1945,102 @@ int mvneta_rx_refill_queue(struct mvneta_port *pp, > struct mvneta_rx_queue *rxq) > return i; > } > > +static int > +mvneta_swbm_rx_frame(struct mvneta_port *pp, > + struct mvneta_rx_desc *rx_desc, > + struct mvneta_rx_queue *rxq, > + struct page *page) > +{ > + unsigned char *data = page_address(page); > + int data_len = -MVNETA_MH_SIZE, len; > + 
struct net_device *dev = pp->dev; > + enum dma_data_direction dma_dir; > + > + if (MVNETA_SKB_SIZE(rx_desc->data_size) > PAGE_SIZE) { > + len = MVNETA_MAX_RX_BUF_SIZE; > + data_len += len; > + } else { > + len = rx_desc->data_size; > + data_len += len - ETH_FCS_LEN; > + } > + > + dma_dir = page_pool_get_dma_dir(rxq->page_pool); > + dma_sync_single_range_for_cpu(dev->dev.parent, > + rx_desc->buf_phys_addr, 0, > + len, dma_dir); > + > + rxq->skb = build_skb(data, PAGE_SIZE); > + if (unlikely(!rxq->skb)) { > + netdev_err(dev, > + "Can't allocate skb on queue %d\n", > + rxq->id); > + dev->stats.rx_dropped++; > + rxq->skb_alloc_err++; > + return -ENOMEM; > + } > + page_pool_release_page(rxq->page_pool, page); > + > + skb_reserve(rxq->skb, MVNETA_MH_SIZE + NET_SKB_PAD); > + skb_put(rxq->skb, data_len); > + mvneta_rx_csum(pp, rx_desc->status, rxq->skb); > + > + rxq->left_size = rx_desc->data_size - len; > + rx_desc->buf_phys_addr = 0; > + > + return 0; > +} > + > +static void > +mvneta_swbm_add_rx_fragment(struct mvneta_port *pp, > + struct mvneta_rx_desc *rx_desc, > + struct mvneta_rx_queue *rxq, > + struct page *page) > +{ > + struct net_device *dev = pp->dev; > + enum dma_data_direction dma_dir; > + int data_len, len; > + > + if (rxq->left_size > MVNETA_MAX_RX_BUF_SIZE) { > + len = MVNETA_MAX_RX_BUF_SIZE; > + data_len = len; > + } else { > + len = rxq->left_size; > + data_len = len - ETH_FCS_LEN; > + } > + dma_dir = page_pool_get_dma_dir(rxq->page_pool); > + dma_sync_single_range_for_cpu(dev->dev.parent, > + rx_desc->buf_phys_addr, 0, > + len, dma_dir); > + if (data_len > 0) { > + /* refill descriptor with new buffer later */ > + skb_add_rx_frag(rxq->skb, > + skb_shinfo(rxq->skb)->nr_frags, > + page, NET_SKB_PAD, data_len, > + PAGE_SIZE); > + > + page_pool_release_page(rxq->page_pool, page); > + rx_desc->buf_phys_addr = 0; > + } > + rxq->left_size -= len; > +} > + > /* Main rx processing when using software buffer management */ > static int mvneta_rx_swbm(struct 
napi_struct *napi, > struct mvneta_port *pp, int budget, > struct mvneta_rx_queue *rxq) > { > - struct net_device *dev = pp->dev; > - int rx_todo, rx_proc; > - int refill = 0; > - u32 rcvd_pkts = 0; > - u32 rcvd_bytes = 0; > + int rcvd_pkts = 0, rcvd_bytes = 0; > + int rx_pending, refill, done = 0; > > /* Get number of received packets */ > - rx_todo = mvneta_rxq_busy_desc_num_get(pp, rxq); > - rx_proc = 0; > + rx_pending = mvneta_rxq_busy_desc_num_get(pp, rxq); > > /* Fairness NAPI loop */ > - while ((rcvd_pkts < budget) && (rx_proc < rx_todo)) { > + while (done < budget && done < rx_pending) { > struct mvneta_rx_desc *rx_desc = mvneta_rxq_next_desc_get(rxq); > unsigned char *data; > struct page *page; > - dma_addr_t phys_addr; > - u32 rx_status, index; > - int rx_bytes, skb_size, copy_size; > - int frag_num, frag_size, frag_offset; > + int index; > > index = rx_desc - rxq->descs; > page = (struct page *)rxq->buf_virt_addr[index]; > @@ -1972,98 +2048,33 @@ static int mvneta_rx_swbm(struct napi_struct *napi, > /* Prefetch header */ > prefetch(data); > > - phys_addr = rx_desc->buf_phys_addr; > - rx_status = rx_desc->status; > - rx_proc++; > rxq->refill_num++; > + done++; > + > + if (rx_desc->status & MVNETA_RXD_FIRST_DESC) { > + int err; > > - if (rx_status & MVNETA_RXD_FIRST_DESC) { > /* Check errors only for FIRST descriptor */ > - if (rx_status & MVNETA_RXD_ERR_SUMMARY) { > + if (rx_desc->status & MVNETA_RXD_ERR_SUMMARY) { > mvneta_rx_error(pp, rx_desc); > - dev->stats.rx_errors++; > + pp->dev->stats.rx_errors++; > /* leave the descriptor untouched */ > continue; > } > - rx_bytes = rx_desc->data_size - > - (ETH_FCS_LEN + MVNETA_MH_SIZE); > > - /* Allocate small skb for each new packet */ > - skb_size = max(rx_copybreak, rx_header_size); > - rxq->skb = netdev_alloc_skb_ip_align(dev, skb_size); > - if (unlikely(!rxq->skb)) { > - netdev_err(dev, > - "Can't allocate skb on queue %d\n", > - rxq->id); > - dev->stats.rx_dropped++; > - rxq->skb_alloc_err++; > + err = 
mvneta_swbm_rx_frame(pp, rx_desc, rxq, page); > + if (err) > continue;
The error is practically a build_skb failure, probably due to low memory. I think it's better to break out of the loop and let the system reclaim some of its memory instead of continuing to process (and allocate more skbs). > - } > - copy_size = min(skb_size, rx_bytes); > - > - /* Copy data from buffer to SKB, skip Marvell header */ > - memcpy(rxq->skb->data, data + MVNETA_MH_SIZE, > - copy_size); > - skb_put(rxq->skb, copy_size); > - rxq->left_size = rx_bytes - copy_size; > - > - mvneta_rx_csum(pp, rx_status, rxq->skb); > - if (rxq->left_size == 0) { > - int size = copy_size + MVNETA_MH_SIZE; > - > - dma_sync_single_range_for_cpu(dev->dev.parent, > - phys_addr, 0, > - size, > - DMA_FROM_DEVICE); > - > - /* leave the descriptor and buffer untouched */ > - } else { > - /* refill descriptor with new buffer later */ > - rx_desc->buf_phys_addr = 0; > - > - frag_num = 0; > - frag_offset = copy_size + MVNETA_MH_SIZE; > - frag_size = min(rxq->left_size, > - (int)(PAGE_SIZE - frag_offset)); > - skb_add_rx_frag(rxq->skb, frag_num, page, > - frag_offset, frag_size, > - PAGE_SIZE); > - page_pool_release_page(rxq->page_pool, page); > - rxq->left_size -= frag_size; > - } > } else { > - /* Middle or Last descriptor */ > if (unlikely(!rxq->skb)) { > pr_debug("no skb for rx_status 0x%x\n", > - rx_status); > + rx_desc->status); > continue; > } > - if (!rxq->left_size) { > - /* last descriptor has only FCS */ > - /* and can be discarded */ > - dma_sync_single_range_for_cpu(dev->dev.parent, > - phys_addr, 0, > - ETH_FCS_LEN, > - DMA_FROM_DEVICE); > - /* leave the descriptor and buffer untouched */ > - } else { > - /* refill descriptor with new buffer later */ > - rx_desc->buf_phys_addr = 0; > - > - frag_num = skb_shinfo(rxq->skb)->nr_frags; > - frag_offset = 0; > - frag_size = min(rxq->left_size, > - (int)(PAGE_SIZE - frag_offset)); > - skb_add_rx_frag(rxq->skb, frag_num, page, > - frag_offset, frag_size, > - PAGE_SIZE); > - > - page_pool_release_page(rxq->page_pool, page); > - 
rxq->left_size -= frag_size; > - } > + mvneta_swbm_add_rx_fragment(pp, rx_desc, rxq, page); > } /* Middle or Last descriptor */ > > - if (!(rx_status & MVNETA_RXD_LAST_DESC)) > + if (!(rx_desc->status & MVNETA_RXD_LAST_DESC)) > /* no last descriptor this time */ > continue; > > @@ -2079,13 +2090,12 @@ static int mvneta_rx_swbm(struct napi_struct *napi, > rcvd_bytes += rxq->skb->len; > > /* Linux processing */ > - rxq->skb->protocol = eth_type_trans(rxq->skb, dev); > + rxq->skb->protocol = eth_type_trans(rxq->skb, pp->dev); > > napi_gro_receive(napi, rxq->skb); > > /* clean uncomplete skb pointer in queue */ > rxq->skb = NULL; > - rxq->left_size = 0; > } > > mvneta_update_stats(pp, rcvd_pkts, rcvd_bytes, false); > @@ -2094,7 +2104,7 @@ static int mvneta_rx_swbm(struct napi_struct *napi, > refill = mvneta_rx_refill_queue(pp, rxq); > > /* Update rxq management counters */ > - mvneta_rxq_desc_num_update(pp, rxq, rx_proc, refill); > + mvneta_rxq_desc_num_update(pp, rxq, done, refill); > > return rcvd_pkts; > } > @@ -2945,7 +2955,7 @@ static void mvneta_rxq_hw_init(struct mvneta_port *pp, > /* Set Offset */ > mvneta_rxq_offset_set(pp, rxq, 0); > mvneta_rxq_buf_size_set(pp, rxq, PAGE_SIZE < SZ_64K ? > - PAGE_SIZE : > + MVNETA_MAX_RX_BUF_SIZE : > MVNETA_RX_BUF_SIZE(pp->pkt_size)); > mvneta_rxq_bm_disable(pp, rxq); > mvneta_rxq_fill(pp, rxq, rxq->size); > @@ -4655,7 +4665,7 @@ static int mvneta_probe(struct platform_device *pdev) > SET_NETDEV_DEV(dev, &pdev->dev); > > pp->id = global_port_id++; > - pp->rx_offset_correction = 0; /* not relevant for SW BM */ > + pp->rx_offset_correction = NET_SKB_PAD; > > /* Obtain access to BM resources if enabled and already initialized */ > bm_node = of_parse_phandle(dn, "buffer-manager", 0); > -- > 2.21.0 > Regards /Ilias