Message ID | d616c727e8890c43f3e2c93bfd62b396292a7378.1617885385.git.lorenzo@kernel.org |
---|---|
State | New |
Headers | show |
Series | mvneta: introduce XDP multi-buffer support | expand |
> On Thu, Apr 08, 2021 at 02:50:56PM +0200, Lorenzo Bianconi wrote: > > Take into account if the received xdp_buff/xdp_frame is non-linear > > recycling/returning the frame memory to the allocator or into > > xdp_frame_bulk. > > Introduce xdp_return_num_frags_from_buff to return a given number of > > fragments from a xdp multi-buff starting from the tail. > > > > Signed-off-by: Lorenzo Bianconi <lorenzo@kernel.org> > > --- > > include/net/xdp.h | 19 ++++++++++-- > > net/core/xdp.c | 76 ++++++++++++++++++++++++++++++++++++++++++++++- > > 2 files changed, 92 insertions(+), 3 deletions(-) > > > > diff --git a/include/net/xdp.h b/include/net/xdp.h > > index 02aea7696d15..c8eb7cf4ebed 100644 > > --- a/include/net/xdp.h > > +++ b/include/net/xdp.h > > @@ -289,6 +289,7 @@ void xdp_return_buff(struct xdp_buff *xdp); > > void xdp_flush_frame_bulk(struct xdp_frame_bulk *bq); > > void xdp_return_frame_bulk(struct xdp_frame *xdpf, > > struct xdp_frame_bulk *bq); > > +void xdp_return_num_frags_from_buff(struct xdp_buff *xdp, u16 num_frags); > > > > /* When sending xdp_frame into the network stack, then there is no > > * return point callback, which is needed to release e.g. 
DMA-mapping > > @@ -299,10 +300,24 @@ void __xdp_release_frame(void *data, struct xdp_mem_info *mem); > > static inline void xdp_release_frame(struct xdp_frame *xdpf) > > { > > struct xdp_mem_info *mem = &xdpf->mem; > > + struct xdp_shared_info *xdp_sinfo; > > + int i; > > > > /* Curr only page_pool needs this */ > > - if (mem->type == MEM_TYPE_PAGE_POOL) > > - __xdp_release_frame(xdpf->data, mem); > > + if (mem->type != MEM_TYPE_PAGE_POOL) > > + return; > > + > > + if (likely(!xdpf->mb)) > > + goto out; > > + > > + xdp_sinfo = xdp_get_shared_info_from_frame(xdpf); > > + for (i = 0; i < xdp_sinfo->nr_frags; i++) { > > + struct page *page = xdp_get_frag_page(&xdp_sinfo->frags[i]); > > + > > + __xdp_release_frame(page_address(page), mem); > > + } > > +out: > > + __xdp_release_frame(xdpf->data, mem); > > } > > > > int xdp_rxq_info_reg(struct xdp_rxq_info *xdp_rxq, > > diff --git a/net/core/xdp.c b/net/core/xdp.c > > index 05354976c1fc..430f516259d9 100644 > > --- a/net/core/xdp.c > > +++ b/net/core/xdp.c > > @@ -374,12 +374,38 @@ static void __xdp_return(void *data, struct xdp_mem_info *mem, bool napi_direct, > > > > void xdp_return_frame(struct xdp_frame *xdpf) > > { > > + struct xdp_shared_info *xdp_sinfo; > > + int i; > > + > > + if (likely(!xdpf->mb)) > > + goto out; > > + > > + xdp_sinfo = xdp_get_shared_info_from_frame(xdpf); > > + for (i = 0; i < xdp_sinfo->nr_frags; i++) { > > + struct page *page = xdp_get_frag_page(&xdp_sinfo->frags[i]); > > + > > + __xdp_return(page_address(page), &xdpf->mem, false, NULL); > > + } > > +out: > > __xdp_return(xdpf->data, &xdpf->mem, false, NULL); > > } > > EXPORT_SYMBOL_GPL(xdp_return_frame); > > > > void xdp_return_frame_rx_napi(struct xdp_frame *xdpf) > > { > > + struct xdp_shared_info *xdp_sinfo; > > + int i; > > + > > + if (likely(!xdpf->mb)) > > + goto out; > > + > > + xdp_sinfo = xdp_get_shared_info_from_frame(xdpf); > > + for (i = 0; i < xdp_sinfo->nr_frags; i++) { > > + struct page *page = 
xdp_get_frag_page(&xdp_sinfo->frags[i]); > > + > > + __xdp_return(page_address(page), &xdpf->mem, true, NULL); > > + } > > +out: > > __xdp_return(xdpf->data, &xdpf->mem, true, NULL); > > } > > EXPORT_SYMBOL_GPL(xdp_return_frame_rx_napi); > > @@ -415,7 +441,7 @@ void xdp_return_frame_bulk(struct xdp_frame *xdpf, > > struct xdp_mem_allocator *xa; > > > > if (mem->type != MEM_TYPE_PAGE_POOL) { > > - __xdp_return(xdpf->data, &xdpf->mem, false, NULL); > > + xdp_return_frame(xdpf); > > return; > > } > > > > @@ -434,15 +460,63 @@ void xdp_return_frame_bulk(struct xdp_frame *xdpf, > > bq->xa = rhashtable_lookup(mem_id_ht, &mem->id, mem_id_rht_params); > > } > > > > + if (unlikely(xdpf->mb)) { > > + struct xdp_shared_info *xdp_sinfo; > > + int i; > > + > > + xdp_sinfo = xdp_get_shared_info_from_frame(xdpf); > > + for (i = 0; i < xdp_sinfo->nr_frags; i++) { > > + skb_frag_t *frag = &xdp_sinfo->frags[i]; > > + > > + bq->q[bq->count++] = xdp_get_frag_address(frag); > > + if (bq->count == XDP_BULK_QUEUE_SIZE) > > + xdp_flush_frame_bulk(bq); > > + } > > + } > > bq->q[bq->count++] = xdpf->data; > > } > > EXPORT_SYMBOL_GPL(xdp_return_frame_bulk); > > > > void xdp_return_buff(struct xdp_buff *xdp) > > { > > + struct xdp_shared_info *xdp_sinfo; > > + int i; > > + > > + if (likely(!xdp->mb)) > > + goto out; > > + > > + xdp_sinfo = xdp_get_shared_info_from_buff(xdp); > > + for (i = 0; i < xdp_sinfo->nr_frags; i++) { > > + struct page *page = xdp_get_frag_page(&xdp_sinfo->frags[i]); > > + > > + __xdp_return(page_address(page), &xdp->rxq->mem, true, xdp); > > + } > > +out: > > __xdp_return(xdp->data, &xdp->rxq->mem, true, xdp); > > } > > > > +void xdp_return_num_frags_from_buff(struct xdp_buff *xdp, u16 num_frags) > > +{ > > + struct xdp_shared_info *xdp_sinfo; > > + int i; > > + > > + if (unlikely(!xdp->mb)) > > + return; > > + > > + xdp_sinfo = xdp_get_shared_info_from_buff(xdp); > > + num_frags = min_t(u16, num_frags, xdp_sinfo->nr_frags); > > + for (i = 1; i <= num_frags; i++) { > > 
+ skb_frag_t *frag = &xdp_sinfo->frags[xdp_sinfo->nr_frags - i]; > > + struct page *page = xdp_get_frag_page(frag); > > + > > + xdp_sinfo->data_length -= xdp_get_frag_size(frag); > > + __xdp_return(page_address(page), &xdp->rxq->mem, false, NULL); > > + } > > + xdp_sinfo->nr_frags -= num_frags; > > + xdp->mb = !!xdp_sinfo->nr_frags; > > +} > > +EXPORT_SYMBOL_GPL(xdp_return_num_frags_from_buff); > > + > > /* Only called for MEM_TYPE_PAGE_POOL see xdp.h */ > > void __xdp_release_frame(void *data, struct xdp_mem_info *mem) > > { > > None of this really benefits in any way from having the extra "mb" bit, > does it? I get the impression it would work just the same way without it. The paged part of the xdp_buff is initialized only if xdp->mb is set. The reason is to avoid hurting performance in the most common single-buffer use case. We always need to check xdp->mb or xdpf->mb before accessing the paged area. Regards, Lorenzo
diff --git a/include/net/xdp.h b/include/net/xdp.h index 02aea7696d15..c8eb7cf4ebed 100644 --- a/include/net/xdp.h +++ b/include/net/xdp.h @@ -289,6 +289,7 @@ void xdp_return_buff(struct xdp_buff *xdp); void xdp_flush_frame_bulk(struct xdp_frame_bulk *bq); void xdp_return_frame_bulk(struct xdp_frame *xdpf, struct xdp_frame_bulk *bq); +void xdp_return_num_frags_from_buff(struct xdp_buff *xdp, u16 num_frags); /* When sending xdp_frame into the network stack, then there is no * return point callback, which is needed to release e.g. DMA-mapping @@ -299,10 +300,24 @@ void __xdp_release_frame(void *data, struct xdp_mem_info *mem); static inline void xdp_release_frame(struct xdp_frame *xdpf) { struct xdp_mem_info *mem = &xdpf->mem; + struct xdp_shared_info *xdp_sinfo; + int i; /* Curr only page_pool needs this */ - if (mem->type == MEM_TYPE_PAGE_POOL) - __xdp_release_frame(xdpf->data, mem); + if (mem->type != MEM_TYPE_PAGE_POOL) + return; + + if (likely(!xdpf->mb)) + goto out; + + xdp_sinfo = xdp_get_shared_info_from_frame(xdpf); + for (i = 0; i < xdp_sinfo->nr_frags; i++) { + struct page *page = xdp_get_frag_page(&xdp_sinfo->frags[i]); + + __xdp_release_frame(page_address(page), mem); + } +out: + __xdp_release_frame(xdpf->data, mem); } int xdp_rxq_info_reg(struct xdp_rxq_info *xdp_rxq, diff --git a/net/core/xdp.c b/net/core/xdp.c index 05354976c1fc..430f516259d9 100644 --- a/net/core/xdp.c +++ b/net/core/xdp.c @@ -374,12 +374,38 @@ static void __xdp_return(void *data, struct xdp_mem_info *mem, bool napi_direct, void xdp_return_frame(struct xdp_frame *xdpf) { + struct xdp_shared_info *xdp_sinfo; + int i; + + if (likely(!xdpf->mb)) + goto out; + + xdp_sinfo = xdp_get_shared_info_from_frame(xdpf); + for (i = 0; i < xdp_sinfo->nr_frags; i++) { + struct page *page = xdp_get_frag_page(&xdp_sinfo->frags[i]); + + __xdp_return(page_address(page), &xdpf->mem, false, NULL); + } +out: __xdp_return(xdpf->data, &xdpf->mem, false, NULL); } EXPORT_SYMBOL_GPL(xdp_return_frame); void 
xdp_return_frame_rx_napi(struct xdp_frame *xdpf) { + struct xdp_shared_info *xdp_sinfo; + int i; + + if (likely(!xdpf->mb)) + goto out; + + xdp_sinfo = xdp_get_shared_info_from_frame(xdpf); + for (i = 0; i < xdp_sinfo->nr_frags; i++) { + struct page *page = xdp_get_frag_page(&xdp_sinfo->frags[i]); + + __xdp_return(page_address(page), &xdpf->mem, true, NULL); + } +out: __xdp_return(xdpf->data, &xdpf->mem, true, NULL); } EXPORT_SYMBOL_GPL(xdp_return_frame_rx_napi); @@ -415,7 +441,7 @@ void xdp_return_frame_bulk(struct xdp_frame *xdpf, struct xdp_mem_allocator *xa; if (mem->type != MEM_TYPE_PAGE_POOL) { - __xdp_return(xdpf->data, &xdpf->mem, false, NULL); + xdp_return_frame(xdpf); return; } @@ -434,15 +460,63 @@ void xdp_return_frame_bulk(struct xdp_frame *xdpf, bq->xa = rhashtable_lookup(mem_id_ht, &mem->id, mem_id_rht_params); } + if (unlikely(xdpf->mb)) { + struct xdp_shared_info *xdp_sinfo; + int i; + + xdp_sinfo = xdp_get_shared_info_from_frame(xdpf); + for (i = 0; i < xdp_sinfo->nr_frags; i++) { + skb_frag_t *frag = &xdp_sinfo->frags[i]; + + bq->q[bq->count++] = xdp_get_frag_address(frag); + if (bq->count == XDP_BULK_QUEUE_SIZE) + xdp_flush_frame_bulk(bq); + } + } bq->q[bq->count++] = xdpf->data; } EXPORT_SYMBOL_GPL(xdp_return_frame_bulk); void xdp_return_buff(struct xdp_buff *xdp) { + struct xdp_shared_info *xdp_sinfo; + int i; + + if (likely(!xdp->mb)) + goto out; + + xdp_sinfo = xdp_get_shared_info_from_buff(xdp); + for (i = 0; i < xdp_sinfo->nr_frags; i++) { + struct page *page = xdp_get_frag_page(&xdp_sinfo->frags[i]); + + __xdp_return(page_address(page), &xdp->rxq->mem, true, xdp); + } +out: __xdp_return(xdp->data, &xdp->rxq->mem, true, xdp); } +void xdp_return_num_frags_from_buff(struct xdp_buff *xdp, u16 num_frags) +{ + struct xdp_shared_info *xdp_sinfo; + int i; + + if (unlikely(!xdp->mb)) + return; + + xdp_sinfo = xdp_get_shared_info_from_buff(xdp); + num_frags = min_t(u16, num_frags, xdp_sinfo->nr_frags); + for (i = 1; i <= num_frags; i++) { + 
skb_frag_t *frag = &xdp_sinfo->frags[xdp_sinfo->nr_frags - i]; + struct page *page = xdp_get_frag_page(frag); + + xdp_sinfo->data_length -= xdp_get_frag_size(frag); + __xdp_return(page_address(page), &xdp->rxq->mem, false, NULL); + } + xdp_sinfo->nr_frags -= num_frags; + xdp->mb = !!xdp_sinfo->nr_frags; +} +EXPORT_SYMBOL_GPL(xdp_return_num_frags_from_buff); + /* Only called for MEM_TYPE_PAGE_POOL see xdp.h */ void __xdp_release_frame(void *data, struct xdp_mem_info *mem) {
Take into account whether the received xdp_buff/xdp_frame is non-linear when recycling/returning the frame memory to the allocator or into xdp_frame_bulk. Introduce xdp_return_num_frags_from_buff to return a given number of fragments from an xdp multi-buff starting from the tail. Signed-off-by: Lorenzo Bianconi <lorenzo@kernel.org> --- include/net/xdp.h | 19 ++++++++++-- net/core/xdp.c | 76 ++++++++++++++++++++++++++++++++++++++++++++++- 2 files changed, 92 insertions(+), 3 deletions(-)