Skip to content

Commit 2f5c3c7

Browse files
LorenzoBianconi authored and nbd168 committed
wifi: mt76: switch to page_pool allocator
In order to reduce possible memory allocation failures due to memory fragmentation caused by page_frag_cache allocator, switch to page_pool allocator for dma and usb mt76 drivers. Remove per rx-queue page_frag_cache.

Co-developed-by: Felix Fietkau <[email protected]>
Tested-by: Deren Wu <[email protected]>
Signed-off-by: Lorenzo Bianconi <[email protected]>
Signed-off-by: Felix Fietkau <[email protected]>
1 parent 412d19b commit 2f5c3c7

File tree

6 files changed

+139
-94
lines changed

6 files changed

+139
-94
lines changed

drivers/net/wireless/mediatek/mt76/Kconfig

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1,6 +1,7 @@
11
# SPDX-License-Identifier: GPL-2.0-only
22
config MT76_CORE
33
tristate
4+
select PAGE_POOL
45

56
config MT76_LEDS
67
bool

drivers/net/wireless/mediatek/mt76/dma.c

Lines changed: 35 additions & 37 deletions
Original file line number | Diff line number | Diff line change
@@ -173,7 +173,7 @@ mt76_free_pending_rxwi(struct mt76_dev *dev)
173173
local_bh_disable();
174174
while ((t = __mt76_get_rxwi(dev)) != NULL) {
175175
if (t->ptr)
176-
skb_free_frag(t->ptr);
176+
mt76_put_page_pool_buf(t->ptr, false);
177177
kfree(t);
178178
}
179179
local_bh_enable();
@@ -408,9 +408,9 @@ mt76_dma_get_buf(struct mt76_dev *dev, struct mt76_queue *q, int idx,
408408
if (!t)
409409
return NULL;
410410

411-
dma_unmap_single(dev->dma_dev, t->dma_addr,
412-
SKB_WITH_OVERHEAD(q->buf_size),
413-
DMA_FROM_DEVICE);
411+
dma_sync_single_for_cpu(dev->dma_dev, t->dma_addr,
412+
SKB_WITH_OVERHEAD(q->buf_size),
413+
page_pool_get_dma_dir(q->page_pool));
414414

415415
buf = t->ptr;
416416
t->dma_addr = 0;
@@ -427,9 +427,9 @@ mt76_dma_get_buf(struct mt76_dev *dev, struct mt76_queue *q, int idx,
427427
} else {
428428
buf = e->buf;
429429
e->buf = NULL;
430-
dma_unmap_single(dev->dma_dev, e->dma_addr[0],
431-
SKB_WITH_OVERHEAD(q->buf_size),
432-
DMA_FROM_DEVICE);
430+
dma_sync_single_for_cpu(dev->dma_dev, e->dma_addr[0],
431+
SKB_WITH_OVERHEAD(q->buf_size),
432+
page_pool_get_dma_dir(q->page_pool));
433433
}
434434

435435
return buf;
@@ -581,38 +581,37 @@ mt76_dma_tx_queue_skb(struct mt76_dev *dev, struct mt76_queue *q,
581581
}
582582

583583
static int
584-
mt76_dma_rx_fill(struct mt76_dev *dev, struct mt76_queue *q)
584+
mt76_dma_rx_fill(struct mt76_dev *dev, struct mt76_queue *q,
585+
bool allow_direct)
585586
{
586587
int len = SKB_WITH_OVERHEAD(q->buf_size);
587-
int frames = 0, offset = q->buf_offset;
588-
dma_addr_t addr;
588+
int frames = 0;
589589

590590
if (!q->ndesc)
591591
return 0;
592592

593593
spin_lock_bh(&q->lock);
594594

595595
while (q->queued < q->ndesc - 1) {
596+
enum dma_data_direction dir;
596597
struct mt76_queue_buf qbuf;
597-
void *buf = NULL;
598+
dma_addr_t addr;
599+
int offset;
600+
void *buf;
598601

599-
buf = page_frag_alloc(&q->rx_page, q->buf_size, GFP_ATOMIC);
602+
buf = mt76_get_page_pool_buf(q, &offset, q->buf_size);
600603
if (!buf)
601604
break;
602605

603-
addr = dma_map_single(dev->dma_dev, buf, len, DMA_FROM_DEVICE);
604-
if (unlikely(dma_mapping_error(dev->dma_dev, addr))) {
605-
skb_free_frag(buf);
606-
break;
607-
}
606+
addr = page_pool_get_dma_addr(virt_to_head_page(buf)) + offset;
607+
dir = page_pool_get_dma_dir(q->page_pool);
608+
dma_sync_single_for_device(dev->dma_dev, addr, len, dir);
608609

609-
qbuf.addr = addr + offset;
610-
qbuf.len = len - offset;
610+
qbuf.addr = addr + q->buf_offset;
611+
qbuf.len = len - q->buf_offset;
611612
qbuf.skip_unmap = false;
612613
if (mt76_dma_add_rx_buf(dev, q, &qbuf, buf) < 0) {
613-
dma_unmap_single(dev->dma_dev, addr, len,
614-
DMA_FROM_DEVICE);
615-
skb_free_frag(buf);
614+
mt76_put_page_pool_buf(buf, allow_direct);
616615
break;
617616
}
618617
frames++;
@@ -653,7 +652,7 @@ mt76_dma_wed_setup(struct mt76_dev *dev, struct mt76_queue *q)
653652
/* WED txfree queue needs ring to be initialized before setup */
654653
q->flags = 0;
655654
mt76_dma_queue_reset(dev, q);
656-
mt76_dma_rx_fill(dev, q);
655+
mt76_dma_rx_fill(dev, q, false);
657656
q->flags = flags;
658657

659658
ret = mtk_wed_device_txfree_ring_setup(wed, q->regs);
@@ -700,6 +699,10 @@ mt76_dma_alloc_queue(struct mt76_dev *dev, struct mt76_queue *q,
700699
if (!q->entry)
701700
return -ENOMEM;
702701

702+
ret = mt76_create_page_pool(dev, q);
703+
if (ret)
704+
return ret;
705+
703706
ret = mt76_dma_wed_setup(dev, q);
704707
if (ret)
705708
return ret;
@@ -713,7 +716,6 @@ mt76_dma_alloc_queue(struct mt76_dev *dev, struct mt76_queue *q,
713716
static void
714717
mt76_dma_rx_cleanup(struct mt76_dev *dev, struct mt76_queue *q)
715718
{
716-
struct page *page;
717719
void *buf;
718720
bool more;
719721

@@ -727,7 +729,7 @@ mt76_dma_rx_cleanup(struct mt76_dev *dev, struct mt76_queue *q)
727729
if (!buf)
728730
break;
729731

730-
skb_free_frag(buf);
732+
mt76_put_page_pool_buf(buf, false);
731733
} while (1);
732734

733735
if (q->rx_head) {
@@ -736,13 +738,6 @@ mt76_dma_rx_cleanup(struct mt76_dev *dev, struct mt76_queue *q)
736738
}
737739

738740
spin_unlock_bh(&q->lock);
739-
740-
if (!q->rx_page.va)
741-
return;
742-
743-
page = virt_to_page(q->rx_page.va);
744-
__page_frag_cache_drain(page, q->rx_page.pagecnt_bias);
745-
memset(&q->rx_page, 0, sizeof(q->rx_page));
746741
}
747742

748743
static void
@@ -759,7 +754,7 @@ mt76_dma_rx_reset(struct mt76_dev *dev, enum mt76_rxq_id qid)
759754

760755
mt76_dma_rx_cleanup(dev, q);
761756
mt76_dma_sync_idx(dev, q);
762-
mt76_dma_rx_fill(dev, q);
757+
mt76_dma_rx_fill(dev, q, false);
763758
}
764759

765760
static void
@@ -776,7 +771,7 @@ mt76_add_fragment(struct mt76_dev *dev, struct mt76_queue *q, void *data,
776771

777772
skb_add_rx_frag(skb, nr_frags, page, offset, len, q->buf_size);
778773
} else {
779-
skb_free_frag(data);
774+
mt76_put_page_pool_buf(data, true);
780775
}
781776

782777
if (more)
@@ -849,6 +844,7 @@ mt76_dma_rx_process(struct mt76_dev *dev, struct mt76_queue *q, int budget)
849844
goto free_frag;
850845

851846
skb_reserve(skb, q->buf_offset);
847+
skb_mark_for_recycle(skb);
852848

853849
*(u32 *)skb->cb = info;
854850

@@ -864,10 +860,10 @@ mt76_dma_rx_process(struct mt76_dev *dev, struct mt76_queue *q, int budget)
864860
continue;
865861

866862
free_frag:
867-
skb_free_frag(data);
863+
mt76_put_page_pool_buf(data, true);
868864
}
869865

870-
mt76_dma_rx_fill(dev, q);
866+
mt76_dma_rx_fill(dev, q, true);
871867
return done;
872868
}
873869

@@ -910,7 +906,7 @@ mt76_dma_init(struct mt76_dev *dev,
910906

911907
mt76_for_each_q_rx(dev, i) {
912908
netif_napi_add(&dev->napi_dev, &dev->napi[i], poll);
913-
mt76_dma_rx_fill(dev, &dev->q_rx[i]);
909+
mt76_dma_rx_fill(dev, &dev->q_rx[i], false);
914910
napi_enable(&dev->napi[i]);
915911
}
916912

@@ -961,6 +957,8 @@ void mt76_dma_cleanup(struct mt76_dev *dev)
961957

962958
netif_napi_del(&dev->napi[i]);
963959
mt76_dma_rx_cleanup(dev, q);
960+
961+
page_pool_destroy(q->page_pool);
964962
}
965963

966964
mt76_free_pending_txwi(dev);

drivers/net/wireless/mediatek/mt76/mac80211.c

Lines changed: 42 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -4,6 +4,7 @@
44
*/
55
#include <linux/sched.h>
66
#include <linux/of.h>
7+
#include <net/page_pool.h>
78
#include "mt76.h"
89

910
#define CHAN2G(_idx, _freq) { \
@@ -556,6 +557,47 @@ void mt76_unregister_phy(struct mt76_phy *phy)
556557
}
557558
EXPORT_SYMBOL_GPL(mt76_unregister_phy);
558559

560+
int mt76_create_page_pool(struct mt76_dev *dev, struct mt76_queue *q)
561+
{
562+
struct page_pool_params pp_params = {
563+
.order = 0,
564+
.flags = PP_FLAG_PAGE_FRAG,
565+
.nid = NUMA_NO_NODE,
566+
.dev = dev->dma_dev,
567+
};
568+
int idx = q - dev->q_rx;
569+
570+
switch (idx) {
571+
case MT_RXQ_MAIN:
572+
case MT_RXQ_BAND1:
573+
case MT_RXQ_BAND2:
574+
pp_params.pool_size = 256;
575+
break;
576+
default:
577+
pp_params.pool_size = 16;
578+
break;
579+
}
580+
581+
if (mt76_is_mmio(dev)) {
582+
/* rely on page_pool for DMA mapping */
583+
pp_params.flags |= PP_FLAG_DMA_MAP | PP_FLAG_DMA_SYNC_DEV;
584+
pp_params.dma_dir = DMA_FROM_DEVICE;
585+
pp_params.max_len = PAGE_SIZE;
586+
pp_params.offset = 0;
587+
}
588+
589+
q->page_pool = page_pool_create(&pp_params);
590+
if (IS_ERR(q->page_pool)) {
591+
int err = PTR_ERR(q->page_pool);
592+
593+
q->page_pool = NULL;
594+
return err;
595+
}
596+
597+
return 0;
598+
}
599+
EXPORT_SYMBOL_GPL(mt76_create_page_pool);
600+
559601
struct mt76_dev *
560602
mt76_alloc_device(struct device *pdev, unsigned int size,
561603
const struct ieee80211_ops *ops,

drivers/net/wireless/mediatek/mt76/mt76.h

Lines changed: 20 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -202,7 +202,7 @@ struct mt76_queue {
202202

203203
dma_addr_t desc_dma;
204204
struct sk_buff *rx_head;
205-
struct page_frag_cache rx_page;
205+
struct page_pool *page_pool;
206206
};
207207

208208
struct mt76_mcu_ops {
@@ -1423,6 +1423,25 @@ void __mt76_set_tx_blocked(struct mt76_dev *dev, bool blocked);
14231423
struct mt76_txwi_cache *mt76_rx_token_release(struct mt76_dev *dev, int token);
14241424
int mt76_rx_token_consume(struct mt76_dev *dev, void *ptr,
14251425
struct mt76_txwi_cache *r, dma_addr_t phys);
1426+
int mt76_create_page_pool(struct mt76_dev *dev, struct mt76_queue *q);
1427+
static inline void mt76_put_page_pool_buf(void *buf, bool allow_direct)
1428+
{
1429+
struct page *page = virt_to_head_page(buf);
1430+
1431+
page_pool_put_full_page(page->pp, page, allow_direct);
1432+
}
1433+
1434+
static inline void *
1435+
mt76_get_page_pool_buf(struct mt76_queue *q, u32 *offset, u32 size)
1436+
{
1437+
struct page *page;
1438+
1439+
page = page_pool_dev_alloc_frag(q->page_pool, offset, size);
1440+
if (!page)
1441+
return NULL;
1442+
1443+
return page_address(page) + *offset;
1444+
}
14261445

14271446
static inline void mt76_set_tx_blocked(struct mt76_dev *dev, bool blocked)
14281447
{

drivers/net/wireless/mediatek/mt76/mt7915/mmio.c

Lines changed: 21 additions & 34 deletions
Original file line number | Diff line number | Diff line change
@@ -594,23 +594,17 @@ static void mt7915_mmio_wed_offload_disable(struct mtk_wed_device *wed)
594594
static void mt7915_mmio_wed_release_rx_buf(struct mtk_wed_device *wed)
595595
{
596596
struct mt7915_dev *dev;
597-
u32 length;
598597
int i;
599598

600599
dev = container_of(wed, struct mt7915_dev, mt76.mmio.wed);
601-
length = SKB_DATA_ALIGN(NET_SKB_PAD + wed->wlan.rx_size +
602-
sizeof(struct skb_shared_info));
603-
604600
for (i = 0; i < dev->mt76.rx_token_size; i++) {
605601
struct mt76_txwi_cache *t;
606602

607603
t = mt76_rx_token_release(&dev->mt76, i);
608604
if (!t || !t->ptr)
609605
continue;
610606

611-
dma_unmap_single(dev->mt76.dma_dev, t->dma_addr,
612-
wed->wlan.rx_size, DMA_FROM_DEVICE);
613-
__free_pages(virt_to_page(t->ptr), get_order(length));
607+
mt76_put_page_pool_buf(t->ptr, false);
614608
t->ptr = NULL;
615609

616610
mt76_put_rxwi(&dev->mt76, t);
@@ -620,47 +614,38 @@ static void mt7915_mmio_wed_release_rx_buf(struct mtk_wed_device *wed)
620614
static u32 mt7915_mmio_wed_init_rx_buf(struct mtk_wed_device *wed, int size)
621615
{
622616
struct mtk_rxbm_desc *desc = wed->rx_buf_ring.desc;
617+
struct mt76_txwi_cache *t = NULL;
623618
struct mt7915_dev *dev;
624-
u32 length;
625-
int i;
619+
struct mt76_queue *q;
620+
int i, len;
626621

627622
dev = container_of(wed, struct mt7915_dev, mt76.mmio.wed);
628-
length = SKB_DATA_ALIGN(NET_SKB_PAD + wed->wlan.rx_size +
629-
sizeof(struct skb_shared_info));
623+
q = &dev->mt76.q_rx[MT_RXQ_MAIN];
624+
len = SKB_WITH_OVERHEAD(q->buf_size);
630625

631626
for (i = 0; i < size; i++) {
632-
struct mt76_txwi_cache *t = mt76_get_rxwi(&dev->mt76);
633-
dma_addr_t phy_addr;
634-
struct page *page;
627+
enum dma_data_direction dir;
628+
dma_addr_t addr;
629+
u32 offset;
635630
int token;
636-
void *ptr;
631+
void *buf;
637632

633+
t = mt76_get_rxwi(&dev->mt76);
638634
if (!t)
639635
goto unmap;
640636

641-
page = __dev_alloc_pages(GFP_KERNEL, get_order(length));
642-
if (!page) {
643-
mt76_put_rxwi(&dev->mt76, t);
637+
buf = mt76_get_page_pool_buf(q, &offset, q->buf_size);
638+
if (!buf)
644639
goto unmap;
645-
}
646640

647-
ptr = page_address(page);
648-
phy_addr = dma_map_single(dev->mt76.dma_dev, ptr,
649-
wed->wlan.rx_size,
650-
DMA_TO_DEVICE);
651-
if (unlikely(dma_mapping_error(dev->mt76.dev, phy_addr))) {
652-
__free_pages(page, get_order(length));
653-
mt76_put_rxwi(&dev->mt76, t);
654-
goto unmap;
655-
}
641+
addr = page_pool_get_dma_addr(virt_to_head_page(buf)) + offset;
642+
dir = page_pool_get_dma_dir(q->page_pool);
643+
dma_sync_single_for_device(dev->mt76.dma_dev, addr, len, dir);
656644

657-
desc->buf0 = cpu_to_le32(phy_addr);
658-
token = mt76_rx_token_consume(&dev->mt76, ptr, t, phy_addr);
645+
desc->buf0 = cpu_to_le32(addr);
646+
token = mt76_rx_token_consume(&dev->mt76, buf, t, addr);
659647
if (token < 0) {
660-
dma_unmap_single(dev->mt76.dma_dev, phy_addr,
661-
wed->wlan.rx_size, DMA_TO_DEVICE);
662-
__free_pages(page, get_order(length));
663-
mt76_put_rxwi(&dev->mt76, t);
648+
mt76_put_page_pool_buf(buf, false);
664649
goto unmap;
665650
}
666651

@@ -672,6 +657,8 @@ static u32 mt7915_mmio_wed_init_rx_buf(struct mtk_wed_device *wed, int size)
672657
return 0;
673658

674659
unmap:
660+
if (t)
661+
mt76_put_rxwi(&dev->mt76, t);
675662
mt7915_mmio_wed_release_rx_buf(wed);
676663
return -ENOMEM;
677664
}

0 commit comments

Comments
 (0)