Skip to content

Commit a3d0a91

Browse files
kiryl authored and torvalds committed
thp: make split_queue per-node
Andrea Arcangeli suggested to make split queue per-node to improve scalability. Let's do it.

Signed-off-by: Kirill A. Shutemov <[email protected]>
Suggested-by: Andrea Arcangeli <[email protected]>
Reviewed-by: Andrea Arcangeli <[email protected]>
Cc: Hugh Dickins <[email protected]>
Cc: Dave Hansen <[email protected]>
Cc: Mel Gorman <[email protected]>
Cc: Rik van Riel <[email protected]>
Cc: Vlastimil Babka <[email protected]>
Cc: "Aneesh Kumar K.V" <[email protected]>
Cc: Johannes Weiner <[email protected]>
Cc: Michal Hocko <[email protected]>
Cc: Jerome Marchand <[email protected]>
Cc: Sasha Levin <[email protected]>
Signed-off-by: Andrew Morton <[email protected]>
Signed-off-by: Linus Torvalds <[email protected]>
1 parent 34229b2 commit a3d0a91

File tree

3 files changed: 37 additions (+37) and 23 deletions (-23)

include/linux/mmzone.h

Lines changed: 6 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -682,6 +682,12 @@ typedef struct pglist_data {
682682
*/
683683
unsigned long first_deferred_pfn;
684684
#endif /* CONFIG_DEFERRED_STRUCT_PAGE_INIT */
685+
686+
#ifdef CONFIG_TRANSPARENT_HUGEPAGE
687+
spinlock_t split_queue_lock;
688+
struct list_head split_queue;
689+
unsigned long split_queue_len;
690+
#endif
685691
} pg_data_t;
686692

687693
#define node_present_pages(nid) (NODE_DATA(nid)->node_present_pages)

mm/huge_memory.c

Lines changed: 26 additions & 23 deletions
Original file line number | Diff line number | Diff line change
@@ -138,9 +138,6 @@ static struct khugepaged_scan khugepaged_scan = {
138138
.mm_head = LIST_HEAD_INIT(khugepaged_scan.mm_head),
139139
};
140140

141-
static DEFINE_SPINLOCK(split_queue_lock);
142-
static LIST_HEAD(split_queue);
143-
static unsigned long split_queue_len;
144141
static struct shrinker deferred_split_shrinker;
145142

146143
static void set_recommended_min_free_kbytes(void)
@@ -3358,6 +3355,7 @@ int total_mapcount(struct page *page)
33583355
int split_huge_page_to_list(struct page *page, struct list_head *list)
33593356
{
33603357
struct page *head = compound_head(page);
3358+
struct pglist_data *pgdata = NODE_DATA(page_to_nid(head));
33613359
struct anon_vma *anon_vma;
33623360
int count, mapcount, ret;
33633361
bool mlocked;
@@ -3401,27 +3399,27 @@ int split_huge_page_to_list(struct page *page, struct list_head *list)
34013399
lru_add_drain();
34023400

34033401
/* Prevent deferred_split_scan() touching ->_count */
3404-
spin_lock_irqsave(&split_queue_lock, flags);
3402+
spin_lock_irqsave(&pgdata->split_queue_lock, flags);
34053403
count = page_count(head);
34063404
mapcount = total_mapcount(head);
34073405
if (!mapcount && count == 1) {
34083406
if (!list_empty(page_deferred_list(head))) {
3409-
split_queue_len--;
3407+
pgdata->split_queue_len--;
34103408
list_del(page_deferred_list(head));
34113409
}
3412-
spin_unlock_irqrestore(&split_queue_lock, flags);
3410+
spin_unlock_irqrestore(&pgdata->split_queue_lock, flags);
34133411
__split_huge_page(page, list);
34143412
ret = 0;
34153413
} else if (IS_ENABLED(CONFIG_DEBUG_VM) && mapcount) {
3416-
spin_unlock_irqrestore(&split_queue_lock, flags);
3414+
spin_unlock_irqrestore(&pgdata->split_queue_lock, flags);
34173415
pr_alert("total_mapcount: %u, page_count(): %u\n",
34183416
mapcount, count);
34193417
if (PageTail(page))
34203418
dump_page(head, NULL);
34213419
dump_page(page, "total_mapcount(head) > 0");
34223420
BUG();
34233421
} else {
3424-
spin_unlock_irqrestore(&split_queue_lock, flags);
3422+
spin_unlock_irqrestore(&pgdata->split_queue_lock, flags);
34253423
unfreeze_page(anon_vma, head);
34263424
ret = -EBUSY;
34273425
}
@@ -3436,52 +3434,56 @@ int split_huge_page_to_list(struct page *page, struct list_head *list)
34363434

34373435
void free_transhuge_page(struct page *page)
34383436
{
3437+
struct pglist_data *pgdata = NODE_DATA(page_to_nid(page));
34393438
unsigned long flags;
34403439

3441-
spin_lock_irqsave(&split_queue_lock, flags);
3440+
spin_lock_irqsave(&pgdata->split_queue_lock, flags);
34423441
if (!list_empty(page_deferred_list(page))) {
3443-
split_queue_len--;
3442+
pgdata->split_queue_len--;
34443443
list_del(page_deferred_list(page));
34453444
}
3446-
spin_unlock_irqrestore(&split_queue_lock, flags);
3445+
spin_unlock_irqrestore(&pgdata->split_queue_lock, flags);
34473446
free_compound_page(page);
34483447
}
34493448

34503449
void deferred_split_huge_page(struct page *page)
34513450
{
3451+
struct pglist_data *pgdata = NODE_DATA(page_to_nid(page));
34523452
unsigned long flags;
34533453

34543454
VM_BUG_ON_PAGE(!PageTransHuge(page), page);
34553455

3456-
spin_lock_irqsave(&split_queue_lock, flags);
3456+
spin_lock_irqsave(&pgdata->split_queue_lock, flags);
34573457
if (list_empty(page_deferred_list(page))) {
3458-
list_add_tail(page_deferred_list(page), &split_queue);
3459-
split_queue_len++;
3458+
list_add_tail(page_deferred_list(page), &pgdata->split_queue);
3459+
pgdata->split_queue_len++;
34603460
}
3461-
spin_unlock_irqrestore(&split_queue_lock, flags);
3461+
spin_unlock_irqrestore(&pgdata->split_queue_lock, flags);
34623462
}
34633463

34643464
static unsigned long deferred_split_count(struct shrinker *shrink,
34653465
struct shrink_control *sc)
34663466
{
3467+
struct pglist_data *pgdata = NODE_DATA(sc->nid);
34673468
/*
34683469
* Split a page from split_queue will free up at least one page,
34693470
* at most HPAGE_PMD_NR - 1. We don't track exact number.
34703471
* Let's use HPAGE_PMD_NR / 2 as ballpark.
34713472
*/
3472-
return ACCESS_ONCE(split_queue_len) * HPAGE_PMD_NR / 2;
3473+
return ACCESS_ONCE(pgdata->split_queue_len) * HPAGE_PMD_NR / 2;
34733474
}
34743475

34753476
static unsigned long deferred_split_scan(struct shrinker *shrink,
34763477
struct shrink_control *sc)
34773478
{
3479+
struct pglist_data *pgdata = NODE_DATA(sc->nid);
34783480
unsigned long flags;
34793481
LIST_HEAD(list), *pos, *next;
34803482
struct page *page;
34813483
int split = 0;
34823484

3483-
spin_lock_irqsave(&split_queue_lock, flags);
3484-
list_splice_init(&split_queue, &list);
3485+
spin_lock_irqsave(&pgdata->split_queue_lock, flags);
3486+
list_splice_init(&pgdata->split_queue, &list);
34853487

34863488
/* Take pin on all head pages to avoid freeing them under us */
34873489
list_for_each_safe(pos, next, &list) {
@@ -3490,10 +3492,10 @@ static unsigned long deferred_split_scan(struct shrinker *shrink,
34903492
/* race with put_compound_page() */
34913493
if (!get_page_unless_zero(page)) {
34923494
list_del_init(page_deferred_list(page));
3493-
split_queue_len--;
3495+
pgdata->split_queue_len--;
34943496
}
34953497
}
3496-
spin_unlock_irqrestore(&split_queue_lock, flags);
3498+
spin_unlock_irqrestore(&pgdata->split_queue_lock, flags);
34973499

34983500
list_for_each_safe(pos, next, &list) {
34993501
page = list_entry((void *)pos, struct page, mapping);
@@ -3505,9 +3507,9 @@ static unsigned long deferred_split_scan(struct shrinker *shrink,
35053507
put_page(page);
35063508
}
35073509

3508-
spin_lock_irqsave(&split_queue_lock, flags);
3509-
list_splice_tail(&list, &split_queue);
3510-
spin_unlock_irqrestore(&split_queue_lock, flags);
3510+
spin_lock_irqsave(&pgdata->split_queue_lock, flags);
3511+
list_splice_tail(&list, &pgdata->split_queue);
3512+
spin_unlock_irqrestore(&pgdata->split_queue_lock, flags);
35113513

35123514
return split * HPAGE_PMD_NR / 2;
35133515
}
@@ -3516,6 +3518,7 @@ static struct shrinker deferred_split_shrinker = {
35163518
.count_objects = deferred_split_count,
35173519
.scan_objects = deferred_split_scan,
35183520
.seeks = DEFAULT_SEEKS,
3521+
.flags = SHRINKER_NUMA_AWARE,
35193522
};
35203523

35213524
#ifdef CONFIG_DEBUG_FS

mm/page_alloc.c

Lines changed: 5 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -5209,6 +5209,11 @@ static void __paginginit free_area_init_core(struct pglist_data *pgdat)
52095209
spin_lock_init(&pgdat->numabalancing_migrate_lock);
52105210
pgdat->numabalancing_migrate_nr_pages = 0;
52115211
pgdat->numabalancing_migrate_next_window = jiffies;
5212+
#endif
5213+
#ifdef CONFIG_TRANSPARENT_HUGEPAGE
5214+
spin_lock_init(&pgdat->split_queue_lock);
5215+
INIT_LIST_HEAD(&pgdat->split_queue);
5216+
pgdat->split_queue_len = 0;
52125217
#endif
52135218
init_waitqueue_head(&pgdat->kswapd_wait);
52145219
init_waitqueue_head(&pgdat->pfmemalloc_wait);

0 commit comments

Comments
 (0)