234 lines
6.7 KiB
Diff
234 lines
6.7 KiB
Diff
From: Ingo Molnar <mingo@elte.hu>
|
|
Date: Fri, 3 Jul 2009 08:29:37 -0500
|
|
Subject: mm: page_alloc: rt-friendly per-cpu pages
|
|
Origin: https://www.kernel.org/pub/linux/kernel/projects/rt/4.18/older/patches-4.18.7-rt5.tar.xz
|
|
|
|
rt-friendly per-cpu pages: convert the irqs-off per-cpu locking
|
|
method into a preemptible method that uses explicit per-cpu locks.
|
|
|
|
Contains fixes from:
|
|
Peter Zijlstra <a.p.zijlstra@chello.nl>
|
|
Thomas Gleixner <tglx@linutronix.de>
|
|
|
|
Signed-off-by: Ingo Molnar <mingo@elte.hu>
|
|
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
|
|
---
|
|
mm/page_alloc.c | 63 ++++++++++++++++++++++++++++++++++++++------------------
|
|
1 file changed, 43 insertions(+), 20 deletions(-)
|
|
|
|
--- a/mm/page_alloc.c
|
|
+++ b/mm/page_alloc.c
|
|
@@ -61,6 +61,7 @@
|
|
#include <linux/hugetlb.h>
|
|
#include <linux/sched/rt.h>
|
|
#include <linux/sched/mm.h>
|
|
+#include <linux/locallock.h>
|
|
#include <linux/page_owner.h>
|
|
#include <linux/kthread.h>
|
|
#include <linux/memcontrol.h>
|
|
@@ -291,6 +292,18 @@ EXPORT_SYMBOL(nr_node_ids);
|
|
EXPORT_SYMBOL(nr_online_nodes);
|
|
#endif
|
|
|
|
+static DEFINE_LOCAL_IRQ_LOCK(pa_lock);
|
|
+
|
|
+#ifdef CONFIG_PREEMPT_RT_BASE
|
|
+# define cpu_lock_irqsave(cpu, flags) \
|
|
+ local_lock_irqsave_on(pa_lock, flags, cpu)
|
|
+# define cpu_unlock_irqrestore(cpu, flags) \
|
|
+ local_unlock_irqrestore_on(pa_lock, flags, cpu)
|
|
+#else
|
|
+# define cpu_lock_irqsave(cpu, flags) local_irq_save(flags)
|
|
+# define cpu_unlock_irqrestore(cpu, flags) local_irq_restore(flags)
|
|
+#endif
|
|
+
|
|
int page_group_by_mobility_disabled __read_mostly;
|
|
|
|
#ifdef CONFIG_DEFERRED_STRUCT_PAGE_INIT
|
|
@@ -1268,10 +1281,10 @@ static void __free_pages_ok(struct page
|
|
return;
|
|
|
|
migratetype = get_pfnblock_migratetype(page, pfn);
|
|
- local_irq_save(flags);
|
|
+ local_lock_irqsave(pa_lock, flags);
|
|
__count_vm_events(PGFREE, 1 << order);
|
|
free_one_page(page_zone(page), page, pfn, order, migratetype);
|
|
- local_irq_restore(flags);
|
|
+ local_unlock_irqrestore(pa_lock, flags);
|
|
}
|
|
|
|
static void __init __free_pages_boot_core(struct page *page, unsigned int order)
|
|
@@ -2539,13 +2552,13 @@ void drain_zone_pages(struct zone *zone,
|
|
int to_drain, batch;
|
|
LIST_HEAD(dst);
|
|
|
|
- local_irq_save(flags);
|
|
+ local_lock_irqsave(pa_lock, flags);
|
|
batch = READ_ONCE(pcp->batch);
|
|
to_drain = min(pcp->count, batch);
|
|
if (to_drain > 0)
|
|
isolate_pcp_pages(to_drain, pcp, &dst);
|
|
|
|
- local_irq_restore(flags);
|
|
+ local_unlock_irqrestore(pa_lock, flags);
|
|
|
|
if (to_drain > 0)
|
|
free_pcppages_bulk(zone, &dst, false);
|
|
@@ -2567,7 +2580,7 @@ static void drain_pages_zone(unsigned in
|
|
LIST_HEAD(dst);
|
|
int count;
|
|
|
|
- local_irq_save(flags);
|
|
+ cpu_lock_irqsave(cpu, flags);
|
|
pset = per_cpu_ptr(zone->pageset, cpu);
|
|
|
|
pcp = &pset->pcp;
|
|
@@ -2575,7 +2588,7 @@ static void drain_pages_zone(unsigned in
|
|
if (count)
|
|
isolate_pcp_pages(count, pcp, &dst);
|
|
|
|
- local_irq_restore(flags);
|
|
+ cpu_unlock_irqrestore(cpu, flags);
|
|
|
|
if (count)
|
|
free_pcppages_bulk(zone, &dst, false);
|
|
@@ -2613,6 +2626,7 @@ void drain_local_pages(struct zone *zone
|
|
drain_pages(cpu);
|
|
}
|
|
|
|
+#ifndef CONFIG_PREEMPT_RT_BASE
|
|
static void drain_local_pages_wq(struct work_struct *work)
|
|
{
|
|
/*
|
|
@@ -2626,6 +2640,7 @@ static void drain_local_pages_wq(struct
|
|
drain_local_pages(NULL);
|
|
preempt_enable();
|
|
}
|
|
+#endif
|
|
|
|
/*
|
|
* Spill all the per-cpu pages from all CPUs back into the buddy allocator.
|
|
@@ -2692,7 +2707,14 @@ void drain_all_pages(struct zone *zone)
|
|
else
|
|
cpumask_clear_cpu(cpu, &cpus_with_pcps);
|
|
}
|
|
-
|
|
+#ifdef CONFIG_PREEMPT_RT_BASE
|
|
+ for_each_cpu(cpu, &cpus_with_pcps) {
|
|
+ if (zone)
|
|
+ drain_pages_zone(cpu, zone);
|
|
+ else
|
|
+ drain_pages(cpu);
|
|
+ }
|
|
+#else
|
|
for_each_cpu(cpu, &cpus_with_pcps) {
|
|
struct work_struct *work = per_cpu_ptr(&pcpu_drain, cpu);
|
|
INIT_WORK(work, drain_local_pages_wq);
|
|
@@ -2700,6 +2722,7 @@ void drain_all_pages(struct zone *zone)
|
|
}
|
|
for_each_cpu(cpu, &cpus_with_pcps)
|
|
flush_work(per_cpu_ptr(&pcpu_drain, cpu));
|
|
+#endif
|
|
|
|
mutex_unlock(&pcpu_drain_mutex);
|
|
}
|
|
@@ -2819,9 +2842,9 @@ void free_unref_page(struct page *page)
|
|
if (!free_unref_page_prepare(page, pfn))
|
|
return;
|
|
|
|
- local_irq_save(flags);
|
|
+ local_lock_irqsave(pa_lock, flags);
|
|
free_unref_page_commit(page, pfn, &dst);
|
|
- local_irq_restore(flags);
|
|
+ local_unlock_irqrestore(pa_lock, flags);
|
|
if (!list_empty(&dst))
|
|
free_pcppages_bulk(zone, &dst, false);
|
|
}
|
|
@@ -2848,7 +2871,7 @@ void free_unref_page_list(struct list_he
|
|
set_page_private(page, pfn);
|
|
}
|
|
|
|
- local_irq_save(flags);
|
|
+ local_lock_irqsave(pa_lock, flags);
|
|
list_for_each_entry_safe(page, next, list, lru) {
|
|
unsigned long pfn = page_private(page);
|
|
enum zone_type type;
|
|
@@ -2863,12 +2886,12 @@ void free_unref_page_list(struct list_he
|
|
* a large list of pages to free.
|
|
*/
|
|
if (++batch_count == SWAP_CLUSTER_MAX) {
|
|
- local_irq_restore(flags);
|
|
+ local_unlock_irqrestore(pa_lock, flags);
|
|
batch_count = 0;
|
|
- local_irq_save(flags);
|
|
+ local_lock_irqsave(pa_lock, flags);
|
|
}
|
|
}
|
|
- local_irq_restore(flags);
|
|
+ local_unlock_irqrestore(pa_lock, flags);
|
|
|
|
for (i = 0; i < __MAX_NR_ZONES; ) {
|
|
struct page *page;
|
|
@@ -3017,7 +3040,7 @@ static struct page *rmqueue_pcplist(stru
|
|
struct page *page;
|
|
unsigned long flags;
|
|
|
|
- local_irq_save(flags);
|
|
+ local_lock_irqsave(pa_lock, flags);
|
|
pcp = &this_cpu_ptr(zone->pageset)->pcp;
|
|
list = &pcp->lists[migratetype];
|
|
page = __rmqueue_pcplist(zone, migratetype, pcp, list);
|
|
@@ -3025,7 +3048,7 @@ static struct page *rmqueue_pcplist(stru
|
|
__count_zid_vm_events(PGALLOC, page_zonenum(page), 1 << order);
|
|
zone_statistics(preferred_zone, zone);
|
|
}
|
|
- local_irq_restore(flags);
|
|
+ local_unlock_irqrestore(pa_lock, flags);
|
|
return page;
|
|
}
|
|
|
|
@@ -3052,7 +3075,7 @@ struct page *rmqueue(struct zone *prefer
|
|
* allocate greater than order-1 page units with __GFP_NOFAIL.
|
|
*/
|
|
WARN_ON_ONCE((gfp_flags & __GFP_NOFAIL) && (order > 1));
|
|
- spin_lock_irqsave(&zone->lock, flags);
|
|
+ local_spin_lock_irqsave(pa_lock, &zone->lock, flags);
|
|
|
|
do {
|
|
page = NULL;
|
|
@@ -3072,14 +3095,14 @@ struct page *rmqueue(struct zone *prefer
|
|
|
|
__count_zid_vm_events(PGALLOC, page_zonenum(page), 1 << order);
|
|
zone_statistics(preferred_zone, zone);
|
|
- local_irq_restore(flags);
|
|
+ local_unlock_irqrestore(pa_lock, flags);
|
|
|
|
out:
|
|
VM_BUG_ON_PAGE(page && bad_range(zone, page), page);
|
|
return page;
|
|
|
|
failed:
|
|
- local_irq_restore(flags);
|
|
+ local_unlock_irqrestore(pa_lock, flags);
|
|
return NULL;
|
|
}
|
|
|
|
@@ -8011,7 +8034,7 @@ void zone_pcp_reset(struct zone *zone)
|
|
struct per_cpu_pageset *pset;
|
|
|
|
/* avoid races with drain_pages() */
|
|
- local_irq_save(flags);
|
|
+ local_lock_irqsave(pa_lock, flags);
|
|
if (zone->pageset != &boot_pageset) {
|
|
for_each_online_cpu(cpu) {
|
|
pset = per_cpu_ptr(zone->pageset, cpu);
|
|
@@ -8020,7 +8043,7 @@ void zone_pcp_reset(struct zone *zone)
|
|
free_percpu(zone->pageset);
|
|
zone->pageset = &boot_pageset;
|
|
}
|
|
- local_irq_restore(flags);
|
|
+ local_unlock_irqrestore(pa_lock, flags);
|
|
}
|
|
|
|
#ifdef CONFIG_MEMORY_HOTREMOVE
|