David Brazdil | 0f672f6 | 2019-12-10 10:32:29 +0000 | [diff] [blame] | 1 | // SPDX-License-Identifier: GPL-2.0-only |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 2 | /* |
| 3 | * mm_init.c - Memory initialisation verification and debugging |
| 4 | * |
| 5 | * Copyright 2008 IBM Corporation, 2008 |
| 6 | * Author Mel Gorman <mel@csn.ul.ie> |
| 7 | * |
| 8 | */ |
| 9 | #include <linux/kernel.h> |
| 10 | #include <linux/init.h> |
| 11 | #include <linux/kobject.h> |
| 12 | #include <linux/export.h> |
| 13 | #include <linux/memory.h> |
| 14 | #include <linux/notifier.h> |
| 15 | #include <linux/sched.h> |
Olivier Deprez | 157378f | 2022-04-04 15:47:50 +0200 | [diff] [blame^] | 16 | #include <linux/mman.h> |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 17 | #include "internal.h" |
| 18 | |
| 19 | #ifdef CONFIG_DEBUG_MEMORY_INIT |
| 20 | int __meminitdata mminit_loglevel; |
| 21 | |
| 22 | #ifndef SECTIONS_SHIFT |
| 23 | #define SECTIONS_SHIFT 0 |
| 24 | #endif |
| 25 | |
| 26 | /* The zonelists are simply reported, validation is manual. */ |
| 27 | void __init mminit_verify_zonelist(void) |
| 28 | { |
| 29 | int nid; |
| 30 | |
| 31 | if (mminit_loglevel < MMINIT_VERIFY) |
| 32 | return; |
| 33 | |
| 34 | for_each_online_node(nid) { |
| 35 | pg_data_t *pgdat = NODE_DATA(nid); |
| 36 | struct zone *zone; |
| 37 | struct zoneref *z; |
| 38 | struct zonelist *zonelist; |
| 39 | int i, listid, zoneid; |
| 40 | |
Olivier Deprez | 157378f | 2022-04-04 15:47:50 +0200 | [diff] [blame^] | 41 | BUILD_BUG_ON(MAX_ZONELISTS > 2); |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 42 | for (i = 0; i < MAX_ZONELISTS * MAX_NR_ZONES; i++) { |
| 43 | |
| 44 | /* Identify the zone and nodelist */ |
| 45 | zoneid = i % MAX_NR_ZONES; |
| 46 | listid = i / MAX_NR_ZONES; |
| 47 | zonelist = &pgdat->node_zonelists[listid]; |
| 48 | zone = &pgdat->node_zones[zoneid]; |
| 49 | if (!populated_zone(zone)) |
| 50 | continue; |
| 51 | |
| 52 | /* Print information about the zonelist */ |
| 53 | printk(KERN_DEBUG "mminit::zonelist %s %d:%s = ", |
| 54 | listid > 0 ? "thisnode" : "general", nid, |
| 55 | zone->name); |
| 56 | |
| 57 | /* Iterate the zonelist */ |
| 58 | for_each_zone_zonelist(zone, z, zonelist, zoneid) |
| 59 | pr_cont("%d:%s ", zone_to_nid(zone), zone->name); |
| 60 | pr_cont("\n"); |
| 61 | } |
| 62 | } |
| 63 | } |
| 64 | |
| 65 | void __init mminit_verify_pageflags_layout(void) |
| 66 | { |
| 67 | int shift, width; |
| 68 | unsigned long or_mask, add_mask; |
| 69 | |
| 70 | shift = 8 * sizeof(unsigned long); |
Olivier Deprez | 157378f | 2022-04-04 15:47:50 +0200 | [diff] [blame^] | 71 | width = shift - SECTIONS_WIDTH - NODES_WIDTH - ZONES_WIDTH |
| 72 | - LAST_CPUPID_SHIFT - KASAN_TAG_WIDTH; |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 73 | mminit_dprintk(MMINIT_TRACE, "pageflags_layout_widths", |
Olivier Deprez | 157378f | 2022-04-04 15:47:50 +0200 | [diff] [blame^] | 74 | "Section %d Node %d Zone %d Lastcpupid %d Kasantag %d Flags %d\n", |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 75 | SECTIONS_WIDTH, |
| 76 | NODES_WIDTH, |
| 77 | ZONES_WIDTH, |
| 78 | LAST_CPUPID_WIDTH, |
Olivier Deprez | 157378f | 2022-04-04 15:47:50 +0200 | [diff] [blame^] | 79 | KASAN_TAG_WIDTH, |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 80 | NR_PAGEFLAGS); |
| 81 | mminit_dprintk(MMINIT_TRACE, "pageflags_layout_shifts", |
Olivier Deprez | 157378f | 2022-04-04 15:47:50 +0200 | [diff] [blame^] | 82 | "Section %d Node %d Zone %d Lastcpupid %d Kasantag %d\n", |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 83 | SECTIONS_SHIFT, |
| 84 | NODES_SHIFT, |
| 85 | ZONES_SHIFT, |
Olivier Deprez | 157378f | 2022-04-04 15:47:50 +0200 | [diff] [blame^] | 86 | LAST_CPUPID_SHIFT, |
| 87 | KASAN_TAG_WIDTH); |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 88 | mminit_dprintk(MMINIT_TRACE, "pageflags_layout_pgshifts", |
Olivier Deprez | 157378f | 2022-04-04 15:47:50 +0200 | [diff] [blame^] | 89 | "Section %lu Node %lu Zone %lu Lastcpupid %lu Kasantag %lu\n", |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 90 | (unsigned long)SECTIONS_PGSHIFT, |
| 91 | (unsigned long)NODES_PGSHIFT, |
| 92 | (unsigned long)ZONES_PGSHIFT, |
Olivier Deprez | 157378f | 2022-04-04 15:47:50 +0200 | [diff] [blame^] | 93 | (unsigned long)LAST_CPUPID_PGSHIFT, |
| 94 | (unsigned long)KASAN_TAG_PGSHIFT); |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 95 | mminit_dprintk(MMINIT_TRACE, "pageflags_layout_nodezoneid", |
| 96 | "Node/Zone ID: %lu -> %lu\n", |
| 97 | (unsigned long)(ZONEID_PGOFF + ZONEID_SHIFT), |
| 98 | (unsigned long)ZONEID_PGOFF); |
| 99 | mminit_dprintk(MMINIT_TRACE, "pageflags_layout_usage", |
| 100 | "location: %d -> %d layout %d -> %d unused %d -> %d page-flags\n", |
| 101 | shift, width, width, NR_PAGEFLAGS, NR_PAGEFLAGS, 0); |
| 102 | #ifdef NODE_NOT_IN_PAGE_FLAGS |
| 103 | mminit_dprintk(MMINIT_TRACE, "pageflags_layout_nodeflags", |
| 104 | "Node not in page flags"); |
| 105 | #endif |
| 106 | #ifdef LAST_CPUPID_NOT_IN_PAGE_FLAGS |
| 107 | mminit_dprintk(MMINIT_TRACE, "pageflags_layout_nodeflags", |
| 108 | "Last cpupid not in page flags"); |
| 109 | #endif |
| 110 | |
| 111 | if (SECTIONS_WIDTH) { |
| 112 | shift -= SECTIONS_WIDTH; |
| 113 | BUG_ON(shift != SECTIONS_PGSHIFT); |
| 114 | } |
| 115 | if (NODES_WIDTH) { |
| 116 | shift -= NODES_WIDTH; |
| 117 | BUG_ON(shift != NODES_PGSHIFT); |
| 118 | } |
| 119 | if (ZONES_WIDTH) { |
| 120 | shift -= ZONES_WIDTH; |
| 121 | BUG_ON(shift != ZONES_PGSHIFT); |
| 122 | } |
| 123 | |
| 124 | /* Check for bitmask overlaps */ |
| 125 | or_mask = (ZONES_MASK << ZONES_PGSHIFT) | |
| 126 | (NODES_MASK << NODES_PGSHIFT) | |
| 127 | (SECTIONS_MASK << SECTIONS_PGSHIFT); |
| 128 | add_mask = (ZONES_MASK << ZONES_PGSHIFT) + |
| 129 | (NODES_MASK << NODES_PGSHIFT) + |
| 130 | (SECTIONS_MASK << SECTIONS_PGSHIFT); |
| 131 | BUG_ON(or_mask != add_mask); |
| 132 | } |
| 133 | |
| 134 | static __init int set_mminit_loglevel(char *str) |
| 135 | { |
| 136 | get_option(&str, &mminit_loglevel); |
| 137 | return 0; |
| 138 | } |
| 139 | early_param("mminit_loglevel", set_mminit_loglevel); |
| 140 | #endif /* CONFIG_DEBUG_MEMORY_INIT */ |
| 141 | |
/* kobject for the "mm" directory; set up by mm_sysfs_init(). */
struct kobject *mm_kobj;
EXPORT_SYMBOL_GPL(mm_kobj);
| 144 | |
| 145 | #ifdef CONFIG_SMP |
| 146 | s32 vm_committed_as_batch = 32; |
| 147 | |
Olivier Deprez | 157378f | 2022-04-04 15:47:50 +0200 | [diff] [blame^] | 148 | void mm_compute_batch(int overcommit_policy) |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 149 | { |
| 150 | u64 memsized_batch; |
| 151 | s32 nr = num_present_cpus(); |
| 152 | s32 batch = max_t(s32, nr*2, 32); |
Olivier Deprez | 157378f | 2022-04-04 15:47:50 +0200 | [diff] [blame^] | 153 | unsigned long ram_pages = totalram_pages(); |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 154 | |
Olivier Deprez | 157378f | 2022-04-04 15:47:50 +0200 | [diff] [blame^] | 155 | /* |
| 156 | * For policy OVERCOMMIT_NEVER, set batch size to 0.4% of |
| 157 | * (total memory/#cpus), and lift it to 25% for other policies |
| 158 | * to easy the possible lock contention for percpu_counter |
| 159 | * vm_committed_as, while the max limit is INT_MAX |
| 160 | */ |
| 161 | if (overcommit_policy == OVERCOMMIT_NEVER) |
| 162 | memsized_batch = min_t(u64, ram_pages/nr/256, INT_MAX); |
| 163 | else |
| 164 | memsized_batch = min_t(u64, ram_pages/nr/4, INT_MAX); |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 165 | |
| 166 | vm_committed_as_batch = max_t(s32, memsized_batch, batch); |
| 167 | } |
| 168 | |
| 169 | static int __meminit mm_compute_batch_notifier(struct notifier_block *self, |
| 170 | unsigned long action, void *arg) |
| 171 | { |
| 172 | switch (action) { |
| 173 | case MEM_ONLINE: |
| 174 | case MEM_OFFLINE: |
Olivier Deprez | 157378f | 2022-04-04 15:47:50 +0200 | [diff] [blame^] | 175 | mm_compute_batch(sysctl_overcommit_memory); |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 176 | default: |
| 177 | break; |
| 178 | } |
| 179 | return NOTIFY_OK; |
| 180 | } |
| 181 | |
| 182 | static struct notifier_block compute_batch_nb __meminitdata = { |
| 183 | .notifier_call = mm_compute_batch_notifier, |
| 184 | .priority = IPC_CALLBACK_PRI, /* use lowest priority */ |
| 185 | }; |
| 186 | |
| 187 | static int __init mm_compute_batch_init(void) |
| 188 | { |
Olivier Deprez | 157378f | 2022-04-04 15:47:50 +0200 | [diff] [blame^] | 189 | mm_compute_batch(sysctl_overcommit_memory); |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 190 | register_hotmemory_notifier(&compute_batch_nb); |
| 191 | |
| 192 | return 0; |
| 193 | } |
| 194 | |
| 195 | __initcall(mm_compute_batch_init); |
| 196 | |
| 197 | #endif |
| 198 | |
| 199 | static int __init mm_sysfs_init(void) |
| 200 | { |
| 201 | mm_kobj = kobject_create_and_add("mm", kernel_kobj); |
| 202 | if (!mm_kobj) |
| 203 | return -ENOMEM; |
| 204 | |
| 205 | return 0; |
| 206 | } |
| 207 | postcore_initcall(mm_sysfs_init); |