// SPDX-License-Identifier: GPL-2.0-or-later
/*
 * PowerPC version
 * Copyright (C) 1995-1996 Gary Thomas (gdt@linuxppc.org)
 *
 * Modifications by Paul Mackerras (PowerMac) (paulus@cs.anu.edu.au)
 * and Cort Dougan (PReP) (cort@cs.nmt.edu)
 * Copyright (C) 1996 Paul Mackerras
 * PPC44x/36-bit changes by Matt Porter (mporter@mvista.com)
 *
 * Derived from "arch/i386/mm/init.c"
 * Copyright (C) 1991, 1992, 1993, 1994 Linus Torvalds
 */

#include <linux/export.h>
#include <linux/sched.h>
#include <linux/kernel.h>
#include <linux/errno.h>
#include <linux/string.h>
#include <linux/gfp.h>
#include <linux/types.h>
#include <linux/mm.h>
#include <linux/stddef.h>
#include <linux/init.h>
#include <linux/memblock.h>
#include <linux/highmem.h>
#include <linux/initrd.h>
#include <linux/pagemap.h>
#include <linux/suspend.h>
#include <linux/hugetlb.h>
#include <linux/slab.h>
#include <linux/vmalloc.h>
#include <linux/memremap.h>
#include <linux/dma-direct.h>
#include <linux/kprobes.h>

#include <asm/prom.h>
#include <asm/io.h>
#include <asm/mmu_context.h>
#include <asm/mmu.h>
#include <asm/smp.h>
#include <asm/machdep.h>
#include <asm/btext.h>
#include <asm/tlb.h>
#include <asm/sections.h>
#include <asm/sparsemem.h>
#include <asm/vdso.h>
#include <asm/fixmap.h>
#include <asm/swiotlb.h>
#include <asm/rtas.h>
#include <asm/kasan.h>
#include <asm/svm.h>
#include <asm/mmzone.h>

#include <mm/mmu_decl.h>

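/*
 * Fall back to zero on platforms whose cputable does not define these
 * features, so that the cpu_has_feature() tests below compile away.
 */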
#ifndef CPU_FTR_COHERENT_ICACHE
#define CPU_FTR_COHERENT_ICACHE	0	/* XXX for now */
#define CPU_FTR_NOEXECUTE	0
#endif

unsigned long long memory_limit;
bool init_mem_is_free;

#ifdef CONFIG_HIGHMEM
pte_t *kmap_pte;
EXPORT_SYMBOL(kmap_pte);
#endif

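/*
 * Select the page protection for mappings of physical memory (e.g. via
 * /dev/mem): let the platform override if it provides a hook, otherwise
 * map anything that is not RAM as non-cached.
 */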
pgprot_t phys_mem_access_prot(struct file *file, unsigned long pfn,
			      unsigned long size, pgprot_t vma_prot)
{
	if (ppc_md.phys_mem_access_prot)
		return ppc_md.phys_mem_access_prot(file, pfn, size, vma_prot);

	if (!page_is_ram(pfn))
		vma_prot = pgprot_noncached(vma_prot);

	return vma_prot;
}
EXPORT_SYMBOL(phys_mem_access_prot);

#ifdef CONFIG_MEMORY_HOTPLUG

#ifdef CONFIG_NUMA
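/* Resolve the NUMA node that a hot-added physical range belongs to. */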
int memory_add_physaddr_to_nid(u64 start)
{
	return hot_add_scn_to_nid(start);
}
#endif

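/*
 * Weak fallbacks for platforms that do not provide their own helpers for
 * mapping hotplugged memory into the linear mapping; MMU-specific code
 * overrides these with real implementations.
 */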
int __weak create_section_mapping(unsigned long start, unsigned long end,
				  int nid, pgprot_t prot)
{
	return -ENODEV;
}

int __weak remove_section_mapping(unsigned long start, unsigned long end)
{
	return -ENODEV;
}

#define FLUSH_CHUNK_SIZE SZ_1G
/**
 * flush_dcache_range_chunked(): Write any modified data cache blocks out to
 * memory and invalidate them, in chunks of up to FLUSH_CHUNK_SIZE.
 * Does not invalidate the corresponding instruction cache blocks.
 *
 * @start: the start address
 * @stop: the stop address (exclusive)
 * @chunk: the max size of the chunks
 */
static void flush_dcache_range_chunked(unsigned long start, unsigned long stop,
				       unsigned long chunk)
{
	unsigned long i;

	for (i = start; i < stop; i += chunk) {
		flush_dcache_range(i, min(stop, i + chunk));
		cond_resched();
	}
}

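/*
 * Memory hotplug: map the new range into the kernel linear mapping first,
 * then hand the page frames over to the core mm.
 */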
int __ref arch_add_memory(int nid, u64 start, u64 size,
			  struct mhp_params *params)
{
	unsigned long start_pfn = start >> PAGE_SHIFT;
	unsigned long nr_pages = size >> PAGE_SHIFT;
	int rc;

	start = (unsigned long)__va(start);
	rc = create_section_mapping(start, start + size, nid,
				    params->pgprot);
	if (rc) {
		pr_warn("Unable to create mapping for hot added memory 0x%llx..0x%llx: %d\n",
			start, start + size, rc);
		return -EFAULT;
	}

	return __add_pages(nid, start_pfn, nr_pages, params);
}

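/*
 * Tear-down is the mirror image: release the pages from the core mm, then
 * flush and unmap the linear-mapping alias of the removed range.
 */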
void __ref arch_remove_memory(int nid, u64 start, u64 size,
			      struct vmem_altmap *altmap)
{
	unsigned long start_pfn = start >> PAGE_SHIFT;
	unsigned long nr_pages = size >> PAGE_SHIFT;
	int ret;

	__remove_pages(start_pfn, nr_pages, altmap);

	/* Remove htab bolted mappings for this section of memory */
	start = (unsigned long)__va(start);
	flush_dcache_range_chunked(start, start + size, FLUSH_CHUNK_SIZE);

	ret = remove_section_mapping(start, start + size);
	WARN_ON_ONCE(ret);

	/*
	 * Ensure all vmalloc mappings are flushed in case they also
	 * hit that section of memory.
	 */
	vm_unmap_aliases();
}
#endif

#ifndef CONFIG_NEED_MULTIPLE_NODES
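/* Flat (non-NUMA) memory setup: everything ends up in a single node 0. */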
void __init mem_topology_setup(void)
{
	max_low_pfn = max_pfn = memblock_end_of_DRAM() >> PAGE_SHIFT;
	min_low_pfn = MEMORY_START >> PAGE_SHIFT;
#ifdef CONFIG_HIGHMEM
	max_low_pfn = lowmem_end_addr >> PAGE_SHIFT;
#endif

	/*
	 * Place all memblock_regions in the same node and merge contiguous
	 * memblock_regions.
	 */
	memblock_set_node(0, PHYS_ADDR_MAX, &memblock.memory, 0);
}

void __init initmem_init(void)
{
	sparse_init();
}

/* mark pages that don't exist as nosave */
static int __init mark_nonram_nosave(void)
{
	unsigned long spfn, epfn, prev = 0;
	int i;

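	/*
	 * Walk the memory ranges in ascending PFN order; any hole between
	 * the end of one range and the start of the next must not be
	 * saved by hibernation, so register it as a nosave region.
	 */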
	for_each_mem_pfn_range(i, MAX_NUMNODES, &spfn, &epfn, NULL) {
		if (prev && prev < spfn)
			register_nosave_region(prev, spfn);

		prev = epfn;
	}

	return 0;
}
#else /* CONFIG_NEED_MULTIPLE_NODES */
static int __init mark_nonram_nosave(void)
{
	return 0;
}
#endif

/*
 * Zone usage:
 *
 * We set up ZONE_DMA to cover the low 31 bits (30 on PPC32) and ZONE_NORMAL
 * to be everything else. GFP_DMA32 page allocations automatically fall back
 * to ZONE_DMA.
 *
 * By recording that bound in zone_dma_bits we can inform the generic DMA
 * mapping code. 32-bit only devices (if not handled by an IOMMU anyway) will
 * take a first dip into ZONE_NORMAL and get otherwise served by ZONE_DMA.
 */
static unsigned long max_zone_pfns[MAX_NR_ZONES];

/*
 * paging_init() sets up the page tables - in fact we've already done this.
 */
void __init paging_init(void)
{
	unsigned long long total_ram = memblock_phys_mem_size();
	phys_addr_t top_of_ram = memblock_end_of_DRAM();

#ifdef CONFIG_HIGHMEM
	unsigned long v = __fix_to_virt(FIX_KMAP_END);
	unsigned long end = __fix_to_virt(FIX_KMAP_BEGIN);

	for (; v < end; v += PAGE_SIZE)
		map_kernel_page(v, 0, __pgprot(0));	/* XXX gross */

	map_kernel_page(PKMAP_BASE, 0, __pgprot(0));	/* XXX gross */
	pkmap_page_table = virt_to_kpte(PKMAP_BASE);

	kmap_pte = virt_to_kpte(__fix_to_virt(FIX_KMAP_BEGIN));
#endif /* CONFIG_HIGHMEM */

	printk(KERN_DEBUG "Top of RAM: 0x%llx, Total RAM: 0x%llx\n",
	       (unsigned long long)top_of_ram, total_ram);
	printk(KERN_DEBUG "Memory hole size: %ldMB\n",
	       (long int)((top_of_ram - total_ram) >> 20));

	/*
	 * Allow 30-bit DMA for very limited Broadcom wifi chips on many
	 * powerbooks.
	 */
	if (IS_ENABLED(CONFIG_PPC32))
		zone_dma_bits = 30;
	else
		zone_dma_bits = 31;

#ifdef CONFIG_ZONE_DMA
	max_zone_pfns[ZONE_DMA] = min(max_low_pfn,
				      1UL << (zone_dma_bits - PAGE_SHIFT));
#endif
	max_zone_pfns[ZONE_NORMAL] = max_low_pfn;
#ifdef CONFIG_HIGHMEM
	max_zone_pfns[ZONE_HIGHMEM] = max_pfn;
#endif

	free_area_init(max_zone_pfns);

	mark_nonram_nosave();
}

void __init mem_init(void)
{
	/*
	 * book3s is limited to 16 page sizes due to encoding this in
	 * a 4-bit field for slices.
	 */
	BUILD_BUG_ON(MMU_PAGE_COUNT > 16);

#ifdef CONFIG_SWIOTLB
	/*
	 * Some platforms (e.g. 85xx) limit DMA-able memory way below
	 * 4G. We force memblock to bottom-up mode to ensure that the
	 * memory allocated in swiotlb_init() is DMA-able.
	 * As it's the last memblock allocation, no need to reset it
	 * back to top-down.
	 */
	memblock_set_bottom_up(true);
	if (is_secure_guest())
		svm_swiotlb_init();
	else
		swiotlb_init(0);
#endif

	high_memory = (void *) __va(max_low_pfn * PAGE_SIZE);
	set_max_mapnr(max_pfn);

	kasan_late_init();

	memblock_free_all();

#ifdef CONFIG_HIGHMEM
	{
		unsigned long pfn, highmem_mapnr;

		highmem_mapnr = lowmem_end_addr >> PAGE_SHIFT;
		for (pfn = highmem_mapnr; pfn < max_mapnr; ++pfn) {
			phys_addr_t paddr = (phys_addr_t)pfn << PAGE_SHIFT;
			struct page *page = pfn_to_page(pfn);
			if (!memblock_is_reserved(paddr))
				free_highmem_page(page);
		}
	}
#endif /* CONFIG_HIGHMEM */

#if defined(CONFIG_PPC_FSL_BOOK3E) && !defined(CONFIG_SMP)
	/*
	 * If smp is enabled, next_tlbcam_idx is initialized in the cpu up
	 * functions.... do it here for the non-smp case.
	 */
	per_cpu(next_tlbcam_idx, smp_processor_id()) =
		(mfspr(SPRN_TLB1CFG) & TLBnCFG_N_ENTRY) - 1;
#endif

	mem_init_print_info(NULL);
#ifdef CONFIG_PPC32
	pr_info("Kernel virtual memory layout:\n");
#ifdef CONFIG_KASAN
	pr_info("  * 0x%08lx..0x%08lx  : kasan shadow mem\n",
		KASAN_SHADOW_START, KASAN_SHADOW_END);
#endif
	pr_info("  * 0x%08lx..0x%08lx  : fixmap\n", FIXADDR_START, FIXADDR_TOP);
#ifdef CONFIG_HIGHMEM
	pr_info("  * 0x%08lx..0x%08lx  : highmem PTEs\n",
		PKMAP_BASE, PKMAP_ADDR(LAST_PKMAP));
#endif /* CONFIG_HIGHMEM */
	if (ioremap_bot != IOREMAP_TOP)
		pr_info("  * 0x%08lx..0x%08lx  : early ioremap\n",
			ioremap_bot, IOREMAP_TOP);
	pr_info("  * 0x%08lx..0x%08lx  : vmalloc & ioremap\n",
		VMALLOC_START, VMALLOC_END);
#endif /* CONFIG_PPC32 */
}

void free_initmem(void)
{
	ppc_md.progress = ppc_printk_progress;
	mark_initmem_nx();
	init_mem_is_free = true;
	free_initmem_default(POISON_FREE_INITMEM);
}

/**
 * flush_coherent_icache() - if a CPU has a coherent icache, flush it
 * @addr: The base address to use (can be any valid address, the whole cache will be flushed)
 * Return true if the cache was flushed, false otherwise
 */
static inline bool flush_coherent_icache(unsigned long addr)
{
	/*
	 * For a snooping icache, we still need a dummy icbi to purge all the
	 * prefetched instructions from the ifetch buffers. We also need a sync
	 * before the icbi to order the actual stores to memory that might
	 * have modified instructions with the icbi.
	 */
	if (cpu_has_feature(CPU_FTR_COHERENT_ICACHE)) {
		mb(); /* sync */
		allow_read_from_user((const void __user *)addr, L1_CACHE_BYTES);
		icbi((void *)addr);
		prevent_read_from_user((const void __user *)addr, L1_CACHE_BYTES);
		mb(); /* sync */
		isync();
		return true;
	}

	return false;
}

/**
 * invalidate_icache_range() - Flush the icache by issuing icbi across an address range
 * @start: the start address
 * @stop: the stop address (exclusive)
 */
static void invalidate_icache_range(unsigned long start, unsigned long stop)
{
	unsigned long shift = l1_icache_shift();
	unsigned long bytes = l1_icache_bytes();
	char *addr = (char *)(start & ~(bytes - 1));
	unsigned long size = stop - (unsigned long)addr + (bytes - 1);
	unsigned long i;

	for (i = 0; i < size >> shift; i++, addr += bytes)
		icbi(addr);

	mb(); /* sync */
	isync();
}

/**
 * flush_icache_range: Write any modified data cache blocks out to memory
 * and invalidate the corresponding blocks in the instruction cache
 *
 * Generic code will call this after writing memory, before executing from it.
 *
 * @start: the start address
 * @stop: the stop address (exclusive)
 */
void flush_icache_range(unsigned long start, unsigned long stop)
{
	if (flush_coherent_icache(start))
		return;

	clean_dcache_range(start, stop);

	if (IS_ENABLED(CONFIG_44x)) {
		/*
		 * Flash invalidate on 44x because we are passed kmapped
		 * addresses and this doesn't work for userspace pages due to
		 * the virtually tagged icache.
		 */
		iccci((void *)start);
		mb(); /* sync */
		isync();
	} else
		invalidate_icache_range(start, stop);
}
EXPORT_SYMBOL(flush_icache_range);

#if !defined(CONFIG_PPC_8xx) && !defined(CONFIG_PPC64)
/**
 * flush_dcache_icache_phys() - Flush a page by its physical address
 * @physaddr: the physical address of the page
 */
static void flush_dcache_icache_phys(unsigned long physaddr)
{
	unsigned long bytes = l1_dcache_bytes();
	unsigned long nb = PAGE_SIZE / bytes;
	unsigned long addr = physaddr & PAGE_MASK;
	unsigned long msr, msr0;
	unsigned long loop1 = addr, loop2 = addr;

	msr0 = mfmsr();
	msr = msr0 & ~MSR_DR;
	/*
	 * This must remain as ASM to prevent potential memory accesses
	 * while the data MMU is disabled
	 */
	asm volatile(
		"   mtctr %2;\n"
		"   mtmsr %3;\n"
		"   isync;\n"
		"0: dcbst   0, %0;\n"
		"   addi    %0, %0, %4;\n"
		"   bdnz    0b;\n"
		"   sync;\n"
		"   mtctr %2;\n"
		"1: icbi    0, %1;\n"
		"   addi    %1, %1, %4;\n"
		"   bdnz    1b;\n"
		"   sync;\n"
		"   mtmsr %5;\n"
		"   isync;\n"
		: "+&r" (loop1), "+&r" (loop2)
		: "r" (nb), "r" (msr), "i" (bytes), "r" (msr0)
		: "ctr", "memory");
}
NOKPROBE_SYMBOL(flush_dcache_icache_phys)
#endif // !defined(CONFIG_PPC_8xx) && !defined(CONFIG_PPC64)

/*
 * This is called when a page has been modified by the kernel.
 * It just marks the page as not i-cache clean.  We do the i-cache
 * flush later when the page is given to a user process, if necessary.
 */
void flush_dcache_page(struct page *page)
{
	if (cpu_has_feature(CPU_FTR_COHERENT_ICACHE))
		return;
	/* avoid an atomic op if possible */
	if (test_bit(PG_arch_1, &page->flags))
		clear_bit(PG_arch_1, &page->flags);
}
EXPORT_SYMBOL(flush_dcache_page);

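/*
 * Flush a page out of the data cache and invalidate it in the instruction
 * cache, choosing the cheapest access available: per-subpage for compound
 * (huge) pages, a temporary kmap for highmem pages, or a flush by physical
 * address otherwise.
 */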
void flush_dcache_icache_page(struct page *page)
{
#ifdef CONFIG_HUGETLB_PAGE
	if (PageCompound(page)) {
		flush_dcache_icache_hugepage(page);
		return;
	}
#endif
#if defined(CONFIG_PPC_8xx) || defined(CONFIG_PPC64)
	/* On 8xx there is no need to kmap since highmem is not supported */
	__flush_dcache_icache(page_address(page));
#else
	if (IS_ENABLED(CONFIG_BOOKE) || sizeof(phys_addr_t) > sizeof(void *)) {
		void *start = kmap_atomic(page);
		__flush_dcache_icache(start);
		kunmap_atomic(start);
	} else {
		unsigned long addr = page_to_pfn(page) << PAGE_SHIFT;

		if (flush_coherent_icache(addr))
			return;
		flush_dcache_icache_phys(addr);
	}
#endif
}
EXPORT_SYMBOL(flush_dcache_icache_page);

/**
 * __flush_dcache_icache(): Flush a particular page from the data cache to RAM.
 * Note: this is necessary because the instruction cache does *not*
 * snoop from the data cache.
 *
 * @p: the address of the page to flush
 */
void __flush_dcache_icache(void *p)
{
	unsigned long addr = (unsigned long)p;

	if (flush_coherent_icache(addr))
		return;

	clean_dcache_range(addr, addr + PAGE_SIZE);

	/*
	 * We don't flush the icache on 44x. Those have a virtual icache and we
	 * don't have access to the virtual address here (it's not the page
	 * vaddr but where it's mapped in user space). The flushing of the
	 * icache on these is handled elsewhere, when a change in the address
	 * space occurs, before returning to user space.
	 */

	if (mmu_has_feature(MMU_FTR_TYPE_44x))
		return;

	invalidate_icache_range(addr, addr + PAGE_SIZE);
}

void clear_user_page(void *page, unsigned long vaddr, struct page *pg)
{
	clear_page(page);

	/*
	 * We shouldn't have to do this, but some versions of glibc
	 * require it (ld.so assumes zero filled pages are icache clean)
	 * - Anton
	 */
	flush_dcache_page(pg);
}
EXPORT_SYMBOL(clear_user_page);

void copy_user_page(void *vto, void *vfrom, unsigned long vaddr,
		    struct page *pg)
{
	copy_page(vto, vfrom);

	/*
	 * We should be able to use the following optimisation, however
	 * there are two problems.
	 * Firstly a bug in some versions of binutils meant PLT sections
	 * were not marked executable.
	 * Secondly the first word in the GOT section is blrl, used
	 * to establish the GOT address. Until recently the GOT was
	 * not marked executable.
	 * - Anton
	 */
#if 0
	if (!vma->vm_file && ((vma->vm_flags & VM_EXEC) == 0))
		return;
#endif

	flush_dcache_page(pg);
}

void flush_icache_user_page(struct vm_area_struct *vma, struct page *page,
			    unsigned long addr, int len)
{
	unsigned long maddr;

	maddr = (unsigned long) kmap(page) + (addr & ~PAGE_MASK);
	flush_icache_range(maddr, maddr + len);
	kunmap(page);
}

/*
 * System memory should not be in /proc/iomem but various tools expect it
 * (eg kdump).
 */
static int __init add_system_ram_resources(void)
{
	phys_addr_t start, end;
	u64 i;

	for_each_mem_range(i, &start, &end) {
		struct resource *res;

		res = kzalloc(sizeof(struct resource), GFP_KERNEL);
		WARN_ON(!res);

		if (res) {
			res->name = "System RAM";
			res->start = start;
			/*
			 * In memblock, end points to the first byte after
			 * the range while in resources, end points to the
			 * last byte in the range.
			 */
			res->end = end - 1;
			res->flags = IORESOURCE_SYSTEM_RAM | IORESOURCE_BUSY;
			WARN_ON(request_resource(&iomem_resource, res) < 0);
		}
	}

	return 0;
}
subsys_initcall(add_system_ram_resources);

#ifdef CONFIG_STRICT_DEVMEM
/*
 * devmem_is_allowed(): check to see if /dev/mem access to a certain address
 * is valid. The argument is a physical page number.
 *
 * Access has to be given to non-kernel-ram areas as well, these contain the
 * PCI mmio resources as well as potential bios/acpi data regions.
 */
int devmem_is_allowed(unsigned long pfn)
{
	if (page_is_rtas_user_buf(pfn))
		return 1;
	if (iomem_is_exclusive(PFN_PHYS(pfn)))
		return 0;
	if (!page_is_ram(pfn))
		return 1;
	return 0;
}
#endif /* CONFIG_STRICT_DEVMEM */

/*
 * This is defined in kernel/resource.c but only powerpc needs to export it, for
 * the EHEA driver. Drop this when drivers/net/ethernet/ibm/ehea is removed.
 */
EXPORT_SYMBOL_GPL(walk_system_ram_range);