Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 1 | /* |
| 2 | * Code to handle transition of Linux booting another kernel. |
| 3 | * |
| 4 | * Copyright (C) 2002-2003 Eric Biederman <ebiederm@xmission.com> |
| 5 | * GameCube/ppc32 port Copyright (C) 2004 Albert Herranz |
| 6 | * Copyright (C) 2005 IBM Corporation. |
| 7 | * |
| 8 | * This source code is licensed under the GNU General Public License, |
| 9 | * Version 2. See the file COPYING for more details. |
| 10 | */ |
| 11 | |
| 12 | #include <linux/kexec.h> |
| 13 | #include <linux/reboot.h> |
| 14 | #include <linux/threads.h> |
| 15 | #include <linux/memblock.h> |
| 16 | #include <linux/of.h> |
| 17 | #include <linux/irq.h> |
| 18 | #include <linux/ftrace.h> |
| 19 | |
| 20 | #include <asm/kdump.h> |
| 21 | #include <asm/machdep.h> |
| 22 | #include <asm/pgalloc.h> |
| 23 | #include <asm/prom.h> |
| 24 | #include <asm/sections.h> |
| 25 | |
| 26 | void machine_kexec_mask_interrupts(void) { |
| 27 | unsigned int i; |
| 28 | struct irq_desc *desc; |
| 29 | |
| 30 | for_each_irq_desc(i, desc) { |
| 31 | struct irq_chip *chip; |
| 32 | |
| 33 | chip = irq_desc_get_chip(desc); |
| 34 | if (!chip) |
| 35 | continue; |
| 36 | |
| 37 | if (chip->irq_eoi && irqd_irq_inprogress(&desc->irq_data)) |
| 38 | chip->irq_eoi(&desc->irq_data); |
| 39 | |
| 40 | if (chip->irq_mask) |
| 41 | chip->irq_mask(&desc->irq_data); |
| 42 | |
| 43 | if (chip->irq_disable && !irqd_irq_disabled(&desc->irq_data)) |
| 44 | chip->irq_disable(&desc->irq_data); |
| 45 | } |
| 46 | } |
| 47 | |
| 48 | void machine_crash_shutdown(struct pt_regs *regs) |
| 49 | { |
| 50 | default_machine_crash_shutdown(regs); |
| 51 | } |
| 52 | |
| 53 | /* |
| 54 | * Do what every setup is needed on image and the |
| 55 | * reboot code buffer to allow us to avoid allocations |
| 56 | * later. |
| 57 | */ |
| 58 | int machine_kexec_prepare(struct kimage *image) |
| 59 | { |
| 60 | if (ppc_md.machine_kexec_prepare) |
| 61 | return ppc_md.machine_kexec_prepare(image); |
| 62 | else |
| 63 | return default_machine_kexec_prepare(image); |
| 64 | } |
| 65 | |
| 66 | void machine_kexec_cleanup(struct kimage *image) |
| 67 | { |
| 68 | } |
| 69 | |
| 70 | void arch_crash_save_vmcoreinfo(void) |
| 71 | { |
| 72 | |
| 73 | #ifdef CONFIG_NEED_MULTIPLE_NODES |
| 74 | VMCOREINFO_SYMBOL(node_data); |
| 75 | VMCOREINFO_LENGTH(node_data, MAX_NUMNODES); |
| 76 | #endif |
| 77 | #ifndef CONFIG_NEED_MULTIPLE_NODES |
| 78 | VMCOREINFO_SYMBOL(contig_page_data); |
| 79 | #endif |
| 80 | #if defined(CONFIG_PPC64) && defined(CONFIG_SPARSEMEM_VMEMMAP) |
| 81 | VMCOREINFO_SYMBOL(vmemmap_list); |
| 82 | VMCOREINFO_SYMBOL(mmu_vmemmap_psize); |
| 83 | VMCOREINFO_SYMBOL(mmu_psize_defs); |
| 84 | VMCOREINFO_STRUCT_SIZE(vmemmap_backing); |
| 85 | VMCOREINFO_OFFSET(vmemmap_backing, list); |
| 86 | VMCOREINFO_OFFSET(vmemmap_backing, phys); |
| 87 | VMCOREINFO_OFFSET(vmemmap_backing, virt_addr); |
| 88 | VMCOREINFO_STRUCT_SIZE(mmu_psize_def); |
| 89 | VMCOREINFO_OFFSET(mmu_psize_def, shift); |
| 90 | #endif |
| 91 | } |
| 92 | |
| 93 | /* |
| 94 | * Do not allocate memory (or fail in any way) in machine_kexec(). |
| 95 | * We are past the point of no return, committed to rebooting now. |
| 96 | */ |
| 97 | void machine_kexec(struct kimage *image) |
| 98 | { |
| 99 | int save_ftrace_enabled; |
| 100 | |
| 101 | save_ftrace_enabled = __ftrace_enabled_save(); |
| 102 | this_cpu_disable_ftrace(); |
| 103 | |
| 104 | if (ppc_md.machine_kexec) |
| 105 | ppc_md.machine_kexec(image); |
| 106 | else |
| 107 | default_machine_kexec(image); |
| 108 | |
| 109 | this_cpu_enable_ftrace(); |
| 110 | __ftrace_enabled_restore(save_ftrace_enabled); |
| 111 | |
| 112 | /* Fall back to normal restart if we're still alive. */ |
| 113 | machine_restart(NULL); |
| 114 | for(;;); |
| 115 | } |
| 116 | |
| 117 | void __init reserve_crashkernel(void) |
| 118 | { |
| 119 | unsigned long long crash_size, crash_base; |
| 120 | int ret; |
| 121 | |
| 122 | /* use common parsing */ |
| 123 | ret = parse_crashkernel(boot_command_line, memblock_phys_mem_size(), |
| 124 | &crash_size, &crash_base); |
| 125 | if (ret == 0 && crash_size > 0) { |
| 126 | crashk_res.start = crash_base; |
| 127 | crashk_res.end = crash_base + crash_size - 1; |
| 128 | } |
| 129 | |
| 130 | if (crashk_res.end == crashk_res.start) { |
| 131 | crashk_res.start = crashk_res.end = 0; |
| 132 | return; |
| 133 | } |
| 134 | |
| 135 | /* We might have got these values via the command line or the |
| 136 | * device tree, either way sanitise them now. */ |
| 137 | |
| 138 | crash_size = resource_size(&crashk_res); |
| 139 | |
| 140 | #ifndef CONFIG_NONSTATIC_KERNEL |
| 141 | if (crashk_res.start != KDUMP_KERNELBASE) |
| 142 | printk("Crash kernel location must be 0x%x\n", |
| 143 | KDUMP_KERNELBASE); |
| 144 | |
| 145 | crashk_res.start = KDUMP_KERNELBASE; |
| 146 | #else |
| 147 | if (!crashk_res.start) { |
| 148 | #ifdef CONFIG_PPC64 |
| 149 | /* |
| 150 | * On 64bit we split the RMO in half but cap it at half of |
| 151 | * a small SLB (128MB) since the crash kernel needs to place |
| 152 | * itself and some stacks to be in the first segment. |
| 153 | */ |
| 154 | crashk_res.start = min(0x8000000ULL, (ppc64_rma_size / 2)); |
| 155 | #else |
| 156 | crashk_res.start = KDUMP_KERNELBASE; |
| 157 | #endif |
| 158 | } |
| 159 | |
| 160 | crash_base = PAGE_ALIGN(crashk_res.start); |
| 161 | if (crash_base != crashk_res.start) { |
| 162 | printk("Crash kernel base must be aligned to 0x%lx\n", |
| 163 | PAGE_SIZE); |
| 164 | crashk_res.start = crash_base; |
| 165 | } |
| 166 | |
| 167 | #endif |
| 168 | crash_size = PAGE_ALIGN(crash_size); |
| 169 | crashk_res.end = crashk_res.start + crash_size - 1; |
| 170 | |
| 171 | /* The crash region must not overlap the current kernel */ |
| 172 | if (overlaps_crashkernel(__pa(_stext), _end - _stext)) { |
| 173 | printk(KERN_WARNING |
| 174 | "Crash kernel can not overlap current kernel\n"); |
| 175 | crashk_res.start = crashk_res.end = 0; |
| 176 | return; |
| 177 | } |
| 178 | |
| 179 | /* Crash kernel trumps memory limit */ |
| 180 | if (memory_limit && memory_limit <= crashk_res.end) { |
| 181 | memory_limit = crashk_res.end + 1; |
| 182 | printk("Adjusted memory limit for crashkernel, now 0x%llx\n", |
| 183 | memory_limit); |
| 184 | } |
| 185 | |
| 186 | printk(KERN_INFO "Reserving %ldMB of memory at %ldMB " |
| 187 | "for crashkernel (System RAM: %ldMB)\n", |
| 188 | (unsigned long)(crash_size >> 20), |
| 189 | (unsigned long)(crashk_res.start >> 20), |
| 190 | (unsigned long)(memblock_phys_mem_size() >> 20)); |
| 191 | |
| 192 | if (!memblock_is_region_memory(crashk_res.start, crash_size) || |
| 193 | memblock_reserve(crashk_res.start, crash_size)) { |
| 194 | pr_err("Failed to reserve memory for crashkernel!\n"); |
| 195 | crashk_res.start = crashk_res.end = 0; |
| 196 | return; |
| 197 | } |
| 198 | } |
| 199 | |
| 200 | int overlaps_crashkernel(unsigned long start, unsigned long size) |
| 201 | { |
| 202 | return (start + size) > crashk_res.start && start <= crashk_res.end; |
| 203 | } |
| 204 | |
| 205 | /* Values we need to export to the second kernel via the device tree. */ |
| 206 | static phys_addr_t kernel_end; |
| 207 | static phys_addr_t crashk_base; |
| 208 | static phys_addr_t crashk_size; |
| 209 | static unsigned long long mem_limit; |
| 210 | |
| 211 | static struct property kernel_end_prop = { |
| 212 | .name = "linux,kernel-end", |
| 213 | .length = sizeof(phys_addr_t), |
| 214 | .value = &kernel_end, |
| 215 | }; |
| 216 | |
| 217 | static struct property crashk_base_prop = { |
| 218 | .name = "linux,crashkernel-base", |
| 219 | .length = sizeof(phys_addr_t), |
| 220 | .value = &crashk_base |
| 221 | }; |
| 222 | |
| 223 | static struct property crashk_size_prop = { |
| 224 | .name = "linux,crashkernel-size", |
| 225 | .length = sizeof(phys_addr_t), |
| 226 | .value = &crashk_size, |
| 227 | }; |
| 228 | |
| 229 | static struct property memory_limit_prop = { |
| 230 | .name = "linux,memory-limit", |
| 231 | .length = sizeof(unsigned long long), |
| 232 | .value = &mem_limit, |
| 233 | }; |
| 234 | |
| 235 | #define cpu_to_be_ulong __PASTE(cpu_to_be, BITS_PER_LONG) |
| 236 | |
| 237 | static void __init export_crashk_values(struct device_node *node) |
| 238 | { |
| 239 | /* There might be existing crash kernel properties, but we can't |
| 240 | * be sure what's in them, so remove them. */ |
| 241 | of_remove_property(node, of_find_property(node, |
| 242 | "linux,crashkernel-base", NULL)); |
| 243 | of_remove_property(node, of_find_property(node, |
| 244 | "linux,crashkernel-size", NULL)); |
| 245 | |
| 246 | if (crashk_res.start != 0) { |
| 247 | crashk_base = cpu_to_be_ulong(crashk_res.start), |
| 248 | of_add_property(node, &crashk_base_prop); |
| 249 | crashk_size = cpu_to_be_ulong(resource_size(&crashk_res)); |
| 250 | of_add_property(node, &crashk_size_prop); |
| 251 | } |
| 252 | |
| 253 | /* |
| 254 | * memory_limit is required by the kexec-tools to limit the |
| 255 | * crash regions to the actual memory used. |
| 256 | */ |
| 257 | mem_limit = cpu_to_be_ulong(memory_limit); |
| 258 | of_update_property(node, &memory_limit_prop); |
| 259 | } |
| 260 | |
| 261 | static int __init kexec_setup(void) |
| 262 | { |
| 263 | struct device_node *node; |
| 264 | |
| 265 | node = of_find_node_by_path("/chosen"); |
| 266 | if (!node) |
| 267 | return -ENOENT; |
| 268 | |
| 269 | /* remove any stale properties so ours can be found */ |
| 270 | of_remove_property(node, of_find_property(node, kernel_end_prop.name, NULL)); |
| 271 | |
| 272 | /* information needed by userspace when using default_machine_kexec */ |
| 273 | kernel_end = cpu_to_be_ulong(__pa(_end)); |
| 274 | of_add_property(node, &kernel_end_prop); |
| 275 | |
| 276 | export_crashk_values(node); |
| 277 | |
| 278 | of_node_put(node); |
| 279 | return 0; |
| 280 | } |
| 281 | late_initcall(kexec_setup); |