1 /* 2 * Copyright IBM Corp. 2005, 2011 3 * 4 * Author(s): Rolf Adelsberger, 5 * Heiko Carstens <heiko.carstens@de.ibm.com> 6 * Michael Holzheu <holzheu@linux.vnet.ibm.com> 7 */ 8 9 #include <linux/device.h> 10 #include <linux/mm.h> 11 #include <linux/kexec.h> 12 #include <linux/delay.h> 13 #include <linux/reboot.h> 14 #include <linux/ftrace.h> 15 #include <linux/debug_locks.h> 16 #include <linux/suspend.h> 17 #include <asm/cio.h> 18 #include <asm/setup.h> 19 #include <asm/pgtable.h> 20 #include <asm/pgalloc.h> 21 #include <asm/smp.h> 22 #include <asm/reset.h> 23 #include <asm/ipl.h> 24 #include <asm/diag.h> 25 #include <asm/elf.h> 26 #include <asm/asm-offsets.h> 27 #include <asm/cacheflush.h> 28 #include <asm/os_info.h> 29 #include <asm/set_memory.h> 30 #include <asm/switch_to.h> 31 #include <asm/nmi.h> 32 33 typedef void (*relocate_kernel_t)(kimage_entry_t *, unsigned long); 34 35 extern const unsigned char relocate_kernel[]; 36 extern const unsigned long long relocate_kernel_len; 37 38 #ifdef CONFIG_CRASH_DUMP 39 40 /* 41 * PM notifier callback for kdump 42 */ 43 static int machine_kdump_pm_cb(struct notifier_block *nb, unsigned long action, 44 void *ptr) 45 { 46 switch (action) { 47 case PM_SUSPEND_PREPARE: 48 case PM_HIBERNATION_PREPARE: 49 if (kexec_crash_image) 50 arch_kexec_unprotect_crashkres(); 51 break; 52 case PM_POST_SUSPEND: 53 case PM_POST_HIBERNATION: 54 if (kexec_crash_image) 55 arch_kexec_protect_crashkres(); 56 break; 57 default: 58 return NOTIFY_DONE; 59 } 60 return NOTIFY_OK; 61 } 62 63 static int __init machine_kdump_pm_init(void) 64 { 65 pm_notifier(machine_kdump_pm_cb, 0); 66 return 0; 67 } 68 arch_initcall(machine_kdump_pm_init); 69 70 /* 71 * Reset the system, copy boot CPU registers to absolute zero, 72 * and jump to the kdump image 73 */ 74 static void __do_machine_kdump(void *image) 75 { 76 int (*start_kdump)(int); 77 unsigned long prefix; 78 79 /* store_status() saved the prefix register to lowcore */ 80 prefix = (unsigned long) S390_lowcore.prefixreg_save_area; 81 82 /* Now do the reset */ 83 s390_reset_system(); 84 85 /* 86 * Copy dump CPU store status info to absolute zero. 87 * This need to be done *after* s390_reset_system set the 88 * prefix register of this CPU to zero 89 */ 90 memcpy((void *) __LC_FPREGS_SAVE_AREA, 91 (void *)(prefix + __LC_FPREGS_SAVE_AREA), 512); 92 93 __load_psw_mask(PSW_MASK_BASE | PSW_DEFAULT_KEY | PSW_MASK_EA | PSW_MASK_BA); 94 start_kdump = (void *)((struct kimage *) image)->start; 95 start_kdump(1); 96 97 /* Die if start_kdump returns */ 98 disabled_wait((unsigned long) __builtin_return_address(0)); 99 } 100 101 /* 102 * Start kdump: create a LGR log entry, store status of all CPUs and 103 * branch to __do_machine_kdump. 104 */ 105 static noinline void __machine_kdump(void *image) 106 { 107 struct mcesa *mcesa; 108 unsigned long cr2_old, cr2_new; 109 int this_cpu, cpu; 110 111 lgr_info_log(); 112 /* Get status of the other CPUs */ 113 this_cpu = smp_find_processor_id(stap()); 114 for_each_online_cpu(cpu) { 115 if (cpu == this_cpu) 116 continue; 117 if (smp_store_status(cpu)) 118 continue; 119 } 120 /* Store status of the boot CPU */ 121 mcesa = (struct mcesa *)(S390_lowcore.mcesad & MCESA_ORIGIN_MASK); 122 if (MACHINE_HAS_VX) 123 save_vx_regs((__vector128 *) mcesa->vector_save_area); 124 if (MACHINE_HAS_GS) { 125 __ctl_store(cr2_old, 2, 2); 126 cr2_new = cr2_old | (1UL << 4); 127 __ctl_load(cr2_new, 2, 2); 128 save_gs_cb((struct gs_cb *) mcesa->guarded_storage_save_area); 129 __ctl_load(cr2_old, 2, 2); 130 } 131 /* 132 * To create a good backchain for this CPU in the dump store_status 133 * is passed the address of a function. The address is saved into 134 * the PSW save area of the boot CPU and the function is invoked as 135 * a tail call of store_status. The backchain in the dump will look 136 * like this: 137 * restart_int_handler -> __machine_kexec -> __do_machine_kdump 138 * The call to store_status() will not return. 139 */ 140 store_status(__do_machine_kdump, image); 141 } 142 #endif 143 144 /* 145 * Check if kdump checksums are valid: We call purgatory with parameter "0" 146 */ 147 static int kdump_csum_valid(struct kimage *image) 148 { 149 #ifdef CONFIG_CRASH_DUMP 150 int (*start_kdump)(int) = (void *)image->start; 151 int rc; 152 153 __arch_local_irq_stnsm(0xfb); /* disable DAT */ 154 rc = start_kdump(0); 155 __arch_local_irq_stosm(0x04); /* enable DAT */ 156 return rc ? 0 : -EINVAL; 157 #else 158 return -EINVAL; 159 #endif 160 } 161 162 #ifdef CONFIG_CRASH_DUMP 163 164 void crash_free_reserved_phys_range(unsigned long begin, unsigned long end) 165 { 166 unsigned long addr, size; 167 168 for (addr = begin; addr < end; addr += PAGE_SIZE) 169 free_reserved_page(pfn_to_page(addr >> PAGE_SHIFT)); 170 size = begin - crashk_res.start; 171 if (size) 172 os_info_crashkernel_add(crashk_res.start, size); 173 else 174 os_info_crashkernel_add(0, 0); 175 } 176 177 static void crash_protect_pages(int protect) 178 { 179 unsigned long size; 180 181 if (!crashk_res.end) 182 return; 183 size = resource_size(&crashk_res); 184 if (protect) 185 set_memory_ro(crashk_res.start, size >> PAGE_SHIFT); 186 else 187 set_memory_rw(crashk_res.start, size >> PAGE_SHIFT); 188 } 189 190 void arch_kexec_protect_crashkres(void) 191 { 192 crash_protect_pages(1); 193 } 194 195 void arch_kexec_unprotect_crashkres(void) 196 { 197 crash_protect_pages(0); 198 } 199 200 #endif 201 202 /* 203 * Give back memory to hypervisor before new kdump is loaded 204 */ 205 static int machine_kexec_prepare_kdump(void) 206 { 207 #ifdef CONFIG_CRASH_DUMP 208 if (MACHINE_IS_VM) 209 diag10_range(PFN_DOWN(crashk_res.start), 210 PFN_DOWN(crashk_res.end - crashk_res.start + 1)); 211 return 0; 212 #else 213 return -EINVAL; 214 #endif 215 } 216 217 int machine_kexec_prepare(struct kimage *image) 218 { 219 void *reboot_code_buffer; 220 221 /* Can't replace kernel image since it is read-only. */ 222 if (ipl_flags & IPL_NSS_VALID) 223 return -EOPNOTSUPP; 224 225 if (image->type == KEXEC_TYPE_CRASH) 226 return machine_kexec_prepare_kdump(); 227 228 /* We don't support anything but the default image type for now. */ 229 if (image->type != KEXEC_TYPE_DEFAULT) 230 return -EINVAL; 231 232 /* Get the destination where the assembler code should be copied to.*/ 233 reboot_code_buffer = (void *) page_to_phys(image->control_code_page); 234 235 /* Then copy it */ 236 memcpy(reboot_code_buffer, relocate_kernel, relocate_kernel_len); 237 return 0; 238 } 239 240 void machine_kexec_cleanup(struct kimage *image) 241 { 242 } 243 244 void arch_crash_save_vmcoreinfo(void) 245 { 246 VMCOREINFO_SYMBOL(lowcore_ptr); 247 VMCOREINFO_SYMBOL(high_memory); 248 VMCOREINFO_LENGTH(lowcore_ptr, NR_CPUS); 249 mem_assign_absolute(S390_lowcore.vmcore_info, paddr_vmcoreinfo_note()); 250 } 251 252 void machine_shutdown(void) 253 { 254 } 255 256 void machine_crash_shutdown(struct pt_regs *regs) 257 { 258 } 259 260 /* 261 * Do normal kexec 262 */ 263 static void __do_machine_kexec(void *data) 264 { 265 relocate_kernel_t data_mover; 266 struct kimage *image = data; 267 268 s390_reset_system(); 269 data_mover = (relocate_kernel_t) page_to_phys(image->control_code_page); 270 271 /* Call the moving routine */ 272 (*data_mover)(&image->head, image->start); 273 274 /* Die if kexec returns */ 275 disabled_wait((unsigned long) __builtin_return_address(0)); 276 } 277 278 /* 279 * Reset system and call either kdump or normal kexec 280 */ 281 static void __machine_kexec(void *data) 282 { 283 __arch_local_irq_stosm(0x04); /* enable DAT */ 284 pfault_fini(); 285 tracing_off(); 286 debug_locks_off(); 287 #ifdef CONFIG_CRASH_DUMP 288 if (((struct kimage *) data)->type == KEXEC_TYPE_CRASH) 289 __machine_kdump(data); 290 #endif 291 __do_machine_kexec(data); 292 } 293 294 /* 295 * Do either kdump or normal kexec. In case of kdump we first ask 296 * purgatory, if kdump checksums are valid. 297 */ 298 void machine_kexec(struct kimage *image) 299 { 300 if (image->type == KEXEC_TYPE_CRASH && !kdump_csum_valid(image)) 301 return; 302 tracer_disable(); 303 smp_send_stop(); 304 smp_call_ipl_cpu(__machine_kexec, image); 305 } 306