1*9a08862aSNagarathnam Muthusamy /* 2*9a08862aSNagarathnam Muthusamy * Set up the VMAs to tell the VM about the vDSO. 3*9a08862aSNagarathnam Muthusamy * Copyright 2007 Andi Kleen, SUSE Labs. 4*9a08862aSNagarathnam Muthusamy * Subject to the GPL, v.2 5*9a08862aSNagarathnam Muthusamy */ 6*9a08862aSNagarathnam Muthusamy 7*9a08862aSNagarathnam Muthusamy /* 8*9a08862aSNagarathnam Muthusamy * Copyright (c) 2017 Oracle and/or its affiliates. All rights reserved. 9*9a08862aSNagarathnam Muthusamy */ 10*9a08862aSNagarathnam Muthusamy 11*9a08862aSNagarathnam Muthusamy #include <linux/mm.h> 12*9a08862aSNagarathnam Muthusamy #include <linux/err.h> 13*9a08862aSNagarathnam Muthusamy #include <linux/sched.h> 14*9a08862aSNagarathnam Muthusamy #include <linux/slab.h> 15*9a08862aSNagarathnam Muthusamy #include <linux/init.h> 16*9a08862aSNagarathnam Muthusamy #include <linux/linkage.h> 17*9a08862aSNagarathnam Muthusamy #include <linux/random.h> 18*9a08862aSNagarathnam Muthusamy #include <linux/elf.h> 19*9a08862aSNagarathnam Muthusamy #include <asm/vdso.h> 20*9a08862aSNagarathnam Muthusamy #include <asm/vvar.h> 21*9a08862aSNagarathnam Muthusamy #include <asm/page.h> 22*9a08862aSNagarathnam Muthusamy 23*9a08862aSNagarathnam Muthusamy unsigned int __read_mostly vdso_enabled = 1; 24*9a08862aSNagarathnam Muthusamy 25*9a08862aSNagarathnam Muthusamy static struct vm_special_mapping vvar_mapping = { 26*9a08862aSNagarathnam Muthusamy .name = "[vvar]" 27*9a08862aSNagarathnam Muthusamy }; 28*9a08862aSNagarathnam Muthusamy 29*9a08862aSNagarathnam Muthusamy #ifdef CONFIG_SPARC64 30*9a08862aSNagarathnam Muthusamy static struct vm_special_mapping vdso_mapping64 = { 31*9a08862aSNagarathnam Muthusamy .name = "[vdso]" 32*9a08862aSNagarathnam Muthusamy }; 33*9a08862aSNagarathnam Muthusamy #endif 34*9a08862aSNagarathnam Muthusamy 35*9a08862aSNagarathnam Muthusamy #ifdef CONFIG_COMPAT 36*9a08862aSNagarathnam Muthusamy static struct vm_special_mapping vdso_mapping32 = { 37*9a08862aSNagarathnam Muthusamy .name = "[vdso]" 38*9a08862aSNagarathnam Muthusamy }; 39*9a08862aSNagarathnam Muthusamy #endif 40*9a08862aSNagarathnam Muthusamy 41*9a08862aSNagarathnam Muthusamy struct vvar_data *vvar_data; 42*9a08862aSNagarathnam Muthusamy 43*9a08862aSNagarathnam Muthusamy #define SAVE_INSTR_SIZE 4 44*9a08862aSNagarathnam Muthusamy 45*9a08862aSNagarathnam Muthusamy /* 46*9a08862aSNagarathnam Muthusamy * Allocate pages for the vdso and vvar, and copy in the vdso text from the 47*9a08862aSNagarathnam Muthusamy * kernel image. 48*9a08862aSNagarathnam Muthusamy */ 49*9a08862aSNagarathnam Muthusamy int __init init_vdso_image(const struct vdso_image *image, 50*9a08862aSNagarathnam Muthusamy struct vm_special_mapping *vdso_mapping) 51*9a08862aSNagarathnam Muthusamy { 52*9a08862aSNagarathnam Muthusamy int i; 53*9a08862aSNagarathnam Muthusamy struct page *dp, **dpp = NULL; 54*9a08862aSNagarathnam Muthusamy int dnpages = 0; 55*9a08862aSNagarathnam Muthusamy struct page *cp, **cpp = NULL; 56*9a08862aSNagarathnam Muthusamy int cnpages = (image->size) / PAGE_SIZE; 57*9a08862aSNagarathnam Muthusamy 58*9a08862aSNagarathnam Muthusamy /* 59*9a08862aSNagarathnam Muthusamy * First, the vdso text. This is initialied data, an integral number of 60*9a08862aSNagarathnam Muthusamy * pages long. 61*9a08862aSNagarathnam Muthusamy */ 62*9a08862aSNagarathnam Muthusamy if (WARN_ON(image->size % PAGE_SIZE != 0)) 63*9a08862aSNagarathnam Muthusamy goto oom; 64*9a08862aSNagarathnam Muthusamy 65*9a08862aSNagarathnam Muthusamy cpp = kcalloc(cnpages, sizeof(struct page *), GFP_KERNEL); 66*9a08862aSNagarathnam Muthusamy vdso_mapping->pages = cpp; 67*9a08862aSNagarathnam Muthusamy 68*9a08862aSNagarathnam Muthusamy if (!cpp) 69*9a08862aSNagarathnam Muthusamy goto oom; 70*9a08862aSNagarathnam Muthusamy 71*9a08862aSNagarathnam Muthusamy if (vdso_fix_stick) { 72*9a08862aSNagarathnam Muthusamy /* 73*9a08862aSNagarathnam Muthusamy * If the system uses %tick instead of %stick, patch the VDSO 74*9a08862aSNagarathnam Muthusamy * with instruction reading %tick instead of %stick. 75*9a08862aSNagarathnam Muthusamy */ 76*9a08862aSNagarathnam Muthusamy unsigned int j, k = SAVE_INSTR_SIZE; 77*9a08862aSNagarathnam Muthusamy unsigned char *data = image->data; 78*9a08862aSNagarathnam Muthusamy 79*9a08862aSNagarathnam Muthusamy for (j = image->sym_vread_tick_patch_start; 80*9a08862aSNagarathnam Muthusamy j < image->sym_vread_tick_patch_end; j++) { 81*9a08862aSNagarathnam Muthusamy 82*9a08862aSNagarathnam Muthusamy data[image->sym_vread_tick + k] = data[j]; 83*9a08862aSNagarathnam Muthusamy k++; 84*9a08862aSNagarathnam Muthusamy } 85*9a08862aSNagarathnam Muthusamy } 86*9a08862aSNagarathnam Muthusamy 87*9a08862aSNagarathnam Muthusamy for (i = 0; i < cnpages; i++) { 88*9a08862aSNagarathnam Muthusamy cp = alloc_page(GFP_KERNEL); 89*9a08862aSNagarathnam Muthusamy if (!cp) 90*9a08862aSNagarathnam Muthusamy goto oom; 91*9a08862aSNagarathnam Muthusamy cpp[i] = cp; 92*9a08862aSNagarathnam Muthusamy copy_page(page_address(cp), image->data + i * PAGE_SIZE); 93*9a08862aSNagarathnam Muthusamy } 94*9a08862aSNagarathnam Muthusamy 95*9a08862aSNagarathnam Muthusamy /* 96*9a08862aSNagarathnam Muthusamy * Now the vvar page. This is uninitialized data. 97*9a08862aSNagarathnam Muthusamy */ 98*9a08862aSNagarathnam Muthusamy 99*9a08862aSNagarathnam Muthusamy if (vvar_data == NULL) { 100*9a08862aSNagarathnam Muthusamy dnpages = (sizeof(struct vvar_data) / PAGE_SIZE) + 1; 101*9a08862aSNagarathnam Muthusamy if (WARN_ON(dnpages != 1)) 102*9a08862aSNagarathnam Muthusamy goto oom; 103*9a08862aSNagarathnam Muthusamy dpp = kcalloc(dnpages, sizeof(struct page *), GFP_KERNEL); 104*9a08862aSNagarathnam Muthusamy vvar_mapping.pages = dpp; 105*9a08862aSNagarathnam Muthusamy 106*9a08862aSNagarathnam Muthusamy if (!dpp) 107*9a08862aSNagarathnam Muthusamy goto oom; 108*9a08862aSNagarathnam Muthusamy 109*9a08862aSNagarathnam Muthusamy dp = alloc_page(GFP_KERNEL); 110*9a08862aSNagarathnam Muthusamy if (!dp) 111*9a08862aSNagarathnam Muthusamy goto oom; 112*9a08862aSNagarathnam Muthusamy 113*9a08862aSNagarathnam Muthusamy dpp[0] = dp; 114*9a08862aSNagarathnam Muthusamy vvar_data = page_address(dp); 115*9a08862aSNagarathnam Muthusamy memset(vvar_data, 0, PAGE_SIZE); 116*9a08862aSNagarathnam Muthusamy 117*9a08862aSNagarathnam Muthusamy vvar_data->seq = 0; 118*9a08862aSNagarathnam Muthusamy } 119*9a08862aSNagarathnam Muthusamy 120*9a08862aSNagarathnam Muthusamy return 0; 121*9a08862aSNagarathnam Muthusamy oom: 122*9a08862aSNagarathnam Muthusamy if (cpp != NULL) { 123*9a08862aSNagarathnam Muthusamy for (i = 0; i < cnpages; i++) { 124*9a08862aSNagarathnam Muthusamy if (cpp[i] != NULL) 125*9a08862aSNagarathnam Muthusamy __free_page(cpp[i]); 126*9a08862aSNagarathnam Muthusamy } 127*9a08862aSNagarathnam Muthusamy kfree(cpp); 128*9a08862aSNagarathnam Muthusamy vdso_mapping->pages = NULL; 129*9a08862aSNagarathnam Muthusamy } 130*9a08862aSNagarathnam Muthusamy 131*9a08862aSNagarathnam Muthusamy if (dpp != NULL) { 132*9a08862aSNagarathnam Muthusamy for (i = 0; i < dnpages; i++) { 133*9a08862aSNagarathnam Muthusamy if (dpp[i] != NULL) 134*9a08862aSNagarathnam Muthusamy __free_page(dpp[i]); 135*9a08862aSNagarathnam Muthusamy } 136*9a08862aSNagarathnam Muthusamy kfree(dpp); 137*9a08862aSNagarathnam Muthusamy vvar_mapping.pages = NULL; 138*9a08862aSNagarathnam Muthusamy } 139*9a08862aSNagarathnam Muthusamy 140*9a08862aSNagarathnam Muthusamy pr_warn("Cannot allocate vdso\n"); 141*9a08862aSNagarathnam Muthusamy vdso_enabled = 0; 142*9a08862aSNagarathnam Muthusamy return -ENOMEM; 143*9a08862aSNagarathnam Muthusamy } 144*9a08862aSNagarathnam Muthusamy 145*9a08862aSNagarathnam Muthusamy static int __init init_vdso(void) 146*9a08862aSNagarathnam Muthusamy { 147*9a08862aSNagarathnam Muthusamy int err = 0; 148*9a08862aSNagarathnam Muthusamy #ifdef CONFIG_SPARC64 149*9a08862aSNagarathnam Muthusamy err = init_vdso_image(&vdso_image_64_builtin, &vdso_mapping64); 150*9a08862aSNagarathnam Muthusamy if (err) 151*9a08862aSNagarathnam Muthusamy return err; 152*9a08862aSNagarathnam Muthusamy #endif 153*9a08862aSNagarathnam Muthusamy 154*9a08862aSNagarathnam Muthusamy #ifdef CONFIG_COMPAT 155*9a08862aSNagarathnam Muthusamy err = init_vdso_image(&vdso_image_32_builtin, &vdso_mapping32); 156*9a08862aSNagarathnam Muthusamy #endif 157*9a08862aSNagarathnam Muthusamy return err; 158*9a08862aSNagarathnam Muthusamy 159*9a08862aSNagarathnam Muthusamy } 160*9a08862aSNagarathnam Muthusamy subsys_initcall(init_vdso); 161*9a08862aSNagarathnam Muthusamy 162*9a08862aSNagarathnam Muthusamy struct linux_binprm; 163*9a08862aSNagarathnam Muthusamy 164*9a08862aSNagarathnam Muthusamy /* Shuffle the vdso up a bit, randomly. */ 165*9a08862aSNagarathnam Muthusamy static unsigned long vdso_addr(unsigned long start, unsigned int len) 166*9a08862aSNagarathnam Muthusamy { 167*9a08862aSNagarathnam Muthusamy unsigned int offset; 168*9a08862aSNagarathnam Muthusamy 169*9a08862aSNagarathnam Muthusamy /* This loses some more bits than a modulo, but is cheaper */ 170*9a08862aSNagarathnam Muthusamy offset = get_random_int() & (PTRS_PER_PTE - 1); 171*9a08862aSNagarathnam Muthusamy return start + (offset << PAGE_SHIFT); 172*9a08862aSNagarathnam Muthusamy } 173*9a08862aSNagarathnam Muthusamy 174*9a08862aSNagarathnam Muthusamy static int map_vdso(const struct vdso_image *image, 175*9a08862aSNagarathnam Muthusamy struct vm_special_mapping *vdso_mapping) 176*9a08862aSNagarathnam Muthusamy { 177*9a08862aSNagarathnam Muthusamy struct mm_struct *mm = current->mm; 178*9a08862aSNagarathnam Muthusamy struct vm_area_struct *vma; 179*9a08862aSNagarathnam Muthusamy unsigned long text_start, addr = 0; 180*9a08862aSNagarathnam Muthusamy int ret = 0; 181*9a08862aSNagarathnam Muthusamy 182*9a08862aSNagarathnam Muthusamy down_write(&mm->mmap_sem); 183*9a08862aSNagarathnam Muthusamy 184*9a08862aSNagarathnam Muthusamy /* 185*9a08862aSNagarathnam Muthusamy * First, get an unmapped region: then randomize it, and make sure that 186*9a08862aSNagarathnam Muthusamy * region is free. 187*9a08862aSNagarathnam Muthusamy */ 188*9a08862aSNagarathnam Muthusamy if (current->flags & PF_RANDOMIZE) { 189*9a08862aSNagarathnam Muthusamy addr = get_unmapped_area(NULL, 0, 190*9a08862aSNagarathnam Muthusamy image->size - image->sym_vvar_start, 191*9a08862aSNagarathnam Muthusamy 0, 0); 192*9a08862aSNagarathnam Muthusamy if (IS_ERR_VALUE(addr)) { 193*9a08862aSNagarathnam Muthusamy ret = addr; 194*9a08862aSNagarathnam Muthusamy goto up_fail; 195*9a08862aSNagarathnam Muthusamy } 196*9a08862aSNagarathnam Muthusamy addr = vdso_addr(addr, image->size - image->sym_vvar_start); 197*9a08862aSNagarathnam Muthusamy } 198*9a08862aSNagarathnam Muthusamy addr = get_unmapped_area(NULL, addr, 199*9a08862aSNagarathnam Muthusamy image->size - image->sym_vvar_start, 0, 0); 200*9a08862aSNagarathnam Muthusamy if (IS_ERR_VALUE(addr)) { 201*9a08862aSNagarathnam Muthusamy ret = addr; 202*9a08862aSNagarathnam Muthusamy goto up_fail; 203*9a08862aSNagarathnam Muthusamy } 204*9a08862aSNagarathnam Muthusamy 205*9a08862aSNagarathnam Muthusamy text_start = addr - image->sym_vvar_start; 206*9a08862aSNagarathnam Muthusamy current->mm->context.vdso = (void __user *)text_start; 207*9a08862aSNagarathnam Muthusamy 208*9a08862aSNagarathnam Muthusamy /* 209*9a08862aSNagarathnam Muthusamy * MAYWRITE to allow gdb to COW and set breakpoints 210*9a08862aSNagarathnam Muthusamy */ 211*9a08862aSNagarathnam Muthusamy vma = _install_special_mapping(mm, 212*9a08862aSNagarathnam Muthusamy text_start, 213*9a08862aSNagarathnam Muthusamy image->size, 214*9a08862aSNagarathnam Muthusamy VM_READ|VM_EXEC| 215*9a08862aSNagarathnam Muthusamy VM_MAYREAD|VM_MAYWRITE|VM_MAYEXEC, 216*9a08862aSNagarathnam Muthusamy vdso_mapping); 217*9a08862aSNagarathnam Muthusamy 218*9a08862aSNagarathnam Muthusamy if (IS_ERR(vma)) { 219*9a08862aSNagarathnam Muthusamy ret = PTR_ERR(vma); 220*9a08862aSNagarathnam Muthusamy goto up_fail; 221*9a08862aSNagarathnam Muthusamy } 222*9a08862aSNagarathnam Muthusamy 223*9a08862aSNagarathnam Muthusamy vma = _install_special_mapping(mm, 224*9a08862aSNagarathnam Muthusamy addr, 225*9a08862aSNagarathnam Muthusamy -image->sym_vvar_start, 226*9a08862aSNagarathnam Muthusamy VM_READ|VM_MAYREAD, 227*9a08862aSNagarathnam Muthusamy &vvar_mapping); 228*9a08862aSNagarathnam Muthusamy 229*9a08862aSNagarathnam Muthusamy if (IS_ERR(vma)) { 230*9a08862aSNagarathnam Muthusamy ret = PTR_ERR(vma); 231*9a08862aSNagarathnam Muthusamy do_munmap(mm, text_start, image->size, NULL); 232*9a08862aSNagarathnam Muthusamy } 233*9a08862aSNagarathnam Muthusamy 234*9a08862aSNagarathnam Muthusamy up_fail: 235*9a08862aSNagarathnam Muthusamy if (ret) 236*9a08862aSNagarathnam Muthusamy current->mm->context.vdso = NULL; 237*9a08862aSNagarathnam Muthusamy 238*9a08862aSNagarathnam Muthusamy up_write(&mm->mmap_sem); 239*9a08862aSNagarathnam Muthusamy return ret; 240*9a08862aSNagarathnam Muthusamy } 241*9a08862aSNagarathnam Muthusamy 242*9a08862aSNagarathnam Muthusamy int arch_setup_additional_pages(struct linux_binprm *bprm, int uses_interp) 243*9a08862aSNagarathnam Muthusamy { 244*9a08862aSNagarathnam Muthusamy 245*9a08862aSNagarathnam Muthusamy if (!vdso_enabled) 246*9a08862aSNagarathnam Muthusamy return 0; 247*9a08862aSNagarathnam Muthusamy 248*9a08862aSNagarathnam Muthusamy #if defined CONFIG_COMPAT 249*9a08862aSNagarathnam Muthusamy if (!(is_32bit_task())) 250*9a08862aSNagarathnam Muthusamy return map_vdso(&vdso_image_64_builtin, &vdso_mapping64); 251*9a08862aSNagarathnam Muthusamy else 252*9a08862aSNagarathnam Muthusamy return map_vdso(&vdso_image_32_builtin, &vdso_mapping32); 253*9a08862aSNagarathnam Muthusamy #else 254*9a08862aSNagarathnam Muthusamy return map_vdso(&vdso_image_64_builtin, &vdso_mapping64); 255*9a08862aSNagarathnam Muthusamy #endif 256*9a08862aSNagarathnam Muthusamy 257*9a08862aSNagarathnam Muthusamy } 258*9a08862aSNagarathnam Muthusamy 259*9a08862aSNagarathnam Muthusamy static __init int vdso_setup(char *s) 260*9a08862aSNagarathnam Muthusamy { 261*9a08862aSNagarathnam Muthusamy int err; 262*9a08862aSNagarathnam Muthusamy unsigned long val; 263*9a08862aSNagarathnam Muthusamy 264*9a08862aSNagarathnam Muthusamy err = kstrtoul(s, 10, &val); 265*9a08862aSNagarathnam Muthusamy vdso_enabled = val; 266*9a08862aSNagarathnam Muthusamy return err; 267*9a08862aSNagarathnam Muthusamy } 268*9a08862aSNagarathnam Muthusamy __setup("vdso=", vdso_setup); 269