19a08862aSNagarathnam Muthusamy /* 29a08862aSNagarathnam Muthusamy * Set up the VMAs to tell the VM about the vDSO. 39a08862aSNagarathnam Muthusamy * Copyright 2007 Andi Kleen, SUSE Labs. 49a08862aSNagarathnam Muthusamy * Subject to the GPL, v.2 59a08862aSNagarathnam Muthusamy */ 69a08862aSNagarathnam Muthusamy 79a08862aSNagarathnam Muthusamy /* 89a08862aSNagarathnam Muthusamy * Copyright (c) 2017 Oracle and/or its affiliates. All rights reserved. 99a08862aSNagarathnam Muthusamy */ 109a08862aSNagarathnam Muthusamy 119a08862aSNagarathnam Muthusamy #include <linux/mm.h> 129a08862aSNagarathnam Muthusamy #include <linux/err.h> 139a08862aSNagarathnam Muthusamy #include <linux/sched.h> 149a08862aSNagarathnam Muthusamy #include <linux/slab.h> 159a08862aSNagarathnam Muthusamy #include <linux/init.h> 169a08862aSNagarathnam Muthusamy #include <linux/linkage.h> 179a08862aSNagarathnam Muthusamy #include <linux/random.h> 189a08862aSNagarathnam Muthusamy #include <linux/elf.h> 199a08862aSNagarathnam Muthusamy #include <asm/vdso.h> 209a08862aSNagarathnam Muthusamy #include <asm/vvar.h> 219a08862aSNagarathnam Muthusamy #include <asm/page.h> 229a08862aSNagarathnam Muthusamy 239a08862aSNagarathnam Muthusamy unsigned int __read_mostly vdso_enabled = 1; 249a08862aSNagarathnam Muthusamy 259a08862aSNagarathnam Muthusamy static struct vm_special_mapping vvar_mapping = { 269a08862aSNagarathnam Muthusamy .name = "[vvar]" 279a08862aSNagarathnam Muthusamy }; 289a08862aSNagarathnam Muthusamy 299a08862aSNagarathnam Muthusamy #ifdef CONFIG_SPARC64 309a08862aSNagarathnam Muthusamy static struct vm_special_mapping vdso_mapping64 = { 319a08862aSNagarathnam Muthusamy .name = "[vdso]" 329a08862aSNagarathnam Muthusamy }; 339a08862aSNagarathnam Muthusamy #endif 349a08862aSNagarathnam Muthusamy 359a08862aSNagarathnam Muthusamy #ifdef CONFIG_COMPAT 369a08862aSNagarathnam Muthusamy static struct vm_special_mapping vdso_mapping32 = { 379a08862aSNagarathnam Muthusamy .name = "[vdso]" 389a08862aSNagarathnam Muthusamy }; 399a08862aSNagarathnam Muthusamy #endif 409a08862aSNagarathnam Muthusamy 419a08862aSNagarathnam Muthusamy struct vvar_data *vvar_data; 429a08862aSNagarathnam Muthusamy 439a08862aSNagarathnam Muthusamy #define SAVE_INSTR_SIZE 4 449a08862aSNagarathnam Muthusamy 459a08862aSNagarathnam Muthusamy /* 469a08862aSNagarathnam Muthusamy * Allocate pages for the vdso and vvar, and copy in the vdso text from the 479a08862aSNagarathnam Muthusamy * kernel image. 489a08862aSNagarathnam Muthusamy */ 499a08862aSNagarathnam Muthusamy int __init init_vdso_image(const struct vdso_image *image, 509a08862aSNagarathnam Muthusamy struct vm_special_mapping *vdso_mapping) 519a08862aSNagarathnam Muthusamy { 529a08862aSNagarathnam Muthusamy int i; 539a08862aSNagarathnam Muthusamy struct page *dp, **dpp = NULL; 549a08862aSNagarathnam Muthusamy int dnpages = 0; 559a08862aSNagarathnam Muthusamy struct page *cp, **cpp = NULL; 569a08862aSNagarathnam Muthusamy int cnpages = (image->size) / PAGE_SIZE; 579a08862aSNagarathnam Muthusamy 589a08862aSNagarathnam Muthusamy /* 599a08862aSNagarathnam Muthusamy * First, the vdso text. This is initialied data, an integral number of 609a08862aSNagarathnam Muthusamy * pages long. 619a08862aSNagarathnam Muthusamy */ 629a08862aSNagarathnam Muthusamy if (WARN_ON(image->size % PAGE_SIZE != 0)) 639a08862aSNagarathnam Muthusamy goto oom; 649a08862aSNagarathnam Muthusamy 659a08862aSNagarathnam Muthusamy cpp = kcalloc(cnpages, sizeof(struct page *), GFP_KERNEL); 669a08862aSNagarathnam Muthusamy vdso_mapping->pages = cpp; 679a08862aSNagarathnam Muthusamy 689a08862aSNagarathnam Muthusamy if (!cpp) 699a08862aSNagarathnam Muthusamy goto oom; 709a08862aSNagarathnam Muthusamy 719a08862aSNagarathnam Muthusamy if (vdso_fix_stick) { 729a08862aSNagarathnam Muthusamy /* 739a08862aSNagarathnam Muthusamy * If the system uses %tick instead of %stick, patch the VDSO 749a08862aSNagarathnam Muthusamy * with instruction reading %tick instead of %stick. 759a08862aSNagarathnam Muthusamy */ 769a08862aSNagarathnam Muthusamy unsigned int j, k = SAVE_INSTR_SIZE; 779a08862aSNagarathnam Muthusamy unsigned char *data = image->data; 789a08862aSNagarathnam Muthusamy 799a08862aSNagarathnam Muthusamy for (j = image->sym_vread_tick_patch_start; 809a08862aSNagarathnam Muthusamy j < image->sym_vread_tick_patch_end; j++) { 819a08862aSNagarathnam Muthusamy 829a08862aSNagarathnam Muthusamy data[image->sym_vread_tick + k] = data[j]; 839a08862aSNagarathnam Muthusamy k++; 849a08862aSNagarathnam Muthusamy } 859a08862aSNagarathnam Muthusamy } 869a08862aSNagarathnam Muthusamy 879a08862aSNagarathnam Muthusamy for (i = 0; i < cnpages; i++) { 889a08862aSNagarathnam Muthusamy cp = alloc_page(GFP_KERNEL); 899a08862aSNagarathnam Muthusamy if (!cp) 909a08862aSNagarathnam Muthusamy goto oom; 919a08862aSNagarathnam Muthusamy cpp[i] = cp; 929a08862aSNagarathnam Muthusamy copy_page(page_address(cp), image->data + i * PAGE_SIZE); 939a08862aSNagarathnam Muthusamy } 949a08862aSNagarathnam Muthusamy 959a08862aSNagarathnam Muthusamy /* 969a08862aSNagarathnam Muthusamy * Now the vvar page. This is uninitialized data. 979a08862aSNagarathnam Muthusamy */ 989a08862aSNagarathnam Muthusamy 999a08862aSNagarathnam Muthusamy if (vvar_data == NULL) { 1009a08862aSNagarathnam Muthusamy dnpages = (sizeof(struct vvar_data) / PAGE_SIZE) + 1; 1019a08862aSNagarathnam Muthusamy if (WARN_ON(dnpages != 1)) 1029a08862aSNagarathnam Muthusamy goto oom; 1039a08862aSNagarathnam Muthusamy dpp = kcalloc(dnpages, sizeof(struct page *), GFP_KERNEL); 1049a08862aSNagarathnam Muthusamy vvar_mapping.pages = dpp; 1059a08862aSNagarathnam Muthusamy 1069a08862aSNagarathnam Muthusamy if (!dpp) 1079a08862aSNagarathnam Muthusamy goto oom; 1089a08862aSNagarathnam Muthusamy 1099a08862aSNagarathnam Muthusamy dp = alloc_page(GFP_KERNEL); 1109a08862aSNagarathnam Muthusamy if (!dp) 1119a08862aSNagarathnam Muthusamy goto oom; 1129a08862aSNagarathnam Muthusamy 1139a08862aSNagarathnam Muthusamy dpp[0] = dp; 1149a08862aSNagarathnam Muthusamy vvar_data = page_address(dp); 1159a08862aSNagarathnam Muthusamy memset(vvar_data, 0, PAGE_SIZE); 1169a08862aSNagarathnam Muthusamy 1179a08862aSNagarathnam Muthusamy vvar_data->seq = 0; 1189a08862aSNagarathnam Muthusamy } 1199a08862aSNagarathnam Muthusamy 1209a08862aSNagarathnam Muthusamy return 0; 1219a08862aSNagarathnam Muthusamy oom: 1229a08862aSNagarathnam Muthusamy if (cpp != NULL) { 1239a08862aSNagarathnam Muthusamy for (i = 0; i < cnpages; i++) { 1249a08862aSNagarathnam Muthusamy if (cpp[i] != NULL) 1259a08862aSNagarathnam Muthusamy __free_page(cpp[i]); 1269a08862aSNagarathnam Muthusamy } 1279a08862aSNagarathnam Muthusamy kfree(cpp); 1289a08862aSNagarathnam Muthusamy vdso_mapping->pages = NULL; 1299a08862aSNagarathnam Muthusamy } 1309a08862aSNagarathnam Muthusamy 1319a08862aSNagarathnam Muthusamy if (dpp != NULL) { 1329a08862aSNagarathnam Muthusamy for (i = 0; i < dnpages; i++) { 1339a08862aSNagarathnam Muthusamy if (dpp[i] != NULL) 1349a08862aSNagarathnam Muthusamy __free_page(dpp[i]); 1359a08862aSNagarathnam Muthusamy } 1369a08862aSNagarathnam Muthusamy kfree(dpp); 1379a08862aSNagarathnam Muthusamy vvar_mapping.pages = NULL; 1389a08862aSNagarathnam Muthusamy } 1399a08862aSNagarathnam Muthusamy 1409a08862aSNagarathnam Muthusamy pr_warn("Cannot allocate vdso\n"); 1419a08862aSNagarathnam Muthusamy vdso_enabled = 0; 1429a08862aSNagarathnam Muthusamy return -ENOMEM; 1439a08862aSNagarathnam Muthusamy } 1449a08862aSNagarathnam Muthusamy 1459a08862aSNagarathnam Muthusamy static int __init init_vdso(void) 1469a08862aSNagarathnam Muthusamy { 1479a08862aSNagarathnam Muthusamy int err = 0; 1489a08862aSNagarathnam Muthusamy #ifdef CONFIG_SPARC64 1499a08862aSNagarathnam Muthusamy err = init_vdso_image(&vdso_image_64_builtin, &vdso_mapping64); 1509a08862aSNagarathnam Muthusamy if (err) 1519a08862aSNagarathnam Muthusamy return err; 1529a08862aSNagarathnam Muthusamy #endif 1539a08862aSNagarathnam Muthusamy 1549a08862aSNagarathnam Muthusamy #ifdef CONFIG_COMPAT 1559a08862aSNagarathnam Muthusamy err = init_vdso_image(&vdso_image_32_builtin, &vdso_mapping32); 1569a08862aSNagarathnam Muthusamy #endif 1579a08862aSNagarathnam Muthusamy return err; 1589a08862aSNagarathnam Muthusamy 1599a08862aSNagarathnam Muthusamy } 1609a08862aSNagarathnam Muthusamy subsys_initcall(init_vdso); 1619a08862aSNagarathnam Muthusamy 1629a08862aSNagarathnam Muthusamy struct linux_binprm; 1639a08862aSNagarathnam Muthusamy 1649a08862aSNagarathnam Muthusamy /* Shuffle the vdso up a bit, randomly. */ 1659a08862aSNagarathnam Muthusamy static unsigned long vdso_addr(unsigned long start, unsigned int len) 1669a08862aSNagarathnam Muthusamy { 1679a08862aSNagarathnam Muthusamy unsigned int offset; 1689a08862aSNagarathnam Muthusamy 1699a08862aSNagarathnam Muthusamy /* This loses some more bits than a modulo, but is cheaper */ 1709a08862aSNagarathnam Muthusamy offset = get_random_int() & (PTRS_PER_PTE - 1); 1719a08862aSNagarathnam Muthusamy return start + (offset << PAGE_SHIFT); 1729a08862aSNagarathnam Muthusamy } 1739a08862aSNagarathnam Muthusamy 1749a08862aSNagarathnam Muthusamy static int map_vdso(const struct vdso_image *image, 1759a08862aSNagarathnam Muthusamy struct vm_special_mapping *vdso_mapping) 1769a08862aSNagarathnam Muthusamy { 1779a08862aSNagarathnam Muthusamy struct mm_struct *mm = current->mm; 1789a08862aSNagarathnam Muthusamy struct vm_area_struct *vma; 1799a08862aSNagarathnam Muthusamy unsigned long text_start, addr = 0; 1809a08862aSNagarathnam Muthusamy int ret = 0; 1819a08862aSNagarathnam Muthusamy 1829a08862aSNagarathnam Muthusamy down_write(&mm->mmap_sem); 1839a08862aSNagarathnam Muthusamy 1849a08862aSNagarathnam Muthusamy /* 1859a08862aSNagarathnam Muthusamy * First, get an unmapped region: then randomize it, and make sure that 1869a08862aSNagarathnam Muthusamy * region is free. 1879a08862aSNagarathnam Muthusamy */ 1889a08862aSNagarathnam Muthusamy if (current->flags & PF_RANDOMIZE) { 1899a08862aSNagarathnam Muthusamy addr = get_unmapped_area(NULL, 0, 1909a08862aSNagarathnam Muthusamy image->size - image->sym_vvar_start, 1919a08862aSNagarathnam Muthusamy 0, 0); 1929a08862aSNagarathnam Muthusamy if (IS_ERR_VALUE(addr)) { 1939a08862aSNagarathnam Muthusamy ret = addr; 1949a08862aSNagarathnam Muthusamy goto up_fail; 1959a08862aSNagarathnam Muthusamy } 1969a08862aSNagarathnam Muthusamy addr = vdso_addr(addr, image->size - image->sym_vvar_start); 1979a08862aSNagarathnam Muthusamy } 1989a08862aSNagarathnam Muthusamy addr = get_unmapped_area(NULL, addr, 1999a08862aSNagarathnam Muthusamy image->size - image->sym_vvar_start, 0, 0); 2009a08862aSNagarathnam Muthusamy if (IS_ERR_VALUE(addr)) { 2019a08862aSNagarathnam Muthusamy ret = addr; 2029a08862aSNagarathnam Muthusamy goto up_fail; 2039a08862aSNagarathnam Muthusamy } 2049a08862aSNagarathnam Muthusamy 2059a08862aSNagarathnam Muthusamy text_start = addr - image->sym_vvar_start; 2069a08862aSNagarathnam Muthusamy current->mm->context.vdso = (void __user *)text_start; 2079a08862aSNagarathnam Muthusamy 2089a08862aSNagarathnam Muthusamy /* 2099a08862aSNagarathnam Muthusamy * MAYWRITE to allow gdb to COW and set breakpoints 2109a08862aSNagarathnam Muthusamy */ 2119a08862aSNagarathnam Muthusamy vma = _install_special_mapping(mm, 2129a08862aSNagarathnam Muthusamy text_start, 2139a08862aSNagarathnam Muthusamy image->size, 2149a08862aSNagarathnam Muthusamy VM_READ|VM_EXEC| 2159a08862aSNagarathnam Muthusamy VM_MAYREAD|VM_MAYWRITE|VM_MAYEXEC, 2169a08862aSNagarathnam Muthusamy vdso_mapping); 2179a08862aSNagarathnam Muthusamy 2189a08862aSNagarathnam Muthusamy if (IS_ERR(vma)) { 2199a08862aSNagarathnam Muthusamy ret = PTR_ERR(vma); 2209a08862aSNagarathnam Muthusamy goto up_fail; 2219a08862aSNagarathnam Muthusamy } 2229a08862aSNagarathnam Muthusamy 2239a08862aSNagarathnam Muthusamy vma = _install_special_mapping(mm, 2249a08862aSNagarathnam Muthusamy addr, 2259a08862aSNagarathnam Muthusamy -image->sym_vvar_start, 2269a08862aSNagarathnam Muthusamy VM_READ|VM_MAYREAD, 2279a08862aSNagarathnam Muthusamy &vvar_mapping); 2289a08862aSNagarathnam Muthusamy 2299a08862aSNagarathnam Muthusamy if (IS_ERR(vma)) { 2309a08862aSNagarathnam Muthusamy ret = PTR_ERR(vma); 2319a08862aSNagarathnam Muthusamy do_munmap(mm, text_start, image->size, NULL); 2329a08862aSNagarathnam Muthusamy } 2339a08862aSNagarathnam Muthusamy 2349a08862aSNagarathnam Muthusamy up_fail: 2359a08862aSNagarathnam Muthusamy if (ret) 2369a08862aSNagarathnam Muthusamy current->mm->context.vdso = NULL; 2379a08862aSNagarathnam Muthusamy 2389a08862aSNagarathnam Muthusamy up_write(&mm->mmap_sem); 2399a08862aSNagarathnam Muthusamy return ret; 2409a08862aSNagarathnam Muthusamy } 2419a08862aSNagarathnam Muthusamy 2429a08862aSNagarathnam Muthusamy int arch_setup_additional_pages(struct linux_binprm *bprm, int uses_interp) 2439a08862aSNagarathnam Muthusamy { 2449a08862aSNagarathnam Muthusamy 2459a08862aSNagarathnam Muthusamy if (!vdso_enabled) 2469a08862aSNagarathnam Muthusamy return 0; 2479a08862aSNagarathnam Muthusamy 2489a08862aSNagarathnam Muthusamy #if defined CONFIG_COMPAT 2499a08862aSNagarathnam Muthusamy if (!(is_32bit_task())) 2509a08862aSNagarathnam Muthusamy return map_vdso(&vdso_image_64_builtin, &vdso_mapping64); 2519a08862aSNagarathnam Muthusamy else 2529a08862aSNagarathnam Muthusamy return map_vdso(&vdso_image_32_builtin, &vdso_mapping32); 2539a08862aSNagarathnam Muthusamy #else 2549a08862aSNagarathnam Muthusamy return map_vdso(&vdso_image_64_builtin, &vdso_mapping64); 2559a08862aSNagarathnam Muthusamy #endif 2569a08862aSNagarathnam Muthusamy 2579a08862aSNagarathnam Muthusamy } 2589a08862aSNagarathnam Muthusamy 2599a08862aSNagarathnam Muthusamy static __init int vdso_setup(char *s) 2609a08862aSNagarathnam Muthusamy { 2619a08862aSNagarathnam Muthusamy int err; 2629a08862aSNagarathnam Muthusamy unsigned long val; 2639a08862aSNagarathnam Muthusamy 2649a08862aSNagarathnam Muthusamy err = kstrtoul(s, 10, &val); 265*62d6f3b7SDan Carpenter if (err) 2669a08862aSNagarathnam Muthusamy return err; 267*62d6f3b7SDan Carpenter vdso_enabled = val; 268*62d6f3b7SDan Carpenter return 0; 2699a08862aSNagarathnam Muthusamy } 2709a08862aSNagarathnam Muthusamy __setup("vdso=", vdso_setup); 271