xref: /linux/kernel/module/main.c (revision db59d74e5da144111fc133fb1bf72e6392bdb04e)
1 // SPDX-License-Identifier: GPL-2.0-or-later
2 /*
3  * Copyright (C) 2002 Richard Henderson
4  * Copyright (C) 2001 Rusty Russell, 2002, 2010 Rusty Russell IBM.
5  * Copyright (C) 2023 Luis Chamberlain <mcgrof@kernel.org>
6  */
7 
8 #define INCLUDE_VERMAGIC
9 
10 #include <linux/export.h>
11 #include <linux/extable.h>
12 #include <linux/moduleloader.h>
13 #include <linux/module_signature.h>
14 #include <linux/trace_events.h>
15 #include <linux/init.h>
16 #include <linux/kallsyms.h>
17 #include <linux/buildid.h>
18 #include <linux/fs.h>
19 #include <linux/kernel.h>
20 #include <linux/kernel_read_file.h>
21 #include <linux/kstrtox.h>
22 #include <linux/slab.h>
23 #include <linux/vmalloc.h>
24 #include <linux/elf.h>
25 #include <linux/seq_file.h>
26 #include <linux/syscalls.h>
27 #include <linux/fcntl.h>
28 #include <linux/rcupdate.h>
29 #include <linux/capability.h>
30 #include <linux/cpu.h>
31 #include <linux/moduleparam.h>
32 #include <linux/errno.h>
33 #include <linux/err.h>
34 #include <linux/vermagic.h>
35 #include <linux/notifier.h>
36 #include <linux/sched.h>
37 #include <linux/device.h>
38 #include <linux/string.h>
39 #include <linux/mutex.h>
40 #include <linux/rculist.h>
41 #include <linux/uaccess.h>
42 #include <asm/cacheflush.h>
43 #include <linux/set_memory.h>
44 #include <asm/mmu_context.h>
45 #include <linux/license.h>
46 #include <asm/sections.h>
47 #include <linux/tracepoint.h>
48 #include <linux/ftrace.h>
49 #include <linux/livepatch.h>
50 #include <linux/async.h>
51 #include <linux/percpu.h>
52 #include <linux/kmemleak.h>
53 #include <linux/jump_label.h>
54 #include <linux/pfn.h>
55 #include <linux/bsearch.h>
56 #include <linux/dynamic_debug.h>
57 #include <linux/audit.h>
58 #include <linux/cfi.h>
59 #include <linux/codetag.h>
60 #include <linux/debugfs.h>
61 #include <linux/execmem.h>
62 #include <uapi/linux/module.h>
63 #include "internal.h"
64 
65 #define CREATE_TRACE_POINTS
66 #include <trace/events/module.h>
67 
68 /*
69  * Mutex protects:
70  * 1) List of modules (also safely readable within RCU read section),
71  * 2) module_use links,
72  * 3) mod_tree.addr_min/mod_tree.addr_max.
73  * (delete and add uses RCU list operations).
74  */
75 DEFINE_MUTEX(module_mutex);
76 LIST_HEAD(modules);
77 
78 /* Work queue for freeing init sections in success case */
79 static void do_free_init(struct work_struct *w);
80 static DECLARE_WORK(init_free_wq, do_free_init);
81 static LLIST_HEAD(init_free_list);
82 
83 struct mod_tree_root mod_tree __cacheline_aligned = {
84 	.addr_min = -1UL,
85 };
86 
87 struct symsearch {
88 	const struct kernel_symbol *start, *stop;
89 	const u32 *crcs;
90 	enum mod_license license;
91 };
92 
93 /*
94  * Bounds of module memory, for speeding up __module_address.
95  * Protected by module_mutex.
96  */
97 static void __mod_update_bounds(enum mod_mem_type type __maybe_unused, void *base,
98 				unsigned int size, struct mod_tree_root *tree)
99 {
100 	unsigned long min = (unsigned long)base;
101 	unsigned long max = min + size;
102 
103 #ifdef CONFIG_ARCH_WANTS_MODULES_DATA_IN_VMALLOC
104 	if (mod_mem_type_is_core_data(type)) {
105 		if (min < tree->data_addr_min)
106 			tree->data_addr_min = min;
107 		if (max > tree->data_addr_max)
108 			tree->data_addr_max = max;
109 		return;
110 	}
111 #endif
112 	if (min < tree->addr_min)
113 		tree->addr_min = min;
114 	if (max > tree->addr_max)
115 		tree->addr_max = max;
116 }
117 
118 static void mod_update_bounds(struct module *mod)
119 {
120 	for_each_mod_mem_type(type) {
121 		struct module_memory *mod_mem = &mod->mem[type];
122 
123 		if (mod_mem->size)
124 			__mod_update_bounds(type, mod_mem->base, mod_mem->size, &mod_tree);
125 	}
126 }
127 
128 /* Block module loading/unloading? */
129 int modules_disabled;
130 core_param(nomodule, modules_disabled, bint, 0);
131 
132 /* Waiting for a module to finish initializing? */
133 static DECLARE_WAIT_QUEUE_HEAD(module_wq);
134 
135 static BLOCKING_NOTIFIER_HEAD(module_notify_list);
136 
137 int register_module_notifier(struct notifier_block *nb)
138 {
139 	return blocking_notifier_chain_register(&module_notify_list, nb);
140 }
141 EXPORT_SYMBOL(register_module_notifier);
142 
143 int unregister_module_notifier(struct notifier_block *nb)
144 {
145 	return blocking_notifier_chain_unregister(&module_notify_list, nb);
146 }
147 EXPORT_SYMBOL(unregister_module_notifier);
148 
149 /*
150  * We require a truly strong try_module_get(): 0 means success.
151  * Otherwise an error is returned due to ongoing or failed
152  * initialization etc.
153  */
154 static inline int strong_try_module_get(struct module *mod)
155 {
156 	BUG_ON(mod && mod->state == MODULE_STATE_UNFORMED);
157 	if (mod && mod->state == MODULE_STATE_COMING)
158 		return -EBUSY;
159 	if (try_module_get(mod))
160 		return 0;
161 	else
162 		return -ENOENT;
163 }
164 
165 static inline void add_taint_module(struct module *mod, unsigned flag,
166 				    enum lockdep_ok lockdep_ok)
167 {
168 	add_taint(flag, lockdep_ok);
169 	set_bit(flag, &mod->taints);
170 }
171 
172 /*
173  * Like strncmp(), except s/-/_/g as per scripts/Makefile.lib:name-fix-token rule.
174  */
175 static int mod_strncmp(const char *str_a, const char *str_b, size_t n)
176 {
177 	for (int i = 0; i < n; i++) {
178 		char a = str_a[i];
179 		char b = str_b[i];
180 		int d;
181 
182 		if (a == '-') a = '_';
183 		if (b == '-') b = '_';
184 
185 		d = a - b;
186 		if (d)
187 			return d;
188 
189 		if (!a)
190 			break;
191 	}
192 
193 	return 0;
194 }
195 
196 /*
197  * A thread that wants to hold a reference to a module only while it
198  * is running can call this to safely exit.
199  */
200 void __noreturn __module_put_and_kthread_exit(struct module *mod, long code)
201 {
202 	module_put(mod);
203 	kthread_exit(code);
204 }
205 EXPORT_SYMBOL(__module_put_and_kthread_exit);
206 
207 /* Find a module section: 0 means not found. */
208 static unsigned int find_sec(const struct load_info *info, const char *name)
209 {
210 	unsigned int i;
211 
212 	for (i = 1; i < info->hdr->e_shnum; i++) {
213 		Elf_Shdr *shdr = &info->sechdrs[i];
214 		/* Alloc bit cleared means "ignore it." */
215 		if ((shdr->sh_flags & SHF_ALLOC)
216 		    && strcmp(info->secstrings + shdr->sh_name, name) == 0)
217 			return i;
218 	}
219 	return 0;
220 }
221 
222 /**
223  * find_any_unique_sec() - Find a unique section index by name
224  * @info: Load info for the module to scan
225  * @name: Name of the section we're looking for
226  *
227  * Locates a unique section by name. Ignores SHF_ALLOC.
228  *
229  * Return: Section index if found uniquely, zero if absent, negative count
230  *         of total instances if multiple were found.
231  */
232 static int find_any_unique_sec(const struct load_info *info, const char *name)
233 {
234 	unsigned int idx;
235 	unsigned int count = 0;
236 	int i;
237 
238 	for (i = 1; i < info->hdr->e_shnum; i++) {
239 		if (strcmp(info->secstrings + info->sechdrs[i].sh_name,
240 			   name) == 0) {
241 			count++;
242 			idx = i;
243 		}
244 	}
245 	if (count == 1) {
246 		return idx;
247 	} else if (count == 0) {
248 		return 0;
249 	} else {
250 		return -count;
251 	}
252 }
253 
254 /* Find a module section, or NULL. */
255 static void *section_addr(const struct load_info *info, const char *name)
256 {
257 	/* Section 0 has sh_addr 0. */
258 	return (void *)info->sechdrs[find_sec(info, name)].sh_addr;
259 }
260 
261 /* Find a module section, or NULL.  Fill in number of "objects" in section. */
262 static void *section_objs(const struct load_info *info,
263 			  const char *name,
264 			  size_t object_size,
265 			  unsigned int *num)
266 {
267 	unsigned int sec = find_sec(info, name);
268 
269 	/* Section 0 has sh_addr 0 and sh_size 0. */
270 	*num = info->sechdrs[sec].sh_size / object_size;
271 	return (void *)info->sechdrs[sec].sh_addr;
272 }
273 
274 /* Find a module section: 0 means not found. Ignores SHF_ALLOC flag. */
275 static unsigned int find_any_sec(const struct load_info *info, const char *name)
276 {
277 	unsigned int i;
278 
279 	for (i = 1; i < info->hdr->e_shnum; i++) {
280 		Elf_Shdr *shdr = &info->sechdrs[i];
281 		if (strcmp(info->secstrings + shdr->sh_name, name) == 0)
282 			return i;
283 	}
284 	return 0;
285 }
286 
287 /*
288  * Find a module section, or NULL. Fill in number of "objects" in section.
289  * Ignores SHF_ALLOC flag.
290  */
291 static __maybe_unused void *any_section_objs(const struct load_info *info,
292 					     const char *name,
293 					     size_t object_size,
294 					     unsigned int *num)
295 {
296 	unsigned int sec = find_any_sec(info, name);
297 
298 	/* Section 0 has sh_addr 0 and sh_size 0. */
299 	*num = info->sechdrs[sec].sh_size / object_size;
300 	return (void *)info->sechdrs[sec].sh_addr;
301 }
302 
303 #ifndef CONFIG_MODVERSIONS
304 #define symversion(base, idx) NULL
305 #else
306 #define symversion(base, idx) ((base != NULL) ? ((base) + (idx)) : NULL)
307 #endif
308 
309 static const char *kernel_symbol_name(const struct kernel_symbol *sym)
310 {
311 #ifdef CONFIG_HAVE_ARCH_PREL32_RELOCATIONS
312 	return offset_to_ptr(&sym->name_offset);
313 #else
314 	return sym->name;
315 #endif
316 }
317 
318 static const char *kernel_symbol_namespace(const struct kernel_symbol *sym)
319 {
320 #ifdef CONFIG_HAVE_ARCH_PREL32_RELOCATIONS
321 	if (!sym->namespace_offset)
322 		return NULL;
323 	return offset_to_ptr(&sym->namespace_offset);
324 #else
325 	return sym->namespace;
326 #endif
327 }
328 
329 int cmp_name(const void *name, const void *sym)
330 {
331 	return strcmp(name, kernel_symbol_name(sym));
332 }
333 
334 static bool find_exported_symbol_in_section(const struct symsearch *syms,
335 					    struct module *owner,
336 					    struct find_symbol_arg *fsa)
337 {
338 	struct kernel_symbol *sym;
339 
340 	if (!fsa->gplok && syms->license == GPL_ONLY)
341 		return false;
342 
343 	sym = bsearch(fsa->name, syms->start, syms->stop - syms->start,
344 			sizeof(struct kernel_symbol), cmp_name);
345 	if (!sym)
346 		return false;
347 
348 	fsa->owner = owner;
349 	fsa->crc = symversion(syms->crcs, sym - syms->start);
350 	fsa->sym = sym;
351 	fsa->license = syms->license;
352 
353 	return true;
354 }
355 
356 /*
357  * Find an exported symbol and return it, along with, (optional) crc and
358  * (optional) module which owns it. Needs RCU or module_mutex.
359  */
360 bool find_symbol(struct find_symbol_arg *fsa)
361 {
362 	static const struct symsearch arr[] = {
363 		{ __start___ksymtab, __stop___ksymtab, __start___kcrctab,
364 		  NOT_GPL_ONLY },
365 		{ __start___ksymtab_gpl, __stop___ksymtab_gpl,
366 		  __start___kcrctab_gpl,
367 		  GPL_ONLY },
368 	};
369 	struct module *mod;
370 	unsigned int i;
371 
372 	for (i = 0; i < ARRAY_SIZE(arr); i++)
373 		if (find_exported_symbol_in_section(&arr[i], NULL, fsa))
374 			return true;
375 
376 	list_for_each_entry_rcu(mod, &modules, list,
377 				lockdep_is_held(&module_mutex)) {
378 		struct symsearch arr[] = {
379 			{ mod->syms, mod->syms + mod->num_syms, mod->crcs,
380 			  NOT_GPL_ONLY },
381 			{ mod->gpl_syms, mod->gpl_syms + mod->num_gpl_syms,
382 			  mod->gpl_crcs,
383 			  GPL_ONLY },
384 		};
385 
386 		if (mod->state == MODULE_STATE_UNFORMED)
387 			continue;
388 
389 		for (i = 0; i < ARRAY_SIZE(arr); i++)
390 			if (find_exported_symbol_in_section(&arr[i], mod, fsa))
391 				return true;
392 	}
393 
394 	pr_debug("Failed to find symbol %s\n", fsa->name);
395 	return false;
396 }
397 
398 /*
399  * Search for module by name: must hold module_mutex (or RCU for read-only
400  * access).
401  */
402 struct module *find_module_all(const char *name, size_t len,
403 			       bool even_unformed)
404 {
405 	struct module *mod;
406 
407 	list_for_each_entry_rcu(mod, &modules, list,
408 				lockdep_is_held(&module_mutex)) {
409 		if (!even_unformed && mod->state == MODULE_STATE_UNFORMED)
410 			continue;
411 		if (strlen(mod->name) == len && !memcmp(mod->name, name, len))
412 			return mod;
413 	}
414 	return NULL;
415 }
416 
417 struct module *find_module(const char *name)
418 {
419 	return find_module_all(name, strlen(name), false);
420 }
421 
422 #ifdef CONFIG_SMP
423 
424 static inline void __percpu *mod_percpu(struct module *mod)
425 {
426 	return mod->percpu;
427 }
428 
429 static int percpu_modalloc(struct module *mod, struct load_info *info)
430 {
431 	Elf_Shdr *pcpusec = &info->sechdrs[info->index.pcpu];
432 	unsigned long align = pcpusec->sh_addralign;
433 
434 	if (!pcpusec->sh_size)
435 		return 0;
436 
437 	if (align > PAGE_SIZE) {
438 		pr_warn("%s: per-cpu alignment %li > %li\n",
439 			mod->name, align, PAGE_SIZE);
440 		align = PAGE_SIZE;
441 	}
442 
443 	mod->percpu = __alloc_reserved_percpu(pcpusec->sh_size, align);
444 	if (!mod->percpu) {
445 		pr_warn("%s: Could not allocate %lu bytes percpu data\n",
446 			mod->name, (unsigned long)pcpusec->sh_size);
447 		return -ENOMEM;
448 	}
449 	mod->percpu_size = pcpusec->sh_size;
450 	return 0;
451 }
452 
453 static void percpu_modfree(struct module *mod)
454 {
455 	free_percpu(mod->percpu);
456 }
457 
458 static unsigned int find_pcpusec(struct load_info *info)
459 {
460 	return find_sec(info, ".data..percpu");
461 }
462 
463 static void percpu_modcopy(struct module *mod,
464 			   const void *from, unsigned long size)
465 {
466 	int cpu;
467 
468 	for_each_possible_cpu(cpu)
469 		memcpy(per_cpu_ptr(mod->percpu, cpu), from, size);
470 }
471 
472 bool __is_module_percpu_address(unsigned long addr, unsigned long *can_addr)
473 {
474 	struct module *mod;
475 	unsigned int cpu;
476 
477 	guard(rcu)();
478 	list_for_each_entry_rcu(mod, &modules, list) {
479 		if (mod->state == MODULE_STATE_UNFORMED)
480 			continue;
481 		if (!mod->percpu_size)
482 			continue;
483 		for_each_possible_cpu(cpu) {
484 			void *start = per_cpu_ptr(mod->percpu, cpu);
485 			void *va = (void *)addr;
486 
487 			if (va >= start && va < start + mod->percpu_size) {
488 				if (can_addr) {
489 					*can_addr = (unsigned long) (va - start);
490 					*can_addr += (unsigned long)
491 						per_cpu_ptr(mod->percpu,
492 							    get_boot_cpu_id());
493 				}
494 				return true;
495 			}
496 		}
497 	}
498 	return false;
499 }
500 
501 /**
502  * is_module_percpu_address() - test whether address is from module static percpu
503  * @addr: address to test
504  *
505  * Test whether @addr belongs to module static percpu area.
506  *
507  * Return: %true if @addr is from module static percpu area
508  */
509 bool is_module_percpu_address(unsigned long addr)
510 {
511 	return __is_module_percpu_address(addr, NULL);
512 }
513 
514 #else /* ... !CONFIG_SMP */
515 
516 static inline void __percpu *mod_percpu(struct module *mod)
517 {
518 	return NULL;
519 }
520 static int percpu_modalloc(struct module *mod, struct load_info *info)
521 {
522 	/* UP modules shouldn't have this section: ENOMEM isn't quite right */
523 	if (info->sechdrs[info->index.pcpu].sh_size != 0)
524 		return -ENOMEM;
525 	return 0;
526 }
527 static inline void percpu_modfree(struct module *mod)
528 {
529 }
530 static unsigned int find_pcpusec(struct load_info *info)
531 {
532 	return 0;
533 }
534 static inline void percpu_modcopy(struct module *mod,
535 				  const void *from, unsigned long size)
536 {
537 	/* pcpusec should be 0, and size of that section should be 0. */
538 	BUG_ON(size != 0);
539 }
540 bool is_module_percpu_address(unsigned long addr)
541 {
542 	return false;
543 }
544 
545 bool __is_module_percpu_address(unsigned long addr, unsigned long *can_addr)
546 {
547 	return false;
548 }
549 
550 #endif /* CONFIG_SMP */
551 
552 #define MODINFO_ATTR(field)	\
553 static void setup_modinfo_##field(struct module *mod, const char *s)  \
554 {                                                                     \
555 	mod->field = kstrdup(s, GFP_KERNEL);                          \
556 }                                                                     \
557 static ssize_t show_modinfo_##field(const struct module_attribute *mattr, \
558 			struct module_kobject *mk, char *buffer)      \
559 {                                                                     \
560 	return scnprintf(buffer, PAGE_SIZE, "%s\n", mk->mod->field);  \
561 }                                                                     \
562 static int modinfo_##field##_exists(struct module *mod)               \
563 {                                                                     \
564 	return mod->field != NULL;                                    \
565 }                                                                     \
566 static void free_modinfo_##field(struct module *mod)                  \
567 {                                                                     \
568 	kfree(mod->field);                                            \
569 	mod->field = NULL;                                            \
570 }                                                                     \
571 static const struct module_attribute modinfo_##field = {              \
572 	.attr = { .name = __stringify(field), .mode = 0444 },         \
573 	.show = show_modinfo_##field,                                 \
574 	.setup = setup_modinfo_##field,                               \
575 	.test = modinfo_##field##_exists,                             \
576 	.free = free_modinfo_##field,                                 \
577 };
578 
579 MODINFO_ATTR(version);
580 MODINFO_ATTR(srcversion);
581 
582 static struct {
583 	char name[MODULE_NAME_LEN + 1];
584 	char taints[MODULE_FLAGS_BUF_SIZE];
585 } last_unloaded_module;
586 
587 #ifdef CONFIG_MODULE_UNLOAD
588 
589 EXPORT_TRACEPOINT_SYMBOL(module_get);
590 
591 /* MODULE_REF_BASE is the base reference count by kmodule loader. */
592 #define MODULE_REF_BASE	1
593 
594 /* Init the unload section of the module. */
595 static int module_unload_init(struct module *mod)
596 {
597 	/*
598 	 * Initialize reference counter to MODULE_REF_BASE.
599 	 * refcnt == 0 means module is going.
600 	 */
601 	atomic_set(&mod->refcnt, MODULE_REF_BASE);
602 
603 	INIT_LIST_HEAD(&mod->source_list);
604 	INIT_LIST_HEAD(&mod->target_list);
605 
606 	/* Hold reference count during initialization. */
607 	atomic_inc(&mod->refcnt);
608 
609 	return 0;
610 }
611 
612 /* Does a already use b? */
613 static int already_uses(struct module *a, struct module *b)
614 {
615 	struct module_use *use;
616 
617 	list_for_each_entry(use, &b->source_list, source_list) {
618 		if (use->source == a)
619 			return 1;
620 	}
621 	pr_debug("%s does not use %s!\n", a->name, b->name);
622 	return 0;
623 }
624 
625 /*
626  * Module a uses b
627  *  - we add 'a' as a "source", 'b' as a "target" of module use
628  *  - the module_use is added to the list of 'b' sources (so
629  *    'b' can walk the list to see who sourced them), and of 'a'
630  *    targets (so 'a' can see what modules it targets).
631  */
632 static int add_module_usage(struct module *a, struct module *b)
633 {
634 	struct module_use *use;
635 
636 	pr_debug("Allocating new usage for %s.\n", a->name);
637 	use = kmalloc(sizeof(*use), GFP_ATOMIC);
638 	if (!use)
639 		return -ENOMEM;
640 
641 	use->source = a;
642 	use->target = b;
643 	list_add(&use->source_list, &b->source_list);
644 	list_add(&use->target_list, &a->target_list);
645 	return 0;
646 }
647 
648 /* Module a uses b: caller needs module_mutex() */
649 static int ref_module(struct module *a, struct module *b)
650 {
651 	int err;
652 
653 	if (b == NULL || already_uses(a, b))
654 		return 0;
655 
656 	/* If module isn't available, we fail. */
657 	err = strong_try_module_get(b);
658 	if (err)
659 		return err;
660 
661 	err = add_module_usage(a, b);
662 	if (err) {
663 		module_put(b);
664 		return err;
665 	}
666 	return 0;
667 }
668 
669 /* Clear the unload stuff of the module. */
670 static void module_unload_free(struct module *mod)
671 {
672 	struct module_use *use, *tmp;
673 
674 	mutex_lock(&module_mutex);
675 	list_for_each_entry_safe(use, tmp, &mod->target_list, target_list) {
676 		struct module *i = use->target;
677 		pr_debug("%s unusing %s\n", mod->name, i->name);
678 		module_put(i);
679 		list_del(&use->source_list);
680 		list_del(&use->target_list);
681 		kfree(use);
682 	}
683 	mutex_unlock(&module_mutex);
684 }
685 
686 #ifdef CONFIG_MODULE_FORCE_UNLOAD
687 static inline int try_force_unload(unsigned int flags)
688 {
689 	int ret = (flags & O_TRUNC);
690 	if (ret)
691 		add_taint(TAINT_FORCED_RMMOD, LOCKDEP_NOW_UNRELIABLE);
692 	return ret;
693 }
694 #else
695 static inline int try_force_unload(unsigned int flags)
696 {
697 	return 0;
698 }
699 #endif /* CONFIG_MODULE_FORCE_UNLOAD */
700 
701 /* Try to release refcount of module, 0 means success. */
702 static int try_release_module_ref(struct module *mod)
703 {
704 	int ret;
705 
706 	/* Try to decrement refcnt which we set at loading */
707 	ret = atomic_sub_return(MODULE_REF_BASE, &mod->refcnt);
708 	BUG_ON(ret < 0);
709 	if (ret)
710 		/* Someone can put this right now, recover with checking */
711 		ret = atomic_add_unless(&mod->refcnt, MODULE_REF_BASE, 0);
712 
713 	return ret;
714 }
715 
716 static int try_stop_module(struct module *mod, int flags, int *forced)
717 {
718 	/* If it's not unused, quit unless we're forcing. */
719 	if (try_release_module_ref(mod) != 0) {
720 		*forced = try_force_unload(flags);
721 		if (!(*forced))
722 			return -EWOULDBLOCK;
723 	}
724 
725 	/* Mark it as dying. */
726 	mod->state = MODULE_STATE_GOING;
727 
728 	return 0;
729 }
730 
731 /**
732  * module_refcount() - return the refcount or -1 if unloading
733  * @mod:	the module we're checking
734  *
735  * Return:
736  *	-1 if the module is in the process of unloading
737  *	otherwise the number of references in the kernel to the module
738  */
739 int module_refcount(struct module *mod)
740 {
741 	return atomic_read(&mod->refcnt) - MODULE_REF_BASE;
742 }
743 EXPORT_SYMBOL(module_refcount);
744 
745 /* This exists whether we can unload or not */
746 static void free_module(struct module *mod);
747 
748 SYSCALL_DEFINE2(delete_module, const char __user *, name_user,
749 		unsigned int, flags)
750 {
751 	struct module *mod;
752 	char name[MODULE_NAME_LEN];
753 	char buf[MODULE_FLAGS_BUF_SIZE];
754 	int ret, forced = 0;
755 
756 	if (!capable(CAP_SYS_MODULE) || modules_disabled)
757 		return -EPERM;
758 
759 	if (strncpy_from_user(name, name_user, MODULE_NAME_LEN-1) < 0)
760 		return -EFAULT;
761 	name[MODULE_NAME_LEN-1] = '\0';
762 
763 	audit_log_kern_module(name);
764 
765 	if (mutex_lock_interruptible(&module_mutex) != 0)
766 		return -EINTR;
767 
768 	mod = find_module(name);
769 	if (!mod) {
770 		ret = -ENOENT;
771 		goto out;
772 	}
773 
774 	if (!list_empty(&mod->source_list)) {
775 		/* Other modules depend on us: get rid of them first. */
776 		ret = -EWOULDBLOCK;
777 		goto out;
778 	}
779 
780 	/* Doing init or already dying? */
781 	if (mod->state != MODULE_STATE_LIVE) {
782 		/* FIXME: if (force), slam module count damn the torpedoes */
783 		pr_debug("%s already dying\n", mod->name);
784 		ret = -EBUSY;
785 		goto out;
786 	}
787 
788 	/* If it has an init func, it must have an exit func to unload */
789 	if (mod->init && !mod->exit) {
790 		forced = try_force_unload(flags);
791 		if (!forced) {
792 			/* This module can't be removed */
793 			ret = -EBUSY;
794 			goto out;
795 		}
796 	}
797 
798 	ret = try_stop_module(mod, flags, &forced);
799 	if (ret != 0)
800 		goto out;
801 
802 	mutex_unlock(&module_mutex);
803 	/* Final destruction now no one is using it. */
804 	if (mod->exit != NULL)
805 		mod->exit();
806 	blocking_notifier_call_chain(&module_notify_list,
807 				     MODULE_STATE_GOING, mod);
808 	klp_module_going(mod);
809 	ftrace_release_mod(mod);
810 
811 	async_synchronize_full();
812 
813 	/* Store the name and taints of the last unloaded module for diagnostic purposes */
814 	strscpy(last_unloaded_module.name, mod->name);
815 	strscpy(last_unloaded_module.taints, module_flags(mod, buf, false));
816 
817 	free_module(mod);
818 	/* someone could wait for the module in add_unformed_module() */
819 	wake_up_all(&module_wq);
820 	return 0;
821 out:
822 	mutex_unlock(&module_mutex);
823 	return ret;
824 }
825 
826 void __symbol_put(const char *symbol)
827 {
828 	struct find_symbol_arg fsa = {
829 		.name	= symbol,
830 		.gplok	= true,
831 	};
832 
833 	guard(rcu)();
834 	BUG_ON(!find_symbol(&fsa));
835 	module_put(fsa.owner);
836 }
837 EXPORT_SYMBOL(__symbol_put);
838 
839 /* Note this assumes addr is a function, which it currently always is. */
840 void symbol_put_addr(void *addr)
841 {
842 	struct module *modaddr;
843 	unsigned long a = (unsigned long)dereference_function_descriptor(addr);
844 
845 	if (core_kernel_text(a))
846 		return;
847 
848 	/*
849 	 * Even though we hold a reference on the module; we still need to
850 	 * RCU read section in order to safely traverse the data structure.
851 	 */
852 	guard(rcu)();
853 	modaddr = __module_text_address(a);
854 	BUG_ON(!modaddr);
855 	module_put(modaddr);
856 }
857 EXPORT_SYMBOL_GPL(symbol_put_addr);
858 
859 static ssize_t show_refcnt(const struct module_attribute *mattr,
860 			   struct module_kobject *mk, char *buffer)
861 {
862 	return sprintf(buffer, "%i\n", module_refcount(mk->mod));
863 }
864 
865 static const struct module_attribute modinfo_refcnt =
866 	__ATTR(refcnt, 0444, show_refcnt, NULL);
867 
868 void __module_get(struct module *module)
869 {
870 	if (module) {
871 		atomic_inc(&module->refcnt);
872 		trace_module_get(module, _RET_IP_);
873 	}
874 }
875 EXPORT_SYMBOL(__module_get);
876 
877 bool try_module_get(struct module *module)
878 {
879 	bool ret = true;
880 
881 	if (module) {
882 		/* Note: here, we can fail to get a reference */
883 		if (likely(module_is_live(module) &&
884 			   atomic_inc_not_zero(&module->refcnt) != 0))
885 			trace_module_get(module, _RET_IP_);
886 		else
887 			ret = false;
888 	}
889 	return ret;
890 }
891 EXPORT_SYMBOL(try_module_get);
892 
893 void module_put(struct module *module)
894 {
895 	int ret;
896 
897 	if (module) {
898 		ret = atomic_dec_if_positive(&module->refcnt);
899 		WARN_ON(ret < 0);	/* Failed to put refcount */
900 		trace_module_put(module, _RET_IP_);
901 	}
902 }
903 EXPORT_SYMBOL(module_put);
904 
905 #else /* !CONFIG_MODULE_UNLOAD */
906 static inline void module_unload_free(struct module *mod)
907 {
908 }
909 
910 static int ref_module(struct module *a, struct module *b)
911 {
912 	return strong_try_module_get(b);
913 }
914 
915 static inline int module_unload_init(struct module *mod)
916 {
917 	return 0;
918 }
919 #endif /* CONFIG_MODULE_UNLOAD */
920 
921 size_t module_flags_taint(unsigned long taints, char *buf)
922 {
923 	size_t l = 0;
924 	int i;
925 
926 	for (i = 0; i < TAINT_FLAGS_COUNT; i++) {
927 		if (taint_flags[i].module && test_bit(i, &taints))
928 			buf[l++] = taint_flags[i].c_true;
929 	}
930 
931 	return l;
932 }
933 
934 static ssize_t show_initstate(const struct module_attribute *mattr,
935 			      struct module_kobject *mk, char *buffer)
936 {
937 	const char *state = "unknown";
938 
939 	switch (mk->mod->state) {
940 	case MODULE_STATE_LIVE:
941 		state = "live";
942 		break;
943 	case MODULE_STATE_COMING:
944 		state = "coming";
945 		break;
946 	case MODULE_STATE_GOING:
947 		state = "going";
948 		break;
949 	default:
950 		BUG();
951 	}
952 	return sprintf(buffer, "%s\n", state);
953 }
954 
955 static const struct module_attribute modinfo_initstate =
956 	__ATTR(initstate, 0444, show_initstate, NULL);
957 
958 static ssize_t store_uevent(const struct module_attribute *mattr,
959 			    struct module_kobject *mk,
960 			    const char *buffer, size_t count)
961 {
962 	int rc;
963 
964 	rc = kobject_synth_uevent(&mk->kobj, buffer, count);
965 	return rc ? rc : count;
966 }
967 
968 const struct module_attribute module_uevent =
969 	__ATTR(uevent, 0200, NULL, store_uevent);
970 
971 static ssize_t show_coresize(const struct module_attribute *mattr,
972 			     struct module_kobject *mk, char *buffer)
973 {
974 	unsigned int size = mk->mod->mem[MOD_TEXT].size;
975 
976 	if (!IS_ENABLED(CONFIG_ARCH_WANTS_MODULES_DATA_IN_VMALLOC)) {
977 		for_class_mod_mem_type(type, core_data)
978 			size += mk->mod->mem[type].size;
979 	}
980 	return sprintf(buffer, "%u\n", size);
981 }
982 
983 static const struct module_attribute modinfo_coresize =
984 	__ATTR(coresize, 0444, show_coresize, NULL);
985 
986 #ifdef CONFIG_ARCH_WANTS_MODULES_DATA_IN_VMALLOC
987 static ssize_t show_datasize(const struct module_attribute *mattr,
988 			     struct module_kobject *mk, char *buffer)
989 {
990 	unsigned int size = 0;
991 
992 	for_class_mod_mem_type(type, core_data)
993 		size += mk->mod->mem[type].size;
994 	return sprintf(buffer, "%u\n", size);
995 }
996 
997 static const struct module_attribute modinfo_datasize =
998 	__ATTR(datasize, 0444, show_datasize, NULL);
999 #endif
1000 
1001 static ssize_t show_initsize(const struct module_attribute *mattr,
1002 			     struct module_kobject *mk, char *buffer)
1003 {
1004 	unsigned int size = 0;
1005 
1006 	for_class_mod_mem_type(type, init)
1007 		size += mk->mod->mem[type].size;
1008 	return sprintf(buffer, "%u\n", size);
1009 }
1010 
1011 static const struct module_attribute modinfo_initsize =
1012 	__ATTR(initsize, 0444, show_initsize, NULL);
1013 
1014 static ssize_t show_taint(const struct module_attribute *mattr,
1015 			  struct module_kobject *mk, char *buffer)
1016 {
1017 	size_t l;
1018 
1019 	l = module_flags_taint(mk->mod->taints, buffer);
1020 	buffer[l++] = '\n';
1021 	return l;
1022 }
1023 
1024 static const struct module_attribute modinfo_taint =
1025 	__ATTR(taint, 0444, show_taint, NULL);
1026 
1027 const struct module_attribute *const modinfo_attrs[] = {
1028 	&module_uevent,
1029 	&modinfo_version,
1030 	&modinfo_srcversion,
1031 	&modinfo_initstate,
1032 	&modinfo_coresize,
1033 #ifdef CONFIG_ARCH_WANTS_MODULES_DATA_IN_VMALLOC
1034 	&modinfo_datasize,
1035 #endif
1036 	&modinfo_initsize,
1037 	&modinfo_taint,
1038 #ifdef CONFIG_MODULE_UNLOAD
1039 	&modinfo_refcnt,
1040 #endif
1041 	NULL,
1042 };
1043 
1044 const size_t modinfo_attrs_count = ARRAY_SIZE(modinfo_attrs);
1045 
1046 static const char vermagic[] = VERMAGIC_STRING;
1047 
1048 int try_to_force_load(struct module *mod, const char *reason)
1049 {
1050 #ifdef CONFIG_MODULE_FORCE_LOAD
1051 	if (!test_taint(TAINT_FORCED_MODULE))
1052 		pr_warn("%s: %s: kernel tainted.\n", mod->name, reason);
1053 	add_taint_module(mod, TAINT_FORCED_MODULE, LOCKDEP_NOW_UNRELIABLE);
1054 	return 0;
1055 #else
1056 	return -ENOEXEC;
1057 #endif
1058 }
1059 
1060 /* Parse tag=value strings from .modinfo section */
1061 char *module_next_tag_pair(char *string, unsigned long *secsize)
1062 {
1063 	/* Skip non-zero chars */
1064 	while (string[0]) {
1065 		string++;
1066 		if ((*secsize)-- <= 1)
1067 			return NULL;
1068 	}
1069 
1070 	/* Skip any zero padding. */
1071 	while (!string[0]) {
1072 		string++;
1073 		if ((*secsize)-- <= 1)
1074 			return NULL;
1075 	}
1076 	return string;
1077 }
1078 
1079 static char *get_next_modinfo(const struct load_info *info, const char *tag,
1080 			      char *prev)
1081 {
1082 	char *p;
1083 	unsigned int taglen = strlen(tag);
1084 	Elf_Shdr *infosec = &info->sechdrs[info->index.info];
1085 	unsigned long size = infosec->sh_size;
1086 
1087 	/*
1088 	 * get_modinfo() calls made before rewrite_section_headers()
1089 	 * must use sh_offset, as sh_addr isn't set!
1090 	 */
1091 	char *modinfo = (char *)info->hdr + infosec->sh_offset;
1092 
1093 	if (prev) {
1094 		size -= prev - modinfo;
1095 		modinfo = module_next_tag_pair(prev, &size);
1096 	}
1097 
1098 	for (p = modinfo; p; p = module_next_tag_pair(p, &size)) {
1099 		if (strncmp(p, tag, taglen) == 0 && p[taglen] == '=')
1100 			return p + taglen + 1;
1101 	}
1102 	return NULL;
1103 }
1104 
1105 static char *get_modinfo(const struct load_info *info, const char *tag)
1106 {
1107 	return get_next_modinfo(info, tag, NULL);
1108 }
1109 
1110 /**
1111  * verify_module_namespace() - does @modname have access to this symbol's @namespace
1112  * @namespace: export symbol namespace
1113  * @modname: module name
1114  *
1115  * If @namespace is prefixed with "module:" to indicate it is a module namespace
1116  * then test if @modname matches any of the comma separated patterns.
1117  *
1118  * The patterns only support tail-glob.
1119  */
1120 static bool verify_module_namespace(const char *namespace, const char *modname)
1121 {
1122 	size_t len, modlen = strlen(modname);
1123 	const char *prefix = "module:";
1124 	const char *sep;
1125 	bool glob;
1126 
1127 	if (!strstarts(namespace, prefix))
1128 		return false;
1129 
1130 	for (namespace += strlen(prefix); *namespace; namespace = sep) {
1131 		sep = strchrnul(namespace, ',');
1132 		len = sep - namespace;
1133 
1134 		glob = false;
1135 		if (sep[-1] == '*') {
1136 			len--;
1137 			glob = true;
1138 		}
1139 
1140 		if (*sep)
1141 			sep++;
1142 
1143 		if (mod_strncmp(namespace, modname, len) == 0 && (glob || len == modlen))
1144 			return true;
1145 	}
1146 
1147 	return false;
1148 }
1149 
1150 static int verify_namespace_is_imported(const struct load_info *info,
1151 					const struct kernel_symbol *sym,
1152 					struct module *mod)
1153 {
1154 	const char *namespace;
1155 	char *imported_namespace;
1156 
1157 	namespace = kernel_symbol_namespace(sym);
1158 	if (namespace && namespace[0]) {
1159 
1160 		if (verify_module_namespace(namespace, mod->name))
1161 			return 0;
1162 
1163 		for_each_modinfo_entry(imported_namespace, info, "import_ns") {
1164 			if (strcmp(namespace, imported_namespace) == 0)
1165 				return 0;
1166 		}
1167 #ifdef CONFIG_MODULE_ALLOW_MISSING_NAMESPACE_IMPORTS
1168 		pr_warn(
1169 #else
1170 		pr_err(
1171 #endif
1172 			"%s: module uses symbol (%s) from namespace %s, but does not import it.\n",
1173 			mod->name, kernel_symbol_name(sym), namespace);
1174 #ifndef CONFIG_MODULE_ALLOW_MISSING_NAMESPACE_IMPORTS
1175 		return -EINVAL;
1176 #endif
1177 	}
1178 	return 0;
1179 }
1180 
1181 static bool inherit_taint(struct module *mod, struct module *owner, const char *name)
1182 {
1183 	if (!owner || !test_bit(TAINT_PROPRIETARY_MODULE, &owner->taints))
1184 		return true;
1185 
1186 	if (mod->using_gplonly_symbols) {
1187 		pr_err("%s: module using GPL-only symbols uses symbols %s from proprietary module %s.\n",
1188 			mod->name, name, owner->name);
1189 		return false;
1190 	}
1191 
1192 	if (!test_bit(TAINT_PROPRIETARY_MODULE, &mod->taints)) {
1193 		pr_warn("%s: module uses symbols %s from proprietary module %s, inheriting taint.\n",
1194 			mod->name, name, owner->name);
1195 		set_bit(TAINT_PROPRIETARY_MODULE, &mod->taints);
1196 	}
1197 	return true;
1198 }
1199 
1200 /* Resolve a symbol for this module.  I.e. if we find one, record usage. */
1201 static const struct kernel_symbol *resolve_symbol(struct module *mod,
1202 						  const struct load_info *info,
1203 						  const char *name,
1204 						  char ownername[])
1205 {
1206 	struct find_symbol_arg fsa = {
1207 		.name	= name,
1208 		.gplok	= !(mod->taints & (1 << TAINT_PROPRIETARY_MODULE)),
1209 		.warn	= true,
1210 	};
1211 	int err;
1212 
1213 	/*
1214 	 * The module_mutex should not be a heavily contended lock;
1215 	 * if we get the occasional sleep here, we'll go an extra iteration
1216 	 * in the wait_event_interruptible(), which is harmless.
1217 	 */
1218 	sched_annotate_sleep();
1219 	mutex_lock(&module_mutex);
1220 	if (!find_symbol(&fsa))
1221 		goto unlock;
1222 
1223 	if (fsa.license == GPL_ONLY)
1224 		mod->using_gplonly_symbols = true;
1225 
1226 	if (!inherit_taint(mod, fsa.owner, name)) {
1227 		fsa.sym = NULL;
1228 		goto getname;
1229 	}
1230 
1231 	if (!check_version(info, name, mod, fsa.crc)) {
1232 		fsa.sym = ERR_PTR(-EINVAL);
1233 		goto getname;
1234 	}
1235 
1236 	err = verify_namespace_is_imported(info, fsa.sym, mod);
1237 	if (err) {
1238 		fsa.sym = ERR_PTR(err);
1239 		goto getname;
1240 	}
1241 
1242 	err = ref_module(mod, fsa.owner);
1243 	if (err) {
1244 		fsa.sym = ERR_PTR(err);
1245 		goto getname;
1246 	}
1247 
1248 getname:
1249 	/* We must make copy under the lock if we failed to get ref. */
1250 	strscpy(ownername, module_name(fsa.owner), MODULE_NAME_LEN);
1251 unlock:
1252 	mutex_unlock(&module_mutex);
1253 	return fsa.sym;
1254 }
1255 
1256 static const struct kernel_symbol *
1257 resolve_symbol_wait(struct module *mod,
1258 		    const struct load_info *info,
1259 		    const char *name)
1260 {
1261 	const struct kernel_symbol *ksym;
1262 	char owner[MODULE_NAME_LEN];
1263 
1264 	if (wait_event_interruptible_timeout(module_wq,
1265 			!IS_ERR(ksym = resolve_symbol(mod, info, name, owner))
1266 			|| PTR_ERR(ksym) != -EBUSY,
1267 					     30 * HZ) <= 0) {
1268 		pr_warn("%s: gave up waiting for init of module %s.\n",
1269 			mod->name, owner);
1270 	}
1271 	return ksym;
1272 }
1273 
1274 void __weak module_arch_cleanup(struct module *mod)
1275 {
1276 }
1277 
1278 void __weak module_arch_freeing_init(struct module *mod)
1279 {
1280 }
1281 
1282 static int module_memory_alloc(struct module *mod, enum mod_mem_type type)
1283 {
1284 	unsigned int size = PAGE_ALIGN(mod->mem[type].size);
1285 	enum execmem_type execmem_type;
1286 	void *ptr;
1287 
1288 	mod->mem[type].size = size;
1289 
1290 	if (mod_mem_type_is_data(type))
1291 		execmem_type = EXECMEM_MODULE_DATA;
1292 	else
1293 		execmem_type = EXECMEM_MODULE_TEXT;
1294 
1295 	ptr = execmem_alloc(execmem_type, size);
1296 	if (!ptr)
1297 		return -ENOMEM;
1298 
1299 	if (execmem_is_rox(execmem_type)) {
1300 		int err = execmem_make_temp_rw(ptr, size);
1301 
1302 		if (err) {
1303 			execmem_free(ptr);
1304 			return -ENOMEM;
1305 		}
1306 
1307 		mod->mem[type].is_rox = true;
1308 	}
1309 
1310 	/*
1311 	 * The pointer to these blocks of memory are stored on the module
1312 	 * structure and we keep that around so long as the module is
1313 	 * around. We only free that memory when we unload the module.
1314 	 * Just mark them as not being a leak then. The .init* ELF
1315 	 * sections *do* get freed after boot so we *could* treat them
1316 	 * slightly differently with kmemleak_ignore() and only grey
1317 	 * them out as they work as typical memory allocations which
1318 	 * *do* eventually get freed, but let's just keep things simple
1319 	 * and avoid *any* false positives.
1320 	 */
1321 	if (!mod->mem[type].is_rox)
1322 		kmemleak_not_leak(ptr);
1323 
1324 	memset(ptr, 0, size);
1325 	mod->mem[type].base = ptr;
1326 
1327 	return 0;
1328 }
1329 
1330 static void module_memory_restore_rox(struct module *mod)
1331 {
1332 	for_class_mod_mem_type(type, text) {
1333 		struct module_memory *mem = &mod->mem[type];
1334 
1335 		if (mem->is_rox)
1336 			execmem_restore_rox(mem->base, mem->size);
1337 	}
1338 }
1339 
1340 static void module_memory_free(struct module *mod, enum mod_mem_type type)
1341 {
1342 	struct module_memory *mem = &mod->mem[type];
1343 
1344 	execmem_free(mem->base);
1345 }
1346 
1347 static void free_mod_mem(struct module *mod)
1348 {
1349 	for_each_mod_mem_type(type) {
1350 		struct module_memory *mod_mem = &mod->mem[type];
1351 
1352 		if (type == MOD_DATA)
1353 			continue;
1354 
1355 		/* Free lock-classes; relies on the preceding sync_rcu(). */
1356 		lockdep_free_key_range(mod_mem->base, mod_mem->size);
1357 		if (mod_mem->size)
1358 			module_memory_free(mod, type);
1359 	}
1360 
1361 	/* MOD_DATA hosts mod, so free it at last */
1362 	lockdep_free_key_range(mod->mem[MOD_DATA].base, mod->mem[MOD_DATA].size);
1363 	module_memory_free(mod, MOD_DATA);
1364 }
1365 
1366 /* Free a module, remove from lists, etc. */
1367 static void free_module(struct module *mod)
1368 {
1369 	trace_module_free(mod);
1370 
1371 	codetag_unload_module(mod);
1372 
1373 	mod_sysfs_teardown(mod);
1374 
1375 	/*
1376 	 * We leave it in list to prevent duplicate loads, but make sure
1377 	 * that noone uses it while it's being deconstructed.
1378 	 */
1379 	mutex_lock(&module_mutex);
1380 	mod->state = MODULE_STATE_UNFORMED;
1381 	mutex_unlock(&module_mutex);
1382 
1383 	/* Arch-specific cleanup. */
1384 	module_arch_cleanup(mod);
1385 
1386 	/* Module unload stuff */
1387 	module_unload_free(mod);
1388 
1389 	/* Free any allocated parameters. */
1390 	destroy_params(mod->kp, mod->num_kp);
1391 
1392 	if (is_livepatch_module(mod))
1393 		free_module_elf(mod);
1394 
1395 	/* Now we can delete it from the lists */
1396 	mutex_lock(&module_mutex);
1397 	/* Unlink carefully: kallsyms could be walking list. */
1398 	list_del_rcu(&mod->list);
1399 	mod_tree_remove(mod);
1400 	/* Remove this module from bug list, this uses list_del_rcu */
1401 	module_bug_cleanup(mod);
1402 	/* Wait for RCU synchronizing before releasing mod->list and buglist. */
1403 	synchronize_rcu();
1404 	if (try_add_tainted_module(mod))
1405 		pr_err("%s: adding tainted module to the unloaded tainted modules list failed.\n",
1406 		       mod->name);
1407 	mutex_unlock(&module_mutex);
1408 
1409 	/* This may be empty, but that's OK */
1410 	module_arch_freeing_init(mod);
1411 	kfree(mod->args);
1412 	percpu_modfree(mod);
1413 
1414 	free_mod_mem(mod);
1415 }
1416 
1417 void *__symbol_get(const char *symbol)
1418 {
1419 	struct find_symbol_arg fsa = {
1420 		.name	= symbol,
1421 		.gplok	= true,
1422 		.warn	= true,
1423 	};
1424 
1425 	scoped_guard(rcu) {
1426 		if (!find_symbol(&fsa))
1427 			return NULL;
1428 		if (fsa.license != GPL_ONLY) {
1429 			pr_warn("failing symbol_get of non-GPLONLY symbol %s.\n",
1430 				symbol);
1431 			return NULL;
1432 		}
1433 		if (strong_try_module_get(fsa.owner))
1434 			return NULL;
1435 	}
1436 	return (void *)kernel_symbol_value(fsa.sym);
1437 }
1438 EXPORT_SYMBOL_GPL(__symbol_get);
1439 
1440 /*
1441  * Ensure that an exported symbol [global namespace] does not already exist
1442  * in the kernel or in some other module's exported symbol table.
1443  *
1444  * You must hold the module_mutex.
1445  */
1446 static int verify_exported_symbols(struct module *mod)
1447 {
1448 	unsigned int i;
1449 	const struct kernel_symbol *s;
1450 	struct {
1451 		const struct kernel_symbol *sym;
1452 		unsigned int num;
1453 	} arr[] = {
1454 		{ mod->syms, mod->num_syms },
1455 		{ mod->gpl_syms, mod->num_gpl_syms },
1456 	};
1457 
1458 	for (i = 0; i < ARRAY_SIZE(arr); i++) {
1459 		for (s = arr[i].sym; s < arr[i].sym + arr[i].num; s++) {
1460 			struct find_symbol_arg fsa = {
1461 				.name	= kernel_symbol_name(s),
1462 				.gplok	= true,
1463 			};
1464 			if (find_symbol(&fsa)) {
1465 				pr_err("%s: exports duplicate symbol %s"
1466 				       " (owned by %s)\n",
1467 				       mod->name, kernel_symbol_name(s),
1468 				       module_name(fsa.owner));
1469 				return -ENOEXEC;
1470 			}
1471 		}
1472 	}
1473 	return 0;
1474 }
1475 
1476 static bool ignore_undef_symbol(Elf_Half emachine, const char *name)
1477 {
1478 	/*
1479 	 * On x86, PIC code and Clang non-PIC code may have call foo@PLT. GNU as
1480 	 * before 2.37 produces an unreferenced _GLOBAL_OFFSET_TABLE_ on x86-64.
1481 	 * i386 has a similar problem but may not deserve a fix.
1482 	 *
1483 	 * If we ever have to ignore many symbols, consider refactoring the code to
1484 	 * only warn if referenced by a relocation.
1485 	 */
1486 	if (emachine == EM_386 || emachine == EM_X86_64)
1487 		return !strcmp(name, "_GLOBAL_OFFSET_TABLE_");
1488 	return false;
1489 }
1490 
1491 /* Change all symbols so that st_value encodes the pointer directly. */
1492 static int simplify_symbols(struct module *mod, const struct load_info *info)
1493 {
1494 	Elf_Shdr *symsec = &info->sechdrs[info->index.sym];
1495 	Elf_Sym *sym = (void *)symsec->sh_addr;
1496 	unsigned long secbase;
1497 	unsigned int i;
1498 	int ret = 0;
1499 	const struct kernel_symbol *ksym;
1500 
1501 	for (i = 1; i < symsec->sh_size / sizeof(Elf_Sym); i++) {
1502 		const char *name = info->strtab + sym[i].st_name;
1503 
1504 		switch (sym[i].st_shndx) {
1505 		case SHN_COMMON:
1506 			/* Ignore common symbols */
1507 			if (!strncmp(name, "__gnu_lto", 9))
1508 				break;
1509 
1510 			/*
1511 			 * We compiled with -fno-common.  These are not
1512 			 * supposed to happen.
1513 			 */
1514 			pr_debug("Common symbol: %s\n", name);
1515 			pr_warn("%s: please compile with -fno-common\n",
1516 			       mod->name);
1517 			ret = -ENOEXEC;
1518 			break;
1519 
1520 		case SHN_ABS:
1521 			/* Don't need to do anything */
1522 			pr_debug("Absolute symbol: 0x%08lx %s\n",
1523 				 (long)sym[i].st_value, name);
1524 			break;
1525 
1526 		case SHN_LIVEPATCH:
1527 			/* Livepatch symbols are resolved by livepatch */
1528 			break;
1529 
1530 		case SHN_UNDEF:
1531 			ksym = resolve_symbol_wait(mod, info, name);
1532 			/* Ok if resolved.  */
1533 			if (ksym && !IS_ERR(ksym)) {
1534 				sym[i].st_value = kernel_symbol_value(ksym);
1535 				break;
1536 			}
1537 
1538 			/* Ok if weak or ignored.  */
1539 			if (!ksym &&
1540 			    (ELF_ST_BIND(sym[i].st_info) == STB_WEAK ||
1541 			     ignore_undef_symbol(info->hdr->e_machine, name)))
1542 				break;
1543 
1544 			ret = PTR_ERR(ksym) ?: -ENOENT;
1545 			pr_warn("%s: Unknown symbol %s (err %d)\n",
1546 				mod->name, name, ret);
1547 			break;
1548 
1549 		default:
1550 			/* Divert to percpu allocation if a percpu var. */
1551 			if (sym[i].st_shndx == info->index.pcpu)
1552 				secbase = (unsigned long)mod_percpu(mod);
1553 			else
1554 				secbase = info->sechdrs[sym[i].st_shndx].sh_addr;
1555 			sym[i].st_value += secbase;
1556 			break;
1557 		}
1558 	}
1559 
1560 	return ret;
1561 }
1562 
1563 static int apply_relocations(struct module *mod, const struct load_info *info)
1564 {
1565 	unsigned int i;
1566 	int err = 0;
1567 
1568 	/* Now do relocations. */
1569 	for (i = 1; i < info->hdr->e_shnum; i++) {
1570 		unsigned int infosec = info->sechdrs[i].sh_info;
1571 
1572 		/* Not a valid relocation section? */
1573 		if (infosec >= info->hdr->e_shnum)
1574 			continue;
1575 
1576 		/* Don't bother with non-allocated sections */
1577 		if (!(info->sechdrs[infosec].sh_flags & SHF_ALLOC))
1578 			continue;
1579 
1580 		if (info->sechdrs[i].sh_flags & SHF_RELA_LIVEPATCH)
1581 			err = klp_apply_section_relocs(mod, info->sechdrs,
1582 						       info->secstrings,
1583 						       info->strtab,
1584 						       info->index.sym, i,
1585 						       NULL);
1586 		else if (info->sechdrs[i].sh_type == SHT_REL)
1587 			err = apply_relocate(info->sechdrs, info->strtab,
1588 					     info->index.sym, i, mod);
1589 		else if (info->sechdrs[i].sh_type == SHT_RELA)
1590 			err = apply_relocate_add(info->sechdrs, info->strtab,
1591 						 info->index.sym, i, mod);
1592 		if (err < 0)
1593 			break;
1594 	}
1595 	return err;
1596 }
1597 
1598 /* Additional bytes needed by arch in front of individual sections */
1599 unsigned int __weak arch_mod_section_prepend(struct module *mod,
1600 					     unsigned int section)
1601 {
1602 	/* default implementation just returns zero */
1603 	return 0;
1604 }
1605 
1606 long module_get_offset_and_type(struct module *mod, enum mod_mem_type type,
1607 				Elf_Shdr *sechdr, unsigned int section)
1608 {
1609 	long offset;
1610 	long mask = ((unsigned long)(type) & SH_ENTSIZE_TYPE_MASK) << SH_ENTSIZE_TYPE_SHIFT;
1611 
1612 	mod->mem[type].size += arch_mod_section_prepend(mod, section);
1613 	offset = ALIGN(mod->mem[type].size, sechdr->sh_addralign ?: 1);
1614 	mod->mem[type].size = offset + sechdr->sh_size;
1615 
1616 	WARN_ON_ONCE(offset & mask);
1617 	return offset | mask;
1618 }
1619 
1620 bool module_init_layout_section(const char *sname)
1621 {
1622 #ifndef CONFIG_MODULE_UNLOAD
1623 	if (module_exit_section(sname))
1624 		return true;
1625 #endif
1626 	return module_init_section(sname);
1627 }
1628 
1629 static void __layout_sections(struct module *mod, struct load_info *info, bool is_init)
1630 {
1631 	unsigned int m, i;
1632 
1633 	static const unsigned long masks[][2] = {
1634 		/*
1635 		 * NOTE: all executable code must be the first section
1636 		 * in this array; otherwise modify the text_size
1637 		 * finder in the two loops below
1638 		 */
1639 		{ SHF_EXECINSTR | SHF_ALLOC, ARCH_SHF_SMALL },
1640 		{ SHF_ALLOC, SHF_WRITE | ARCH_SHF_SMALL },
1641 		{ SHF_RO_AFTER_INIT | SHF_ALLOC, ARCH_SHF_SMALL },
1642 		{ SHF_WRITE | SHF_ALLOC, ARCH_SHF_SMALL },
1643 		{ ARCH_SHF_SMALL | SHF_ALLOC, 0 }
1644 	};
1645 	static const int core_m_to_mem_type[] = {
1646 		MOD_TEXT,
1647 		MOD_RODATA,
1648 		MOD_RO_AFTER_INIT,
1649 		MOD_DATA,
1650 		MOD_DATA,
1651 	};
1652 	static const int init_m_to_mem_type[] = {
1653 		MOD_INIT_TEXT,
1654 		MOD_INIT_RODATA,
1655 		MOD_INVALID,
1656 		MOD_INIT_DATA,
1657 		MOD_INIT_DATA,
1658 	};
1659 
1660 	for (m = 0; m < ARRAY_SIZE(masks); ++m) {
1661 		enum mod_mem_type type = is_init ? init_m_to_mem_type[m] : core_m_to_mem_type[m];
1662 
1663 		for (i = 0; i < info->hdr->e_shnum; ++i) {
1664 			Elf_Shdr *s = &info->sechdrs[i];
1665 			const char *sname = info->secstrings + s->sh_name;
1666 
1667 			if ((s->sh_flags & masks[m][0]) != masks[m][0]
1668 			    || (s->sh_flags & masks[m][1])
1669 			    || s->sh_entsize != ~0UL
1670 			    || is_init != module_init_layout_section(sname))
1671 				continue;
1672 
1673 			if (WARN_ON_ONCE(type == MOD_INVALID))
1674 				continue;
1675 
1676 			/*
1677 			 * Do not allocate codetag memory as we load it into
1678 			 * preallocated contiguous memory.
1679 			 */
1680 			if (codetag_needs_module_section(mod, sname, s->sh_size)) {
1681 				/*
1682 				 * s->sh_entsize won't be used but populate the
1683 				 * type field to avoid confusion.
1684 				 */
1685 				s->sh_entsize = ((unsigned long)(type) & SH_ENTSIZE_TYPE_MASK)
1686 						<< SH_ENTSIZE_TYPE_SHIFT;
1687 				continue;
1688 			}
1689 
1690 			s->sh_entsize = module_get_offset_and_type(mod, type, s, i);
1691 			pr_debug("\t%s\n", sname);
1692 		}
1693 	}
1694 }
1695 
1696 /*
1697  * Lay out the SHF_ALLOC sections in a way not dissimilar to how ld
1698  * might -- code, read-only data, read-write data, small data.  Tally
1699  * sizes, and place the offsets into sh_entsize fields: high bit means it
1700  * belongs in init.
1701  */
1702 static void layout_sections(struct module *mod, struct load_info *info)
1703 {
1704 	unsigned int i;
1705 
1706 	for (i = 0; i < info->hdr->e_shnum; i++)
1707 		info->sechdrs[i].sh_entsize = ~0UL;
1708 
1709 	pr_debug("Core section allocation order for %s:\n", mod->name);
1710 	__layout_sections(mod, info, false);
1711 
1712 	pr_debug("Init section allocation order for %s:\n", mod->name);
1713 	__layout_sections(mod, info, true);
1714 }
1715 
1716 static void module_license_taint_check(struct module *mod, const char *license)
1717 {
1718 	if (!license)
1719 		license = "unspecified";
1720 
1721 	if (!license_is_gpl_compatible(license)) {
1722 		if (!test_taint(TAINT_PROPRIETARY_MODULE))
1723 			pr_warn("%s: module license '%s' taints kernel.\n",
1724 				mod->name, license);
1725 		add_taint_module(mod, TAINT_PROPRIETARY_MODULE,
1726 				 LOCKDEP_NOW_UNRELIABLE);
1727 	}
1728 }
1729 
1730 static int setup_modinfo(struct module *mod, struct load_info *info)
1731 {
1732 	const struct module_attribute *attr;
1733 	char *imported_namespace;
1734 	int i;
1735 
1736 	for (i = 0; (attr = modinfo_attrs[i]); i++) {
1737 		if (attr->setup)
1738 			attr->setup(mod, get_modinfo(info, attr->attr.name));
1739 	}
1740 
1741 	for_each_modinfo_entry(imported_namespace, info, "import_ns") {
1742 		/*
1743 		 * 'module:' prefixed namespaces are implicit, disallow
1744 		 * explicit imports.
1745 		 */
1746 		if (strstarts(imported_namespace, "module:")) {
1747 			pr_err("%s: module tries to import module namespace: %s\n",
1748 			       mod->name, imported_namespace);
1749 			return -EPERM;
1750 		}
1751 	}
1752 
1753 	return 0;
1754 }
1755 
1756 static void free_modinfo(struct module *mod)
1757 {
1758 	const struct module_attribute *attr;
1759 	int i;
1760 
1761 	for (i = 0; (attr = modinfo_attrs[i]); i++) {
1762 		if (attr->free)
1763 			attr->free(mod);
1764 	}
1765 }
1766 
1767 bool __weak module_init_section(const char *name)
1768 {
1769 	return strstarts(name, ".init");
1770 }
1771 
1772 bool __weak module_exit_section(const char *name)
1773 {
1774 	return strstarts(name, ".exit");
1775 }
1776 
1777 static int validate_section_offset(const struct load_info *info, Elf_Shdr *shdr)
1778 {
1779 #if defined(CONFIG_64BIT)
1780 	unsigned long long secend;
1781 #else
1782 	unsigned long secend;
1783 #endif
1784 
1785 	/*
1786 	 * Check for both overflow and offset/size being
1787 	 * too large.
1788 	 */
1789 	secend = shdr->sh_offset + shdr->sh_size;
1790 	if (secend < shdr->sh_offset || secend > info->len)
1791 		return -ENOEXEC;
1792 
1793 	return 0;
1794 }
1795 
1796 /**
1797  * elf_validity_ehdr() - Checks an ELF header for module validity
1798  * @info: Load info containing the ELF header to check
1799  *
1800  * Checks whether an ELF header could belong to a valid module. Checks:
1801  *
1802  * * ELF header is within the data the user provided
1803  * * ELF magic is present
1804  * * It is relocatable (not final linked, not core file, etc.)
1805  * * The header's machine type matches what the architecture expects.
1806  * * Optional arch-specific hook for other properties
1807  *   - module_elf_check_arch() is currently only used by PPC to check
1808  *   ELF ABI version, but may be used by others in the future.
1809  *
1810  * Return: %0 if valid, %-ENOEXEC on failure.
1811  */
1812 static int elf_validity_ehdr(const struct load_info *info)
1813 {
1814 	if (info->len < sizeof(*(info->hdr))) {
1815 		pr_err("Invalid ELF header len %lu\n", info->len);
1816 		return -ENOEXEC;
1817 	}
1818 	if (memcmp(info->hdr->e_ident, ELFMAG, SELFMAG) != 0) {
1819 		pr_err("Invalid ELF header magic: != %s\n", ELFMAG);
1820 		return -ENOEXEC;
1821 	}
1822 	if (info->hdr->e_type != ET_REL) {
1823 		pr_err("Invalid ELF header type: %u != %u\n",
1824 		       info->hdr->e_type, ET_REL);
1825 		return -ENOEXEC;
1826 	}
1827 	if (!elf_check_arch(info->hdr)) {
1828 		pr_err("Invalid architecture in ELF header: %u\n",
1829 		       info->hdr->e_machine);
1830 		return -ENOEXEC;
1831 	}
1832 	if (!module_elf_check_arch(info->hdr)) {
1833 		pr_err("Invalid module architecture in ELF header: %u\n",
1834 		       info->hdr->e_machine);
1835 		return -ENOEXEC;
1836 	}
1837 	return 0;
1838 }
1839 
1840 /**
1841  * elf_validity_cache_sechdrs() - Cache section headers if valid
1842  * @info: Load info to compute section headers from
1843  *
1844  * Checks:
1845  *
1846  * * ELF header is valid (see elf_validity_ehdr())
1847  * * Section headers are the size we expect
1848  * * Section array fits in the user provided data
1849  * * Section index 0 is NULL
1850  * * Section contents are inbounds
1851  *
1852  * Then updates @info with a &load_info->sechdrs pointer if valid.
1853  *
1854  * Return: %0 if valid, negative error code if validation failed.
1855  */
1856 static int elf_validity_cache_sechdrs(struct load_info *info)
1857 {
1858 	Elf_Shdr *sechdrs;
1859 	Elf_Shdr *shdr;
1860 	int i;
1861 	int err;
1862 
1863 	err = elf_validity_ehdr(info);
1864 	if (err < 0)
1865 		return err;
1866 
1867 	if (info->hdr->e_shentsize != sizeof(Elf_Shdr)) {
1868 		pr_err("Invalid ELF section header size\n");
1869 		return -ENOEXEC;
1870 	}
1871 
1872 	/*
1873 	 * e_shnum is 16 bits, and sizeof(Elf_Shdr) is
1874 	 * known and small. So e_shnum * sizeof(Elf_Shdr)
1875 	 * will not overflow unsigned long on any platform.
1876 	 */
1877 	if (info->hdr->e_shoff >= info->len
1878 	    || (info->hdr->e_shnum * sizeof(Elf_Shdr) >
1879 		info->len - info->hdr->e_shoff)) {
1880 		pr_err("Invalid ELF section header overflow\n");
1881 		return -ENOEXEC;
1882 	}
1883 
1884 	sechdrs = (void *)info->hdr + info->hdr->e_shoff;
1885 
1886 	/*
1887 	 * The code assumes that section 0 has a length of zero and
1888 	 * an addr of zero, so check for it.
1889 	 */
1890 	if (sechdrs[0].sh_type != SHT_NULL
1891 	    || sechdrs[0].sh_size != 0
1892 	    || sechdrs[0].sh_addr != 0) {
1893 		pr_err("ELF Spec violation: section 0 type(%d)!=SH_NULL or non-zero len or addr\n",
1894 		       sechdrs[0].sh_type);
1895 		return -ENOEXEC;
1896 	}
1897 
1898 	/* Validate contents are inbounds */
1899 	for (i = 1; i < info->hdr->e_shnum; i++) {
1900 		shdr = &sechdrs[i];
1901 		switch (shdr->sh_type) {
1902 		case SHT_NULL:
1903 		case SHT_NOBITS:
1904 			/* No contents, offset/size don't mean anything */
1905 			continue;
1906 		default:
1907 			err = validate_section_offset(info, shdr);
1908 			if (err < 0) {
1909 				pr_err("Invalid ELF section in module (section %u type %u)\n",
1910 				       i, shdr->sh_type);
1911 				return err;
1912 			}
1913 		}
1914 	}
1915 
1916 	info->sechdrs = sechdrs;
1917 
1918 	return 0;
1919 }
1920 
1921 /**
1922  * elf_validity_cache_secstrings() - Caches section names if valid
1923  * @info: Load info to cache section names from. Must have valid sechdrs.
1924  *
1925  * Specifically checks:
1926  *
1927  * * Section name table index is inbounds of section headers
1928  * * Section name table is not empty
1929  * * Section name table is NUL terminated
1930  * * All section name offsets are inbounds of the section
1931  *
1932  * Then updates @info with a &load_info->secstrings pointer if valid.
1933  *
1934  * Return: %0 if valid, negative error code if validation failed.
1935  */
1936 static int elf_validity_cache_secstrings(struct load_info *info)
1937 {
1938 	Elf_Shdr *strhdr, *shdr;
1939 	char *secstrings;
1940 	int i;
1941 
1942 	/*
1943 	 * Verify if the section name table index is valid.
1944 	 */
1945 	if (info->hdr->e_shstrndx == SHN_UNDEF
1946 	    || info->hdr->e_shstrndx >= info->hdr->e_shnum) {
1947 		pr_err("Invalid ELF section name index: %d || e_shstrndx (%d) >= e_shnum (%d)\n",
1948 		       info->hdr->e_shstrndx, info->hdr->e_shstrndx,
1949 		       info->hdr->e_shnum);
1950 		return -ENOEXEC;
1951 	}
1952 
1953 	strhdr = &info->sechdrs[info->hdr->e_shstrndx];
1954 
1955 	/*
1956 	 * The section name table must be NUL-terminated, as required
1957 	 * by the spec. This makes strcmp and pr_* calls that access
1958 	 * strings in the section safe.
1959 	 */
1960 	secstrings = (void *)info->hdr + strhdr->sh_offset;
1961 	if (strhdr->sh_size == 0) {
1962 		pr_err("empty section name table\n");
1963 		return -ENOEXEC;
1964 	}
1965 	if (secstrings[strhdr->sh_size - 1] != '\0') {
1966 		pr_err("ELF Spec violation: section name table isn't null terminated\n");
1967 		return -ENOEXEC;
1968 	}
1969 
1970 	for (i = 0; i < info->hdr->e_shnum; i++) {
1971 		shdr = &info->sechdrs[i];
1972 		/* SHT_NULL means sh_name has an undefined value */
1973 		if (shdr->sh_type == SHT_NULL)
1974 			continue;
1975 		if (shdr->sh_name >= strhdr->sh_size) {
1976 			pr_err("Invalid ELF section name in module (section %u type %u)\n",
1977 			       i, shdr->sh_type);
1978 			return -ENOEXEC;
1979 		}
1980 	}
1981 
1982 	info->secstrings = secstrings;
1983 	return 0;
1984 }
1985 
1986 /**
1987  * elf_validity_cache_index_info() - Validate and cache modinfo section
1988  * @info: Load info to populate the modinfo index on.
1989  *        Must have &load_info->sechdrs and &load_info->secstrings populated
1990  *
1991  * Checks that if there is a .modinfo section, it is unique.
1992  * Then, it caches its index in &load_info->index.info.
1993  * Finally, it tries to populate the name to improve error messages.
1994  *
1995  * Return: %0 if valid, %-ENOEXEC if multiple modinfo sections were found.
1996  */
1997 static int elf_validity_cache_index_info(struct load_info *info)
1998 {
1999 	int info_idx;
2000 
2001 	info_idx = find_any_unique_sec(info, ".modinfo");
2002 
2003 	if (info_idx == 0)
2004 		/* Early return, no .modinfo */
2005 		return 0;
2006 
2007 	if (info_idx < 0) {
2008 		pr_err("Only one .modinfo section must exist.\n");
2009 		return -ENOEXEC;
2010 	}
2011 
2012 	info->index.info = info_idx;
2013 	/* Try to find a name early so we can log errors with a module name */
2014 	info->name = get_modinfo(info, "name");
2015 
2016 	return 0;
2017 }
2018 
2019 /**
2020  * elf_validity_cache_index_mod() - Validates and caches this_module section
2021  * @info: Load info to cache this_module on.
2022  *        Must have &load_info->sechdrs and &load_info->secstrings populated
2023  *
2024  * The ".gnu.linkonce.this_module" ELF section is special. It is what modpost
2025  * uses to refer to __this_module and let's use rely on THIS_MODULE to point
2026  * to &__this_module properly. The kernel's modpost declares it on each
2027  * modules's *.mod.c file. If the struct module of the kernel changes a full
2028  * kernel rebuild is required.
2029  *
2030  * We have a few expectations for this special section, this function
2031  * validates all this for us:
2032  *
2033  * * The section has contents
2034  * * The section is unique
2035  * * We expect the kernel to always have to allocate it: SHF_ALLOC
2036  * * The section size must match the kernel's run time's struct module
2037  *   size
2038  *
2039  * If all checks pass, the index will be cached in &load_info->index.mod
2040  *
2041  * Return: %0 on validation success, %-ENOEXEC on failure
2042  */
2043 static int elf_validity_cache_index_mod(struct load_info *info)
2044 {
2045 	Elf_Shdr *shdr;
2046 	int mod_idx;
2047 
2048 	mod_idx = find_any_unique_sec(info, ".gnu.linkonce.this_module");
2049 	if (mod_idx <= 0) {
2050 		pr_err("module %s: Exactly one .gnu.linkonce.this_module section must exist.\n",
2051 		       info->name ?: "(missing .modinfo section or name field)");
2052 		return -ENOEXEC;
2053 	}
2054 
2055 	shdr = &info->sechdrs[mod_idx];
2056 
2057 	if (shdr->sh_type == SHT_NOBITS) {
2058 		pr_err("module %s: .gnu.linkonce.this_module section must have a size set\n",
2059 		       info->name ?: "(missing .modinfo section or name field)");
2060 		return -ENOEXEC;
2061 	}
2062 
2063 	if (!(shdr->sh_flags & SHF_ALLOC)) {
2064 		pr_err("module %s: .gnu.linkonce.this_module must occupy memory during process execution\n",
2065 		       info->name ?: "(missing .modinfo section or name field)");
2066 		return -ENOEXEC;
2067 	}
2068 
2069 	if (shdr->sh_size != sizeof(struct module)) {
2070 		pr_err("module %s: .gnu.linkonce.this_module section size must match the kernel's built struct module size at run time\n",
2071 		       info->name ?: "(missing .modinfo section or name field)");
2072 		return -ENOEXEC;
2073 	}
2074 
2075 	info->index.mod = mod_idx;
2076 
2077 	return 0;
2078 }
2079 
2080 /**
2081  * elf_validity_cache_index_sym() - Validate and cache symtab index
2082  * @info: Load info to cache symtab index in.
2083  *        Must have &load_info->sechdrs and &load_info->secstrings populated.
2084  *
2085  * Checks that there is exactly one symbol table, then caches its index in
2086  * &load_info->index.sym.
2087  *
2088  * Return: %0 if valid, %-ENOEXEC on failure.
2089  */
2090 static int elf_validity_cache_index_sym(struct load_info *info)
2091 {
2092 	unsigned int sym_idx;
2093 	unsigned int num_sym_secs = 0;
2094 	int i;
2095 
2096 	for (i = 1; i < info->hdr->e_shnum; i++) {
2097 		if (info->sechdrs[i].sh_type == SHT_SYMTAB) {
2098 			num_sym_secs++;
2099 			sym_idx = i;
2100 		}
2101 	}
2102 
2103 	if (num_sym_secs != 1) {
2104 		pr_warn("%s: module has no symbols (stripped?)\n",
2105 			info->name ?: "(missing .modinfo section or name field)");
2106 		return -ENOEXEC;
2107 	}
2108 
2109 	info->index.sym = sym_idx;
2110 
2111 	return 0;
2112 }
2113 
2114 /**
2115  * elf_validity_cache_index_str() - Validate and cache strtab index
2116  * @info: Load info to cache strtab index in.
2117  *        Must have &load_info->sechdrs and &load_info->secstrings populated.
2118  *        Must have &load_info->index.sym populated.
2119  *
2120  * Looks at the symbol table's associated string table, makes sure it is
2121  * in-bounds, and caches it.
2122  *
2123  * Return: %0 if valid, %-ENOEXEC on failure.
2124  */
2125 static int elf_validity_cache_index_str(struct load_info *info)
2126 {
2127 	unsigned int str_idx = info->sechdrs[info->index.sym].sh_link;
2128 
2129 	if (str_idx == SHN_UNDEF || str_idx >= info->hdr->e_shnum) {
2130 		pr_err("Invalid ELF sh_link!=SHN_UNDEF(%d) or (sh_link(%d) >= hdr->e_shnum(%d)\n",
2131 		       str_idx, str_idx, info->hdr->e_shnum);
2132 		return -ENOEXEC;
2133 	}
2134 
2135 	info->index.str = str_idx;
2136 	return 0;
2137 }
2138 
2139 /**
2140  * elf_validity_cache_index_versions() - Validate and cache version indices
2141  * @info:  Load info to cache version indices in.
2142  *         Must have &load_info->sechdrs and &load_info->secstrings populated.
2143  * @flags: Load flags, relevant to suppress version loading, see
2144  *         uapi/linux/module.h
2145  *
2146  * If we're ignoring modversions based on @flags, zero all version indices
2147  * and return validity. Othewrise check:
2148  *
2149  * * If "__version_ext_crcs" is present, "__version_ext_names" is present
2150  * * There is a name present for every crc
2151  *
2152  * Then populate:
2153  *
2154  * * &load_info->index.vers
2155  * * &load_info->index.vers_ext_crc
2156  * * &load_info->index.vers_ext_names
2157  *
2158  * if present.
2159  *
2160  * Return: %0 if valid, %-ENOEXEC on failure.
2161  */
2162 static int elf_validity_cache_index_versions(struct load_info *info, int flags)
2163 {
2164 	unsigned int vers_ext_crc;
2165 	unsigned int vers_ext_name;
2166 	size_t crc_count;
2167 	size_t remaining_len;
2168 	size_t name_size;
2169 	char *name;
2170 
2171 	/* If modversions were suppressed, pretend we didn't find any */
2172 	if (flags & MODULE_INIT_IGNORE_MODVERSIONS) {
2173 		info->index.vers = 0;
2174 		info->index.vers_ext_crc = 0;
2175 		info->index.vers_ext_name = 0;
2176 		return 0;
2177 	}
2178 
2179 	vers_ext_crc = find_sec(info, "__version_ext_crcs");
2180 	vers_ext_name = find_sec(info, "__version_ext_names");
2181 
2182 	/* If we have one field, we must have the other */
2183 	if (!!vers_ext_crc != !!vers_ext_name) {
2184 		pr_err("extended version crc+name presence does not match");
2185 		return -ENOEXEC;
2186 	}
2187 
2188 	/*
2189 	 * If we have extended version information, we should have the same
2190 	 * number of entries in every section.
2191 	 */
2192 	if (vers_ext_crc) {
2193 		crc_count = info->sechdrs[vers_ext_crc].sh_size / sizeof(u32);
2194 		name = (void *)info->hdr +
2195 			info->sechdrs[vers_ext_name].sh_offset;
2196 		remaining_len = info->sechdrs[vers_ext_name].sh_size;
2197 
2198 		while (crc_count--) {
2199 			name_size = strnlen(name, remaining_len) + 1;
2200 			if (name_size > remaining_len) {
2201 				pr_err("more extended version crcs than names");
2202 				return -ENOEXEC;
2203 			}
2204 			remaining_len -= name_size;
2205 			name += name_size;
2206 		}
2207 	}
2208 
2209 	info->index.vers = find_sec(info, "__versions");
2210 	info->index.vers_ext_crc = vers_ext_crc;
2211 	info->index.vers_ext_name = vers_ext_name;
2212 	return 0;
2213 }
2214 
2215 /**
2216  * elf_validity_cache_index() - Resolve, validate, cache section indices
2217  * @info:  Load info to read from and update.
2218  *         &load_info->sechdrs and &load_info->secstrings must be populated.
2219  * @flags: Load flags, relevant to suppress version loading, see
2220  *         uapi/linux/module.h
2221  *
2222  * Populates &load_info->index, validating as it goes.
2223  * See child functions for per-field validation:
2224  *
2225  * * elf_validity_cache_index_info()
2226  * * elf_validity_cache_index_mod()
2227  * * elf_validity_cache_index_sym()
2228  * * elf_validity_cache_index_str()
2229  * * elf_validity_cache_index_versions()
2230  *
2231  * If CONFIG_SMP is enabled, load the percpu section by name with no
2232  * validation.
2233  *
2234  * Return: 0 on success, negative error code if an index failed validation.
2235  */
2236 static int elf_validity_cache_index(struct load_info *info, int flags)
2237 {
2238 	int err;
2239 
2240 	err = elf_validity_cache_index_info(info);
2241 	if (err < 0)
2242 		return err;
2243 	err = elf_validity_cache_index_mod(info);
2244 	if (err < 0)
2245 		return err;
2246 	err = elf_validity_cache_index_sym(info);
2247 	if (err < 0)
2248 		return err;
2249 	err = elf_validity_cache_index_str(info);
2250 	if (err < 0)
2251 		return err;
2252 	err = elf_validity_cache_index_versions(info, flags);
2253 	if (err < 0)
2254 		return err;
2255 
2256 	info->index.pcpu = find_pcpusec(info);
2257 
2258 	return 0;
2259 }
2260 
2261 /**
2262  * elf_validity_cache_strtab() - Validate and cache symbol string table
2263  * @info: Load info to read from and update.
2264  *        Must have &load_info->sechdrs and &load_info->secstrings populated.
2265  *        Must have &load_info->index populated.
2266  *
2267  * Checks:
2268  *
2269  * * The string table is not empty.
2270  * * The string table starts and ends with NUL (required by ELF spec).
2271  * * Every &Elf_Sym->st_name offset in the symbol table is inbounds of the
2272  *   string table.
2273  *
2274  * And caches the pointer as &load_info->strtab in @info.
2275  *
2276  * Return: 0 on success, negative error code if a check failed.
2277  */
2278 static int elf_validity_cache_strtab(struct load_info *info)
2279 {
2280 	Elf_Shdr *str_shdr = &info->sechdrs[info->index.str];
2281 	Elf_Shdr *sym_shdr = &info->sechdrs[info->index.sym];
2282 	char *strtab = (char *)info->hdr + str_shdr->sh_offset;
2283 	Elf_Sym *syms = (void *)info->hdr + sym_shdr->sh_offset;
2284 	int i;
2285 
2286 	if (str_shdr->sh_size == 0) {
2287 		pr_err("empty symbol string table\n");
2288 		return -ENOEXEC;
2289 	}
2290 	if (strtab[0] != '\0') {
2291 		pr_err("symbol string table missing leading NUL\n");
2292 		return -ENOEXEC;
2293 	}
2294 	if (strtab[str_shdr->sh_size - 1] != '\0') {
2295 		pr_err("symbol string table isn't NUL terminated\n");
2296 		return -ENOEXEC;
2297 	}
2298 
2299 	/*
2300 	 * Now that we know strtab is correctly structured, check symbol
2301 	 * starts are inbounds before they're used later.
2302 	 */
2303 	for (i = 0; i < sym_shdr->sh_size / sizeof(*syms); i++) {
2304 		if (syms[i].st_name >= str_shdr->sh_size) {
2305 			pr_err("symbol name out of bounds in string table");
2306 			return -ENOEXEC;
2307 		}
2308 	}
2309 
2310 	info->strtab = strtab;
2311 	return 0;
2312 }
2313 
2314 /*
2315  * Check userspace passed ELF module against our expectations, and cache
2316  * useful variables for further processing as we go.
2317  *
2318  * This does basic validity checks against section offsets and sizes, the
2319  * section name string table, and the indices used for it (sh_name).
2320  *
2321  * As a last step, since we're already checking the ELF sections we cache
2322  * useful variables which will be used later for our convenience:
2323  *
2324  * 	o pointers to section headers
2325  * 	o cache the modinfo symbol section
2326  * 	o cache the string symbol section
2327  * 	o cache the module section
2328  *
2329  * As a last step we set info->mod to the temporary copy of the module in
2330  * info->hdr. The final one will be allocated in move_module(). Any
2331  * modifications we make to our copy of the module will be carried over
2332  * to the final minted module.
2333  */
2334 static int elf_validity_cache_copy(struct load_info *info, int flags)
2335 {
2336 	int err;
2337 
2338 	err = elf_validity_cache_sechdrs(info);
2339 	if (err < 0)
2340 		return err;
2341 	err = elf_validity_cache_secstrings(info);
2342 	if (err < 0)
2343 		return err;
2344 	err = elf_validity_cache_index(info, flags);
2345 	if (err < 0)
2346 		return err;
2347 	err = elf_validity_cache_strtab(info);
2348 	if (err < 0)
2349 		return err;
2350 
2351 	/* This is temporary: point mod into copy of data. */
2352 	info->mod = (void *)info->hdr + info->sechdrs[info->index.mod].sh_offset;
2353 
2354 	/*
2355 	 * If we didn't load the .modinfo 'name' field earlier, fall back to
2356 	 * on-disk struct mod 'name' field.
2357 	 */
2358 	if (!info->name)
2359 		info->name = info->mod->name;
2360 
2361 	return 0;
2362 }
2363 
2364 #define COPY_CHUNK_SIZE (16*PAGE_SIZE)
2365 
2366 static int copy_chunked_from_user(void *dst, const void __user *usrc, unsigned long len)
2367 {
2368 	do {
2369 		unsigned long n = min(len, COPY_CHUNK_SIZE);
2370 
2371 		if (copy_from_user(dst, usrc, n) != 0)
2372 			return -EFAULT;
2373 		cond_resched();
2374 		dst += n;
2375 		usrc += n;
2376 		len -= n;
2377 	} while (len);
2378 	return 0;
2379 }
2380 
2381 static int check_modinfo_livepatch(struct module *mod, struct load_info *info)
2382 {
2383 	if (!get_modinfo(info, "livepatch"))
2384 		/* Nothing more to do */
2385 		return 0;
2386 
2387 	if (set_livepatch_module(mod))
2388 		return 0;
2389 
2390 	pr_err("%s: module is marked as livepatch module, but livepatch support is disabled",
2391 	       mod->name);
2392 	return -ENOEXEC;
2393 }
2394 
2395 static void check_modinfo_retpoline(struct module *mod, struct load_info *info)
2396 {
2397 	if (retpoline_module_ok(get_modinfo(info, "retpoline")))
2398 		return;
2399 
2400 	pr_warn("%s: loading module not compiled with retpoline compiler.\n",
2401 		mod->name);
2402 }
2403 
2404 /* Sets info->hdr and info->len. */
2405 static int copy_module_from_user(const void __user *umod, unsigned long len,
2406 				  struct load_info *info)
2407 {
2408 	int err;
2409 
2410 	info->len = len;
2411 	if (info->len < sizeof(*(info->hdr)))
2412 		return -ENOEXEC;
2413 
2414 	err = security_kernel_load_data(LOADING_MODULE, true);
2415 	if (err)
2416 		return err;
2417 
2418 	/* Suck in entire file: we'll want most of it. */
2419 	info->hdr = __vmalloc(info->len, GFP_KERNEL | __GFP_NOWARN);
2420 	if (!info->hdr)
2421 		return -ENOMEM;
2422 
2423 	if (copy_chunked_from_user(info->hdr, umod, info->len) != 0) {
2424 		err = -EFAULT;
2425 		goto out;
2426 	}
2427 
2428 	err = security_kernel_post_load_data((char *)info->hdr, info->len,
2429 					     LOADING_MODULE, "init_module");
2430 out:
2431 	if (err)
2432 		vfree(info->hdr);
2433 
2434 	return err;
2435 }
2436 
2437 static void free_copy(struct load_info *info, int flags)
2438 {
2439 	if (flags & MODULE_INIT_COMPRESSED_FILE)
2440 		module_decompress_cleanup(info);
2441 	else
2442 		vfree(info->hdr);
2443 }
2444 
2445 static int rewrite_section_headers(struct load_info *info, int flags)
2446 {
2447 	unsigned int i;
2448 
2449 	/* This should always be true, but let's be sure. */
2450 	info->sechdrs[0].sh_addr = 0;
2451 
2452 	for (i = 1; i < info->hdr->e_shnum; i++) {
2453 		Elf_Shdr *shdr = &info->sechdrs[i];
2454 
2455 		/*
2456 		 * Mark all sections sh_addr with their address in the
2457 		 * temporary image.
2458 		 */
2459 		shdr->sh_addr = (size_t)info->hdr + shdr->sh_offset;
2460 
2461 	}
2462 
2463 	/* Track but don't keep modinfo and version sections. */
2464 	info->sechdrs[info->index.vers].sh_flags &= ~(unsigned long)SHF_ALLOC;
2465 	info->sechdrs[info->index.vers_ext_crc].sh_flags &=
2466 		~(unsigned long)SHF_ALLOC;
2467 	info->sechdrs[info->index.vers_ext_name].sh_flags &=
2468 		~(unsigned long)SHF_ALLOC;
2469 	info->sechdrs[info->index.info].sh_flags &= ~(unsigned long)SHF_ALLOC;
2470 
2471 	return 0;
2472 }
2473 
2474 static const char *const module_license_offenders[] = {
2475 	/* driverloader was caught wrongly pretending to be under GPL */
2476 	"driverloader",
2477 
2478 	/* lve claims to be GPL but upstream won't provide source */
2479 	"lve",
2480 };
2481 
2482 /*
2483  * These calls taint the kernel depending certain module circumstances */
2484 static void module_augment_kernel_taints(struct module *mod, struct load_info *info)
2485 {
2486 	int prev_taint = test_taint(TAINT_PROPRIETARY_MODULE);
2487 	size_t i;
2488 
2489 	if (!get_modinfo(info, "intree")) {
2490 		if (!test_taint(TAINT_OOT_MODULE))
2491 			pr_warn("%s: loading out-of-tree module taints kernel.\n",
2492 				mod->name);
2493 		add_taint_module(mod, TAINT_OOT_MODULE, LOCKDEP_STILL_OK);
2494 	}
2495 
2496 	check_modinfo_retpoline(mod, info);
2497 
2498 	if (get_modinfo(info, "staging")) {
2499 		add_taint_module(mod, TAINT_CRAP, LOCKDEP_STILL_OK);
2500 		pr_warn("%s: module is from the staging directory, the quality "
2501 			"is unknown, you have been warned.\n", mod->name);
2502 	}
2503 
2504 	if (is_livepatch_module(mod)) {
2505 		add_taint_module(mod, TAINT_LIVEPATCH, LOCKDEP_STILL_OK);
2506 		pr_notice_once("%s: tainting kernel with TAINT_LIVEPATCH\n",
2507 				mod->name);
2508 	}
2509 
2510 	module_license_taint_check(mod, get_modinfo(info, "license"));
2511 
2512 	if (get_modinfo(info, "test")) {
2513 		if (!test_taint(TAINT_TEST))
2514 			pr_warn("%s: loading test module taints kernel.\n",
2515 				mod->name);
2516 		add_taint_module(mod, TAINT_TEST, LOCKDEP_STILL_OK);
2517 	}
2518 #ifdef CONFIG_MODULE_SIG
2519 	mod->sig_ok = info->sig_ok;
2520 	if (!mod->sig_ok) {
2521 		pr_notice_once("%s: module verification failed: signature "
2522 			       "and/or required key missing - tainting "
2523 			       "kernel\n", mod->name);
2524 		add_taint_module(mod, TAINT_UNSIGNED_MODULE, LOCKDEP_STILL_OK);
2525 	}
2526 #endif
2527 
2528 	/*
2529 	 * ndiswrapper is under GPL by itself, but loads proprietary modules.
2530 	 * Don't use add_taint_module(), as it would prevent ndiswrapper from
2531 	 * using GPL-only symbols it needs.
2532 	 */
2533 	if (strcmp(mod->name, "ndiswrapper") == 0)
2534 		add_taint(TAINT_PROPRIETARY_MODULE, LOCKDEP_NOW_UNRELIABLE);
2535 
2536 	for (i = 0; i < ARRAY_SIZE(module_license_offenders); ++i) {
2537 		if (strcmp(mod->name, module_license_offenders[i]) == 0)
2538 			add_taint_module(mod, TAINT_PROPRIETARY_MODULE,
2539 					 LOCKDEP_NOW_UNRELIABLE);
2540 	}
2541 
2542 	if (!prev_taint && test_taint(TAINT_PROPRIETARY_MODULE))
2543 		pr_warn("%s: module license taints kernel.\n", mod->name);
2544 
2545 }
2546 
2547 static int check_modinfo(struct module *mod, struct load_info *info, int flags)
2548 {
2549 	const char *modmagic = get_modinfo(info, "vermagic");
2550 	int err;
2551 
2552 	if (flags & MODULE_INIT_IGNORE_VERMAGIC)
2553 		modmagic = NULL;
2554 
2555 	/* This is allowed: modprobe --force will invalidate it. */
2556 	if (!modmagic) {
2557 		err = try_to_force_load(mod, "bad vermagic");
2558 		if (err)
2559 			return err;
2560 	} else if (!same_magic(modmagic, vermagic, info->index.vers)) {
2561 		pr_err("%s: version magic '%s' should be '%s'\n",
2562 		       info->name, modmagic, vermagic);
2563 		return -ENOEXEC;
2564 	}
2565 
2566 	err = check_modinfo_livepatch(mod, info);
2567 	if (err)
2568 		return err;
2569 
2570 	return 0;
2571 }
2572 
2573 static int find_module_sections(struct module *mod, struct load_info *info)
2574 {
2575 	mod->kp = section_objs(info, "__param",
2576 			       sizeof(*mod->kp), &mod->num_kp);
2577 	mod->syms = section_objs(info, "__ksymtab",
2578 				 sizeof(*mod->syms), &mod->num_syms);
2579 	mod->crcs = section_addr(info, "__kcrctab");
2580 	mod->gpl_syms = section_objs(info, "__ksymtab_gpl",
2581 				     sizeof(*mod->gpl_syms),
2582 				     &mod->num_gpl_syms);
2583 	mod->gpl_crcs = section_addr(info, "__kcrctab_gpl");
2584 
2585 #ifdef CONFIG_CONSTRUCTORS
2586 	mod->ctors = section_objs(info, ".ctors",
2587 				  sizeof(*mod->ctors), &mod->num_ctors);
2588 	if (!mod->ctors)
2589 		mod->ctors = section_objs(info, ".init_array",
2590 				sizeof(*mod->ctors), &mod->num_ctors);
2591 	else if (find_sec(info, ".init_array")) {
2592 		/*
2593 		 * This shouldn't happen with same compiler and binutils
2594 		 * building all parts of the module.
2595 		 */
2596 		pr_warn("%s: has both .ctors and .init_array.\n",
2597 		       mod->name);
2598 		return -EINVAL;
2599 	}
2600 #endif
2601 
2602 	mod->noinstr_text_start = section_objs(info, ".noinstr.text", 1,
2603 						&mod->noinstr_text_size);
2604 
2605 #ifdef CONFIG_TRACEPOINTS
2606 	mod->tracepoints_ptrs = section_objs(info, "__tracepoints_ptrs",
2607 					     sizeof(*mod->tracepoints_ptrs),
2608 					     &mod->num_tracepoints);
2609 #endif
2610 #ifdef CONFIG_TREE_SRCU
2611 	mod->srcu_struct_ptrs = section_objs(info, "___srcu_struct_ptrs",
2612 					     sizeof(*mod->srcu_struct_ptrs),
2613 					     &mod->num_srcu_structs);
2614 #endif
2615 #ifdef CONFIG_BPF_EVENTS
2616 	mod->bpf_raw_events = section_objs(info, "__bpf_raw_tp_map",
2617 					   sizeof(*mod->bpf_raw_events),
2618 					   &mod->num_bpf_raw_events);
2619 #endif
2620 #ifdef CONFIG_DEBUG_INFO_BTF_MODULES
2621 	mod->btf_data = any_section_objs(info, ".BTF", 1, &mod->btf_data_size);
2622 	mod->btf_base_data = any_section_objs(info, ".BTF.base", 1,
2623 					      &mod->btf_base_data_size);
2624 #endif
2625 #ifdef CONFIG_JUMP_LABEL
2626 	mod->jump_entries = section_objs(info, "__jump_table",
2627 					sizeof(*mod->jump_entries),
2628 					&mod->num_jump_entries);
2629 #endif
2630 #ifdef CONFIG_EVENT_TRACING
2631 	mod->trace_events = section_objs(info, "_ftrace_events",
2632 					 sizeof(*mod->trace_events),
2633 					 &mod->num_trace_events);
2634 	mod->trace_evals = section_objs(info, "_ftrace_eval_map",
2635 					sizeof(*mod->trace_evals),
2636 					&mod->num_trace_evals);
2637 #endif
2638 #ifdef CONFIG_TRACING
2639 	mod->trace_bprintk_fmt_start = section_objs(info, "__trace_printk_fmt",
2640 					 sizeof(*mod->trace_bprintk_fmt_start),
2641 					 &mod->num_trace_bprintk_fmt);
2642 #endif
2643 #ifdef CONFIG_FTRACE_MCOUNT_RECORD
2644 	/* sechdrs[0].sh_size is always zero */
2645 	mod->ftrace_callsites = section_objs(info, FTRACE_CALLSITE_SECTION,
2646 					     sizeof(*mod->ftrace_callsites),
2647 					     &mod->num_ftrace_callsites);
2648 #endif
2649 #ifdef CONFIG_FUNCTION_ERROR_INJECTION
2650 	mod->ei_funcs = section_objs(info, "_error_injection_whitelist",
2651 					    sizeof(*mod->ei_funcs),
2652 					    &mod->num_ei_funcs);
2653 #endif
2654 #ifdef CONFIG_KPROBES
2655 	mod->kprobes_text_start = section_objs(info, ".kprobes.text", 1,
2656 						&mod->kprobes_text_size);
2657 	mod->kprobe_blacklist = section_objs(info, "_kprobe_blacklist",
2658 						sizeof(unsigned long),
2659 						&mod->num_kprobe_blacklist);
2660 #endif
2661 #ifdef CONFIG_PRINTK_INDEX
2662 	mod->printk_index_start = section_objs(info, ".printk_index",
2663 					       sizeof(*mod->printk_index_start),
2664 					       &mod->printk_index_size);
2665 #endif
2666 #ifdef CONFIG_HAVE_STATIC_CALL_INLINE
2667 	mod->static_call_sites = section_objs(info, ".static_call_sites",
2668 					      sizeof(*mod->static_call_sites),
2669 					      &mod->num_static_call_sites);
2670 #endif
2671 #if IS_ENABLED(CONFIG_KUNIT)
2672 	mod->kunit_suites = section_objs(info, ".kunit_test_suites",
2673 					      sizeof(*mod->kunit_suites),
2674 					      &mod->num_kunit_suites);
2675 	mod->kunit_init_suites = section_objs(info, ".kunit_init_test_suites",
2676 					      sizeof(*mod->kunit_init_suites),
2677 					      &mod->num_kunit_init_suites);
2678 #endif
2679 
2680 	mod->extable = section_objs(info, "__ex_table",
2681 				    sizeof(*mod->extable), &mod->num_exentries);
2682 
2683 	if (section_addr(info, "__obsparm"))
2684 		pr_warn("%s: Ignoring obsolete parameters\n", mod->name);
2685 
2686 #ifdef CONFIG_DYNAMIC_DEBUG_CORE
2687 	mod->dyndbg_info.descs = section_objs(info, "__dyndbg",
2688 					      sizeof(*mod->dyndbg_info.descs),
2689 					      &mod->dyndbg_info.num_descs);
2690 	mod->dyndbg_info.classes = section_objs(info, "__dyndbg_classes",
2691 						sizeof(*mod->dyndbg_info.classes),
2692 						&mod->dyndbg_info.num_classes);
2693 #endif
2694 
2695 	return 0;
2696 }
2697 
2698 static int move_module(struct module *mod, struct load_info *info)
2699 {
2700 	int i;
2701 	enum mod_mem_type t = 0;
2702 	int ret = -ENOMEM;
2703 	bool codetag_section_found = false;
2704 
2705 	for_each_mod_mem_type(type) {
2706 		if (!mod->mem[type].size) {
2707 			mod->mem[type].base = NULL;
2708 			continue;
2709 		}
2710 
2711 		ret = module_memory_alloc(mod, type);
2712 		if (ret) {
2713 			t = type;
2714 			goto out_err;
2715 		}
2716 	}
2717 
2718 	/* Transfer each section which specifies SHF_ALLOC */
2719 	pr_debug("Final section addresses for %s:\n", mod->name);
2720 	for (i = 0; i < info->hdr->e_shnum; i++) {
2721 		void *dest;
2722 		Elf_Shdr *shdr = &info->sechdrs[i];
2723 		const char *sname;
2724 
2725 		if (!(shdr->sh_flags & SHF_ALLOC))
2726 			continue;
2727 
2728 		sname = info->secstrings + shdr->sh_name;
2729 		/*
2730 		 * Load codetag sections separately as they might still be used
2731 		 * after module unload.
2732 		 */
2733 		if (codetag_needs_module_section(mod, sname, shdr->sh_size)) {
2734 			dest = codetag_alloc_module_section(mod, sname, shdr->sh_size,
2735 					arch_mod_section_prepend(mod, i), shdr->sh_addralign);
2736 			if (WARN_ON(!dest)) {
2737 				ret = -EINVAL;
2738 				goto out_err;
2739 			}
2740 			if (IS_ERR(dest)) {
2741 				ret = PTR_ERR(dest);
2742 				goto out_err;
2743 			}
2744 			codetag_section_found = true;
2745 		} else {
2746 			enum mod_mem_type type = shdr->sh_entsize >> SH_ENTSIZE_TYPE_SHIFT;
2747 			unsigned long offset = shdr->sh_entsize & SH_ENTSIZE_OFFSET_MASK;
2748 
2749 			dest = mod->mem[type].base + offset;
2750 		}
2751 
2752 		if (shdr->sh_type != SHT_NOBITS) {
2753 			/*
2754 			 * Our ELF checker already validated this, but let's
2755 			 * be pedantic and make the goal clearer. We actually
2756 			 * end up copying over all modifications made to the
2757 			 * userspace copy of the entire struct module.
2758 			 */
2759 			if (i == info->index.mod &&
2760 			   (WARN_ON_ONCE(shdr->sh_size != sizeof(struct module)))) {
2761 				ret = -ENOEXEC;
2762 				goto out_err;
2763 			}
2764 			memcpy(dest, (void *)shdr->sh_addr, shdr->sh_size);
2765 		}
2766 		/*
2767 		 * Update the userspace copy's ELF section address to point to
2768 		 * our newly allocated memory as a pure convenience so that
2769 		 * users of info can keep taking advantage and using the newly
2770 		 * minted official memory area.
2771 		 */
2772 		shdr->sh_addr = (unsigned long)dest;
2773 		pr_debug("\t0x%lx 0x%.8lx %s\n", (long)shdr->sh_addr,
2774 			 (long)shdr->sh_size, info->secstrings + shdr->sh_name);
2775 	}
2776 
2777 	return 0;
2778 out_err:
2779 	module_memory_restore_rox(mod);
2780 	for (t--; t >= 0; t--)
2781 		module_memory_free(mod, t);
2782 	if (codetag_section_found)
2783 		codetag_free_module_sections(mod);
2784 
2785 	return ret;
2786 }
2787 
2788 static int check_export_symbol_versions(struct module *mod)
2789 {
2790 #ifdef CONFIG_MODVERSIONS
2791 	if ((mod->num_syms && !mod->crcs) ||
2792 	    (mod->num_gpl_syms && !mod->gpl_crcs)) {
2793 		return try_to_force_load(mod,
2794 					 "no versions for exported symbols");
2795 	}
2796 #endif
2797 	return 0;
2798 }
2799 
2800 static void flush_module_icache(const struct module *mod)
2801 {
2802 	/*
2803 	 * Flush the instruction cache, since we've played with text.
2804 	 * Do it before processing of module parameters, so the module
2805 	 * can provide parameter accessor functions of its own.
2806 	 */
2807 	for_each_mod_mem_type(type) {
2808 		const struct module_memory *mod_mem = &mod->mem[type];
2809 
2810 		if (mod_mem->size) {
2811 			flush_icache_range((unsigned long)mod_mem->base,
2812 					   (unsigned long)mod_mem->base + mod_mem->size);
2813 		}
2814 	}
2815 }
2816 
2817 bool __weak module_elf_check_arch(Elf_Ehdr *hdr)
2818 {
2819 	return true;
2820 }
2821 
2822 int __weak module_frob_arch_sections(Elf_Ehdr *hdr,
2823 				     Elf_Shdr *sechdrs,
2824 				     char *secstrings,
2825 				     struct module *mod)
2826 {
2827 	return 0;
2828 }
2829 
2830 /* module_blacklist is a comma-separated list of module names */
2831 static char *module_blacklist;
2832 static bool blacklisted(const char *module_name)
2833 {
2834 	const char *p;
2835 	size_t len;
2836 
2837 	if (!module_blacklist)
2838 		return false;
2839 
2840 	for (p = module_blacklist; *p; p += len) {
2841 		len = strcspn(p, ",");
2842 		if (strlen(module_name) == len && !memcmp(module_name, p, len))
2843 			return true;
2844 		if (p[len] == ',')
2845 			len++;
2846 	}
2847 	return false;
2848 }
2849 core_param(module_blacklist, module_blacklist, charp, 0400);
2850 
2851 static struct module *layout_and_allocate(struct load_info *info, int flags)
2852 {
2853 	struct module *mod;
2854 	unsigned int ndx;
2855 	int err;
2856 
2857 	/* Allow arches to frob section contents and sizes.  */
2858 	err = module_frob_arch_sections(info->hdr, info->sechdrs,
2859 					info->secstrings, info->mod);
2860 	if (err < 0)
2861 		return ERR_PTR(err);
2862 
2863 	err = module_enforce_rwx_sections(info->hdr, info->sechdrs,
2864 					  info->secstrings, info->mod);
2865 	if (err < 0)
2866 		return ERR_PTR(err);
2867 
2868 	/* We will do a special allocation for per-cpu sections later. */
2869 	info->sechdrs[info->index.pcpu].sh_flags &= ~(unsigned long)SHF_ALLOC;
2870 
2871 	/*
2872 	 * Mark ro_after_init section with SHF_RO_AFTER_INIT so that
2873 	 * layout_sections() can put it in the right place.
2874 	 * Note: ro_after_init sections also have SHF_{WRITE,ALLOC} set.
2875 	 */
2876 	ndx = find_sec(info, ".data..ro_after_init");
2877 	if (ndx)
2878 		info->sechdrs[ndx].sh_flags |= SHF_RO_AFTER_INIT;
2879 	/*
2880 	 * Mark the __jump_table section as ro_after_init as well: these data
2881 	 * structures are never modified, with the exception of entries that
2882 	 * refer to code in the __init section, which are annotated as such
2883 	 * at module load time.
2884 	 */
2885 	ndx = find_sec(info, "__jump_table");
2886 	if (ndx)
2887 		info->sechdrs[ndx].sh_flags |= SHF_RO_AFTER_INIT;
2888 
2889 	/*
2890 	 * Determine total sizes, and put offsets in sh_entsize.  For now
2891 	 * this is done generically; there doesn't appear to be any
2892 	 * special cases for the architectures.
2893 	 */
2894 	layout_sections(info->mod, info);
2895 	layout_symtab(info->mod, info);
2896 
2897 	/* Allocate and move to the final place */
2898 	err = move_module(info->mod, info);
2899 	if (err)
2900 		return ERR_PTR(err);
2901 
2902 	/* Module has been copied to its final place now: return it. */
2903 	mod = (void *)info->sechdrs[info->index.mod].sh_addr;
2904 	kmemleak_load_module(mod, info);
2905 	codetag_module_replaced(info->mod, mod);
2906 
2907 	return mod;
2908 }
2909 
2910 /* mod is no longer valid after this! */
2911 static void module_deallocate(struct module *mod, struct load_info *info)
2912 {
2913 	percpu_modfree(mod);
2914 	module_arch_freeing_init(mod);
2915 
2916 	free_mod_mem(mod);
2917 }
2918 
2919 int __weak module_finalize(const Elf_Ehdr *hdr,
2920 			   const Elf_Shdr *sechdrs,
2921 			   struct module *me)
2922 {
2923 	return 0;
2924 }
2925 
2926 static int post_relocation(struct module *mod, const struct load_info *info)
2927 {
2928 	/* Sort exception table now relocations are done. */
2929 	sort_extable(mod->extable, mod->extable + mod->num_exentries);
2930 
2931 	/* Copy relocated percpu area over. */
2932 	percpu_modcopy(mod, (void *)info->sechdrs[info->index.pcpu].sh_addr,
2933 		       info->sechdrs[info->index.pcpu].sh_size);
2934 
2935 	/* Setup kallsyms-specific fields. */
2936 	add_kallsyms(mod, info);
2937 
2938 	/* Arch-specific module finalizing. */
2939 	return module_finalize(info->hdr, info->sechdrs, mod);
2940 }
2941 
2942 /* Call module constructors. */
2943 static void do_mod_ctors(struct module *mod)
2944 {
2945 #ifdef CONFIG_CONSTRUCTORS
2946 	unsigned long i;
2947 
2948 	for (i = 0; i < mod->num_ctors; i++)
2949 		mod->ctors[i]();
2950 #endif
2951 }
2952 
2953 /* For freeing module_init on success, in case kallsyms traversing */
2954 struct mod_initfree {
2955 	struct llist_node node;
2956 	void *init_text;
2957 	void *init_data;
2958 	void *init_rodata;
2959 };
2960 
2961 static void do_free_init(struct work_struct *w)
2962 {
2963 	struct llist_node *pos, *n, *list;
2964 	struct mod_initfree *initfree;
2965 
2966 	list = llist_del_all(&init_free_list);
2967 
2968 	synchronize_rcu();
2969 
2970 	llist_for_each_safe(pos, n, list) {
2971 		initfree = container_of(pos, struct mod_initfree, node);
2972 		execmem_free(initfree->init_text);
2973 		execmem_free(initfree->init_data);
2974 		execmem_free(initfree->init_rodata);
2975 		kfree(initfree);
2976 	}
2977 }
2978 
2979 void flush_module_init_free_work(void)
2980 {
2981 	flush_work(&init_free_wq);
2982 }
2983 
2984 #undef MODULE_PARAM_PREFIX
2985 #define MODULE_PARAM_PREFIX "module."
2986 /* Default value for module->async_probe_requested */
2987 static bool async_probe;
2988 module_param(async_probe, bool, 0644);
2989 
2990 /*
2991  * This is where the real work happens.
2992  *
2993  * Keep it uninlined to provide a reliable breakpoint target, e.g. for the gdb
2994  * helper command 'lx-symbols'.
2995  */
2996 static noinline int do_init_module(struct module *mod)
2997 {
2998 	int ret = 0;
2999 	struct mod_initfree *freeinit;
3000 #if defined(CONFIG_MODULE_STATS)
3001 	unsigned int text_size = 0, total_size = 0;
3002 
3003 	for_each_mod_mem_type(type) {
3004 		const struct module_memory *mod_mem = &mod->mem[type];
3005 		if (mod_mem->size) {
3006 			total_size += mod_mem->size;
3007 			if (type == MOD_TEXT || type == MOD_INIT_TEXT)
3008 				text_size += mod_mem->size;
3009 		}
3010 	}
3011 #endif
3012 
3013 	freeinit = kmalloc(sizeof(*freeinit), GFP_KERNEL);
3014 	if (!freeinit) {
3015 		ret = -ENOMEM;
3016 		goto fail;
3017 	}
3018 	freeinit->init_text = mod->mem[MOD_INIT_TEXT].base;
3019 	freeinit->init_data = mod->mem[MOD_INIT_DATA].base;
3020 	freeinit->init_rodata = mod->mem[MOD_INIT_RODATA].base;
3021 
3022 	do_mod_ctors(mod);
3023 	/* Start the module */
3024 	if (mod->init != NULL)
3025 		ret = do_one_initcall(mod->init);
3026 	if (ret < 0) {
3027 		goto fail_free_freeinit;
3028 	}
3029 	if (ret > 0) {
3030 		pr_warn("%s: '%s'->init suspiciously returned %d, it should "
3031 			"follow 0/-E convention\n"
3032 			"%s: loading module anyway...\n",
3033 			__func__, mod->name, ret, __func__);
3034 		dump_stack();
3035 	}
3036 
3037 	/* Now it's a first class citizen! */
3038 	mod->state = MODULE_STATE_LIVE;
3039 	blocking_notifier_call_chain(&module_notify_list,
3040 				     MODULE_STATE_LIVE, mod);
3041 
3042 	/* Delay uevent until module has finished its init routine */
3043 	kobject_uevent(&mod->mkobj.kobj, KOBJ_ADD);
3044 
3045 	/*
3046 	 * We need to finish all async code before the module init sequence
3047 	 * is done. This has potential to deadlock if synchronous module
3048 	 * loading is requested from async (which is not allowed!).
3049 	 *
3050 	 * See commit 0fdff3ec6d87 ("async, kmod: warn on synchronous
3051 	 * request_module() from async workers") for more details.
3052 	 */
3053 	if (!mod->async_probe_requested)
3054 		async_synchronize_full();
3055 
3056 	ftrace_free_mem(mod, mod->mem[MOD_INIT_TEXT].base,
3057 			mod->mem[MOD_INIT_TEXT].base + mod->mem[MOD_INIT_TEXT].size);
3058 	mutex_lock(&module_mutex);
3059 	/* Drop initial reference. */
3060 	module_put(mod);
3061 	trim_init_extable(mod);
3062 #ifdef CONFIG_KALLSYMS
3063 	/* Switch to core kallsyms now init is done: kallsyms may be walking! */
3064 	rcu_assign_pointer(mod->kallsyms, &mod->core_kallsyms);
3065 #endif
3066 	ret = module_enable_rodata_ro_after_init(mod);
3067 	if (ret)
3068 		pr_warn("%s: module_enable_rodata_ro_after_init() returned %d, "
3069 			"ro_after_init data might still be writable\n",
3070 			mod->name, ret);
3071 
3072 	mod_tree_remove_init(mod);
3073 	module_arch_freeing_init(mod);
3074 	for_class_mod_mem_type(type, init) {
3075 		mod->mem[type].base = NULL;
3076 		mod->mem[type].size = 0;
3077 	}
3078 
3079 #ifdef CONFIG_DEBUG_INFO_BTF_MODULES
3080 	/* .BTF is not SHF_ALLOC and will get removed, so sanitize pointers */
3081 	mod->btf_data = NULL;
3082 	mod->btf_base_data = NULL;
3083 #endif
3084 	/*
3085 	 * We want to free module_init, but be aware that kallsyms may be
3086 	 * walking this within an RCU read section. In all the failure paths, we
3087 	 * call synchronize_rcu(), but we don't want to slow down the success
3088 	 * path. execmem_free() cannot be called in an interrupt, so do the
3089 	 * work and call synchronize_rcu() in a work queue.
3090 	 *
3091 	 * Note that execmem_alloc() on most architectures creates W+X page
3092 	 * mappings which won't be cleaned up until do_free_init() runs.  Any
3093 	 * code such as mark_rodata_ro() which depends on those mappings to
3094 	 * be cleaned up needs to sync with the queued work by invoking
3095 	 * flush_module_init_free_work().
3096 	 */
3097 	if (llist_add(&freeinit->node, &init_free_list))
3098 		schedule_work(&init_free_wq);
3099 
3100 	mutex_unlock(&module_mutex);
3101 	wake_up_all(&module_wq);
3102 
3103 	mod_stat_add_long(text_size, &total_text_size);
3104 	mod_stat_add_long(total_size, &total_mod_size);
3105 
3106 	mod_stat_inc(&modcount);
3107 
3108 	return 0;
3109 
3110 fail_free_freeinit:
3111 	kfree(freeinit);
3112 fail:
3113 	/* Try to protect us from buggy refcounters. */
3114 	mod->state = MODULE_STATE_GOING;
3115 	synchronize_rcu();
3116 	module_put(mod);
3117 	blocking_notifier_call_chain(&module_notify_list,
3118 				     MODULE_STATE_GOING, mod);
3119 	klp_module_going(mod);
3120 	ftrace_release_mod(mod);
3121 	free_module(mod);
3122 	wake_up_all(&module_wq);
3123 
3124 	return ret;
3125 }
3126 
3127 static int may_init_module(void)
3128 {
3129 	if (!capable(CAP_SYS_MODULE) || modules_disabled)
3130 		return -EPERM;
3131 
3132 	return 0;
3133 }
3134 
3135 /* Is this module of this name done loading?  No locks held. */
3136 static bool finished_loading(const char *name)
3137 {
3138 	struct module *mod;
3139 	bool ret;
3140 
3141 	/*
3142 	 * The module_mutex should not be a heavily contended lock;
3143 	 * if we get the occasional sleep here, we'll go an extra iteration
3144 	 * in the wait_event_interruptible(), which is harmless.
3145 	 */
3146 	sched_annotate_sleep();
3147 	mutex_lock(&module_mutex);
3148 	mod = find_module_all(name, strlen(name), true);
3149 	ret = !mod || mod->state == MODULE_STATE_LIVE
3150 		|| mod->state == MODULE_STATE_GOING;
3151 	mutex_unlock(&module_mutex);
3152 
3153 	return ret;
3154 }
3155 
3156 /* Must be called with module_mutex held */
3157 static int module_patient_check_exists(const char *name,
3158 				       enum fail_dup_mod_reason reason)
3159 {
3160 	struct module *old;
3161 	int err = 0;
3162 
3163 	old = find_module_all(name, strlen(name), true);
3164 	if (old == NULL)
3165 		return 0;
3166 
3167 	if (old->state == MODULE_STATE_COMING ||
3168 	    old->state == MODULE_STATE_UNFORMED) {
3169 		/* Wait in case it fails to load. */
3170 		mutex_unlock(&module_mutex);
3171 		err = wait_event_interruptible(module_wq,
3172 				       finished_loading(name));
3173 		mutex_lock(&module_mutex);
3174 		if (err)
3175 			return err;
3176 
3177 		/* The module might have gone in the meantime. */
3178 		old = find_module_all(name, strlen(name), true);
3179 	}
3180 
3181 	if (try_add_failed_module(name, reason))
3182 		pr_warn("Could not add fail-tracking for module: %s\n", name);
3183 
3184 	/*
3185 	 * We are here only when the same module was being loaded. Do
3186 	 * not try to load it again right now. It prevents long delays
3187 	 * caused by serialized module load failures. It might happen
3188 	 * when more devices of the same type trigger load of
3189 	 * a particular module.
3190 	 */
3191 	if (old && old->state == MODULE_STATE_LIVE)
3192 		return -EEXIST;
3193 	return -EBUSY;
3194 }
3195 
3196 /*
3197  * We try to place it in the list now to make sure it's unique before
3198  * we dedicate too many resources.  In particular, temporary percpu
3199  * memory exhaustion.
3200  */
3201 static int add_unformed_module(struct module *mod)
3202 {
3203 	int err;
3204 
3205 	mod->state = MODULE_STATE_UNFORMED;
3206 
3207 	mutex_lock(&module_mutex);
3208 	err = module_patient_check_exists(mod->name, FAIL_DUP_MOD_LOAD);
3209 	if (err)
3210 		goto out;
3211 
3212 	mod_update_bounds(mod);
3213 	list_add_rcu(&mod->list, &modules);
3214 	mod_tree_insert(mod);
3215 	err = 0;
3216 
3217 out:
3218 	mutex_unlock(&module_mutex);
3219 	return err;
3220 }
3221 
3222 static int complete_formation(struct module *mod, struct load_info *info)
3223 {
3224 	int err;
3225 
3226 	mutex_lock(&module_mutex);
3227 
3228 	/* Find duplicate symbols (must be called under lock). */
3229 	err = verify_exported_symbols(mod);
3230 	if (err < 0)
3231 		goto out;
3232 
3233 	/* These rely on module_mutex for list integrity. */
3234 	module_bug_finalize(info->hdr, info->sechdrs, mod);
3235 	module_cfi_finalize(info->hdr, info->sechdrs, mod);
3236 
3237 	err = module_enable_rodata_ro(mod);
3238 	if (err)
3239 		goto out_strict_rwx;
3240 	err = module_enable_data_nx(mod);
3241 	if (err)
3242 		goto out_strict_rwx;
3243 	err = module_enable_text_rox(mod);
3244 	if (err)
3245 		goto out_strict_rwx;
3246 
3247 	/*
3248 	 * Mark state as coming so strong_try_module_get() ignores us,
3249 	 * but kallsyms etc. can see us.
3250 	 */
3251 	mod->state = MODULE_STATE_COMING;
3252 	mutex_unlock(&module_mutex);
3253 
3254 	return 0;
3255 
3256 out_strict_rwx:
3257 	module_bug_cleanup(mod);
3258 out:
3259 	mutex_unlock(&module_mutex);
3260 	return err;
3261 }
3262 
3263 static int prepare_coming_module(struct module *mod)
3264 {
3265 	int err;
3266 
3267 	ftrace_module_enable(mod);
3268 	err = klp_module_coming(mod);
3269 	if (err)
3270 		return err;
3271 
3272 	err = blocking_notifier_call_chain_robust(&module_notify_list,
3273 			MODULE_STATE_COMING, MODULE_STATE_GOING, mod);
3274 	err = notifier_to_errno(err);
3275 	if (err)
3276 		klp_module_going(mod);
3277 
3278 	return err;
3279 }
3280 
3281 static int unknown_module_param_cb(char *param, char *val, const char *modname,
3282 				   void *arg)
3283 {
3284 	struct module *mod = arg;
3285 	int ret;
3286 
3287 	if (strcmp(param, "async_probe") == 0) {
3288 		if (kstrtobool(val, &mod->async_probe_requested))
3289 			mod->async_probe_requested = true;
3290 		return 0;
3291 	}
3292 
3293 	/* Check for magic 'dyndbg' arg */
3294 	ret = ddebug_dyndbg_module_param_cb(param, val, modname);
3295 	if (ret != 0)
3296 		pr_warn("%s: unknown parameter '%s' ignored\n", modname, param);
3297 	return 0;
3298 }
3299 
3300 /* Module within temporary copy, this doesn't do any allocation  */
3301 static int early_mod_check(struct load_info *info, int flags)
3302 {
3303 	int err;
3304 
3305 	/*
3306 	 * Now that we know we have the correct module name, check
3307 	 * if it's blacklisted.
3308 	 */
3309 	if (blacklisted(info->name)) {
3310 		pr_err("Module %s is blacklisted\n", info->name);
3311 		return -EPERM;
3312 	}
3313 
3314 	err = rewrite_section_headers(info, flags);
3315 	if (err)
3316 		return err;
3317 
3318 	/* Check module struct version now, before we try to use module. */
3319 	if (!check_modstruct_version(info, info->mod))
3320 		return -ENOEXEC;
3321 
3322 	err = check_modinfo(info->mod, info, flags);
3323 	if (err)
3324 		return err;
3325 
3326 	mutex_lock(&module_mutex);
3327 	err = module_patient_check_exists(info->mod->name, FAIL_DUP_MOD_BECOMING);
3328 	mutex_unlock(&module_mutex);
3329 
3330 	return err;
3331 }
3332 
3333 /*
3334  * Allocate and load the module: note that size of section 0 is always
3335  * zero, and we rely on this for optional sections.
3336  */
3337 static int load_module(struct load_info *info, const char __user *uargs,
3338 		       int flags)
3339 {
3340 	struct module *mod;
3341 	bool module_allocated = false;
3342 	long err = 0;
3343 	char *after_dashes;
3344 
3345 	/*
3346 	 * Do the signature check (if any) first. All that
3347 	 * the signature check needs is info->len, it does
3348 	 * not need any of the section info. That can be
3349 	 * set up later. This will minimize the chances
3350 	 * of a corrupt module causing problems before
3351 	 * we even get to the signature check.
3352 	 *
3353 	 * The check will also adjust info->len by stripping
3354 	 * off the sig length at the end of the module, making
3355 	 * checks against info->len more correct.
3356 	 */
3357 	err = module_sig_check(info, flags);
3358 	if (err)
3359 		goto free_copy;
3360 
3361 	/*
3362 	 * Do basic sanity checks against the ELF header and
3363 	 * sections. Cache useful sections and set the
3364 	 * info->mod to the userspace passed struct module.
3365 	 */
3366 	err = elf_validity_cache_copy(info, flags);
3367 	if (err)
3368 		goto free_copy;
3369 
3370 	err = early_mod_check(info, flags);
3371 	if (err)
3372 		goto free_copy;
3373 
3374 	/* Figure out module layout, and allocate all the memory. */
3375 	mod = layout_and_allocate(info, flags);
3376 	if (IS_ERR(mod)) {
3377 		err = PTR_ERR(mod);
3378 		goto free_copy;
3379 	}
3380 
3381 	module_allocated = true;
3382 
3383 	audit_log_kern_module(mod->name);
3384 
3385 	/* Reserve our place in the list. */
3386 	err = add_unformed_module(mod);
3387 	if (err)
3388 		goto free_module;
3389 
3390 	/*
3391 	 * We are tainting your kernel if your module gets into
3392 	 * the modules linked list somehow.
3393 	 */
3394 	module_augment_kernel_taints(mod, info);
3395 
3396 	/* To avoid stressing percpu allocator, do this once we're unique. */
3397 	err = percpu_modalloc(mod, info);
3398 	if (err)
3399 		goto unlink_mod;
3400 
3401 	/* Now module is in final location, initialize linked lists, etc. */
3402 	err = module_unload_init(mod);
3403 	if (err)
3404 		goto unlink_mod;
3405 
3406 	init_param_lock(mod);
3407 
3408 	/*
3409 	 * Now we've got everything in the final locations, we can
3410 	 * find optional sections.
3411 	 */
3412 	err = find_module_sections(mod, info);
3413 	if (err)
3414 		goto free_unload;
3415 
3416 	err = check_export_symbol_versions(mod);
3417 	if (err)
3418 		goto free_unload;
3419 
3420 	/* Set up MODINFO_ATTR fields */
3421 	err = setup_modinfo(mod, info);
3422 	if (err)
3423 		goto free_modinfo;
3424 
3425 	/* Fix up syms, so that st_value is a pointer to location. */
3426 	err = simplify_symbols(mod, info);
3427 	if (err < 0)
3428 		goto free_modinfo;
3429 
3430 	err = apply_relocations(mod, info);
3431 	if (err < 0)
3432 		goto free_modinfo;
3433 
3434 	err = post_relocation(mod, info);
3435 	if (err < 0)
3436 		goto free_modinfo;
3437 
3438 	flush_module_icache(mod);
3439 
3440 	/* Now copy in args */
3441 	mod->args = strndup_user(uargs, ~0UL >> 1);
3442 	if (IS_ERR(mod->args)) {
3443 		err = PTR_ERR(mod->args);
3444 		goto free_arch_cleanup;
3445 	}
3446 
3447 	init_build_id(mod, info);
3448 
3449 	/* Ftrace init must be called in the MODULE_STATE_UNFORMED state */
3450 	ftrace_module_init(mod);
3451 
3452 	/* Finally it's fully formed, ready to start executing. */
3453 	err = complete_formation(mod, info);
3454 	if (err)
3455 		goto ddebug_cleanup;
3456 
3457 	err = prepare_coming_module(mod);
3458 	if (err)
3459 		goto bug_cleanup;
3460 
3461 	mod->async_probe_requested = async_probe;
3462 
3463 	/* Module is ready to execute: parsing args may do that. */
3464 	after_dashes = parse_args(mod->name, mod->args, mod->kp, mod->num_kp,
3465 				  -32768, 32767, mod,
3466 				  unknown_module_param_cb);
3467 	if (IS_ERR(after_dashes)) {
3468 		err = PTR_ERR(after_dashes);
3469 		goto coming_cleanup;
3470 	} else if (after_dashes) {
3471 		pr_warn("%s: parameters '%s' after `--' ignored\n",
3472 		       mod->name, after_dashes);
3473 	}
3474 
3475 	/* Link in to sysfs. */
3476 	err = mod_sysfs_setup(mod, info, mod->kp, mod->num_kp);
3477 	if (err < 0)
3478 		goto coming_cleanup;
3479 
3480 	if (is_livepatch_module(mod)) {
3481 		err = copy_module_elf(mod, info);
3482 		if (err < 0)
3483 			goto sysfs_cleanup;
3484 	}
3485 
3486 	/* Get rid of temporary copy. */
3487 	free_copy(info, flags);
3488 
3489 	codetag_load_module(mod);
3490 
3491 	/* Done! */
3492 	trace_module_load(mod);
3493 
3494 	return do_init_module(mod);
3495 
3496  sysfs_cleanup:
3497 	mod_sysfs_teardown(mod);
3498  coming_cleanup:
3499 	mod->state = MODULE_STATE_GOING;
3500 	destroy_params(mod->kp, mod->num_kp);
3501 	blocking_notifier_call_chain(&module_notify_list,
3502 				     MODULE_STATE_GOING, mod);
3503 	klp_module_going(mod);
3504  bug_cleanup:
3505 	mod->state = MODULE_STATE_GOING;
3506 	/* module_bug_cleanup needs module_mutex protection */
3507 	mutex_lock(&module_mutex);
3508 	module_bug_cleanup(mod);
3509 	mutex_unlock(&module_mutex);
3510 
3511  ddebug_cleanup:
3512 	ftrace_release_mod(mod);
3513 	synchronize_rcu();
3514 	kfree(mod->args);
3515  free_arch_cleanup:
3516 	module_arch_cleanup(mod);
3517  free_modinfo:
3518 	free_modinfo(mod);
3519  free_unload:
3520 	module_unload_free(mod);
3521  unlink_mod:
3522 	mutex_lock(&module_mutex);
3523 	/* Unlink carefully: kallsyms could be walking list. */
3524 	list_del_rcu(&mod->list);
3525 	mod_tree_remove(mod);
3526 	wake_up_all(&module_wq);
3527 	/* Wait for RCU-sched synchronizing before releasing mod->list. */
3528 	synchronize_rcu();
3529 	mutex_unlock(&module_mutex);
3530  free_module:
3531 	mod_stat_bump_invalid(info, flags);
3532 	/* Free lock-classes; relies on the preceding sync_rcu() */
3533 	for_class_mod_mem_type(type, core_data) {
3534 		lockdep_free_key_range(mod->mem[type].base,
3535 				       mod->mem[type].size);
3536 	}
3537 
3538 	module_memory_restore_rox(mod);
3539 	module_deallocate(mod, info);
3540  free_copy:
3541 	/*
3542 	 * The info->len is always set. We distinguish between
3543 	 * failures once the proper module was allocated and
3544 	 * before that.
3545 	 */
3546 	if (!module_allocated)
3547 		mod_stat_bump_becoming(info, flags);
3548 	free_copy(info, flags);
3549 	return err;
3550 }
3551 
3552 SYSCALL_DEFINE3(init_module, void __user *, umod,
3553 		unsigned long, len, const char __user *, uargs)
3554 {
3555 	int err;
3556 	struct load_info info = { };
3557 
3558 	err = may_init_module();
3559 	if (err)
3560 		return err;
3561 
3562 	pr_debug("init_module: umod=%p, len=%lu, uargs=%p\n",
3563 	       umod, len, uargs);
3564 
3565 	err = copy_module_from_user(umod, len, &info);
3566 	if (err) {
3567 		mod_stat_inc(&failed_kreads);
3568 		mod_stat_add_long(len, &invalid_kread_bytes);
3569 		return err;
3570 	}
3571 
3572 	return load_module(&info, uargs, 0);
3573 }
3574 
3575 struct idempotent {
3576 	const void *cookie;
3577 	struct hlist_node entry;
3578 	struct completion complete;
3579 	int ret;
3580 };
3581 
3582 #define IDEM_HASH_BITS 8
3583 static struct hlist_head idem_hash[1 << IDEM_HASH_BITS];
3584 static DEFINE_SPINLOCK(idem_lock);
3585 
3586 static bool idempotent(struct idempotent *u, const void *cookie)
3587 {
3588 	int hash = hash_ptr(cookie, IDEM_HASH_BITS);
3589 	struct hlist_head *head = idem_hash + hash;
3590 	struct idempotent *existing;
3591 	bool first;
3592 
3593 	u->ret = -EINTR;
3594 	u->cookie = cookie;
3595 	init_completion(&u->complete);
3596 
3597 	spin_lock(&idem_lock);
3598 	first = true;
3599 	hlist_for_each_entry(existing, head, entry) {
3600 		if (existing->cookie != cookie)
3601 			continue;
3602 		first = false;
3603 		break;
3604 	}
3605 	hlist_add_head(&u->entry, idem_hash + hash);
3606 	spin_unlock(&idem_lock);
3607 
3608 	return !first;
3609 }
3610 
3611 /*
3612  * We were the first one with 'cookie' on the list, and we ended
3613  * up completing the operation. We now need to walk the list,
3614  * remove everybody - which includes ourselves - fill in the return
3615  * value, and then complete the operation.
3616  */
3617 static int idempotent_complete(struct idempotent *u, int ret)
3618 {
3619 	const void *cookie = u->cookie;
3620 	int hash = hash_ptr(cookie, IDEM_HASH_BITS);
3621 	struct hlist_head *head = idem_hash + hash;
3622 	struct hlist_node *next;
3623 	struct idempotent *pos;
3624 
3625 	spin_lock(&idem_lock);
3626 	hlist_for_each_entry_safe(pos, next, head, entry) {
3627 		if (pos->cookie != cookie)
3628 			continue;
3629 		hlist_del_init(&pos->entry);
3630 		pos->ret = ret;
3631 		complete(&pos->complete);
3632 	}
3633 	spin_unlock(&idem_lock);
3634 	return ret;
3635 }
3636 
3637 /*
3638  * Wait for the idempotent worker.
3639  *
3640  * If we get interrupted, we need to remove ourselves from the
3641  * the idempotent list, and the completion may still come in.
3642  *
3643  * The 'idem_lock' protects against the race, and 'idem.ret' was
3644  * initialized to -EINTR and is thus always the right return
3645  * value even if the idempotent work then completes between
3646  * the wait_for_completion and the cleanup.
3647  */
3648 static int idempotent_wait_for_completion(struct idempotent *u)
3649 {
3650 	if (wait_for_completion_interruptible(&u->complete)) {
3651 		spin_lock(&idem_lock);
3652 		if (!hlist_unhashed(&u->entry))
3653 			hlist_del(&u->entry);
3654 		spin_unlock(&idem_lock);
3655 	}
3656 	return u->ret;
3657 }
3658 
3659 static int init_module_from_file(struct file *f, const char __user * uargs, int flags)
3660 {
3661 	struct load_info info = { };
3662 	void *buf = NULL;
3663 	int len;
3664 
3665 	len = kernel_read_file(f, 0, &buf, INT_MAX, NULL, READING_MODULE);
3666 	if (len < 0) {
3667 		mod_stat_inc(&failed_kreads);
3668 		return len;
3669 	}
3670 
3671 	if (flags & MODULE_INIT_COMPRESSED_FILE) {
3672 		int err = module_decompress(&info, buf, len);
3673 		vfree(buf); /* compressed data is no longer needed */
3674 		if (err) {
3675 			mod_stat_inc(&failed_decompress);
3676 			mod_stat_add_long(len, &invalid_decompress_bytes);
3677 			return err;
3678 		}
3679 	} else {
3680 		info.hdr = buf;
3681 		info.len = len;
3682 	}
3683 
3684 	return load_module(&info, uargs, flags);
3685 }
3686 
3687 static int idempotent_init_module(struct file *f, const char __user * uargs, int flags)
3688 {
3689 	struct idempotent idem;
3690 
3691 	if (!(f->f_mode & FMODE_READ))
3692 		return -EBADF;
3693 
3694 	/* Are we the winners of the race and get to do this? */
3695 	if (!idempotent(&idem, file_inode(f))) {
3696 		int ret = init_module_from_file(f, uargs, flags);
3697 		return idempotent_complete(&idem, ret);
3698 	}
3699 
3700 	/*
3701 	 * Somebody else won the race and is loading the module.
3702 	 */
3703 	return idempotent_wait_for_completion(&idem);
3704 }
3705 
3706 SYSCALL_DEFINE3(finit_module, int, fd, const char __user *, uargs, int, flags)
3707 {
3708 	int err = may_init_module();
3709 	if (err)
3710 		return err;
3711 
3712 	pr_debug("finit_module: fd=%d, uargs=%p, flags=%i\n", fd, uargs, flags);
3713 
3714 	if (flags & ~(MODULE_INIT_IGNORE_MODVERSIONS
3715 		      |MODULE_INIT_IGNORE_VERMAGIC
3716 		      |MODULE_INIT_COMPRESSED_FILE))
3717 		return -EINVAL;
3718 
3719 	CLASS(fd, f)(fd);
3720 	if (fd_empty(f))
3721 		return -EBADF;
3722 	return idempotent_init_module(fd_file(f), uargs, flags);
3723 }
3724 
3725 /* Keep in sync with MODULE_FLAGS_BUF_SIZE !!! */
3726 char *module_flags(struct module *mod, char *buf, bool show_state)
3727 {
3728 	int bx = 0;
3729 
3730 	BUG_ON(mod->state == MODULE_STATE_UNFORMED);
3731 	if (!mod->taints && !show_state)
3732 		goto out;
3733 	if (mod->taints ||
3734 	    mod->state == MODULE_STATE_GOING ||
3735 	    mod->state == MODULE_STATE_COMING) {
3736 		buf[bx++] = '(';
3737 		bx += module_flags_taint(mod->taints, buf + bx);
3738 		/* Show a - for module-is-being-unloaded */
3739 		if (mod->state == MODULE_STATE_GOING && show_state)
3740 			buf[bx++] = '-';
3741 		/* Show a + for module-is-being-loaded */
3742 		if (mod->state == MODULE_STATE_COMING && show_state)
3743 			buf[bx++] = '+';
3744 		buf[bx++] = ')';
3745 	}
3746 out:
3747 	buf[bx] = '\0';
3748 
3749 	return buf;
3750 }
3751 
3752 /* Given an address, look for it in the module exception tables. */
3753 const struct exception_table_entry *search_module_extables(unsigned long addr)
3754 {
3755 	struct module *mod;
3756 
3757 	guard(rcu)();
3758 	mod = __module_address(addr);
3759 	if (!mod)
3760 		return NULL;
3761 
3762 	if (!mod->num_exentries)
3763 		return NULL;
3764 	/*
3765 	 * The address passed here belongs to a module that is currently
3766 	 * invoked (we are running inside it). Therefore its module::refcnt
3767 	 * needs already be >0 to ensure that it is not removed at this stage.
3768 	 * All other user need to invoke this function within a RCU read
3769 	 * section.
3770 	 */
3771 	return search_extable(mod->extable, mod->num_exentries, addr);
3772 }
3773 
3774 /**
3775  * is_module_address() - is this address inside a module?
3776  * @addr: the address to check.
3777  *
3778  * See is_module_text_address() if you simply want to see if the address
3779  * is code (not data).
3780  */
3781 bool is_module_address(unsigned long addr)
3782 {
3783 	guard(rcu)();
3784 	return __module_address(addr) != NULL;
3785 }
3786 
3787 /**
3788  * __module_address() - get the module which contains an address.
3789  * @addr: the address.
3790  *
3791  * Must be called within RCU read section or module mutex held so that
3792  * module doesn't get freed during this.
3793  */
3794 struct module *__module_address(unsigned long addr)
3795 {
3796 	struct module *mod;
3797 
3798 	if (addr >= mod_tree.addr_min && addr <= mod_tree.addr_max)
3799 		goto lookup;
3800 
3801 #ifdef CONFIG_ARCH_WANTS_MODULES_DATA_IN_VMALLOC
3802 	if (addr >= mod_tree.data_addr_min && addr <= mod_tree.data_addr_max)
3803 		goto lookup;
3804 #endif
3805 
3806 	return NULL;
3807 
3808 lookup:
3809 	mod = mod_find(addr, &mod_tree);
3810 	if (mod) {
3811 		BUG_ON(!within_module(addr, mod));
3812 		if (mod->state == MODULE_STATE_UNFORMED)
3813 			mod = NULL;
3814 	}
3815 	return mod;
3816 }
3817 
3818 /**
3819  * is_module_text_address() - is this address inside module code?
3820  * @addr: the address to check.
3821  *
3822  * See is_module_address() if you simply want to see if the address is
3823  * anywhere in a module.  See kernel_text_address() for testing if an
3824  * address corresponds to kernel or module code.
3825  */
3826 bool is_module_text_address(unsigned long addr)
3827 {
3828 	guard(rcu)();
3829 	return __module_text_address(addr) != NULL;
3830 }
3831 
3832 void module_for_each_mod(int(*func)(struct module *mod, void *data), void *data)
3833 {
3834 	struct module *mod;
3835 
3836 	guard(rcu)();
3837 	list_for_each_entry_rcu(mod, &modules, list) {
3838 		if (mod->state == MODULE_STATE_UNFORMED)
3839 			continue;
3840 		if (func(mod, data))
3841 			break;
3842 	}
3843 }
3844 
3845 /**
3846  * __module_text_address() - get the module whose code contains an address.
3847  * @addr: the address.
3848  *
3849  * Must be called within RCU read section or module mutex held so that
3850  * module doesn't get freed during this.
3851  */
3852 struct module *__module_text_address(unsigned long addr)
3853 {
3854 	struct module *mod = __module_address(addr);
3855 	if (mod) {
3856 		/* Make sure it's within the text section. */
3857 		if (!within_module_mem_type(addr, mod, MOD_TEXT) &&
3858 		    !within_module_mem_type(addr, mod, MOD_INIT_TEXT))
3859 			mod = NULL;
3860 	}
3861 	return mod;
3862 }
3863 
3864 /* Don't grab lock, we're oopsing. */
3865 void print_modules(void)
3866 {
3867 	struct module *mod;
3868 	char buf[MODULE_FLAGS_BUF_SIZE];
3869 
3870 	printk(KERN_DEFAULT "Modules linked in:");
3871 	/* Most callers should already have preempt disabled, but make sure */
3872 	guard(rcu)();
3873 	list_for_each_entry_rcu(mod, &modules, list) {
3874 		if (mod->state == MODULE_STATE_UNFORMED)
3875 			continue;
3876 		pr_cont(" %s%s", mod->name, module_flags(mod, buf, true));
3877 	}
3878 
3879 	print_unloaded_tainted_modules();
3880 	if (last_unloaded_module.name[0])
3881 		pr_cont(" [last unloaded: %s%s]", last_unloaded_module.name,
3882 			last_unloaded_module.taints);
3883 	pr_cont("\n");
3884 }
3885 
3886 #ifdef CONFIG_MODULE_DEBUGFS
3887 struct dentry *mod_debugfs_root;
3888 
3889 static int module_debugfs_init(void)
3890 {
3891 	mod_debugfs_root = debugfs_create_dir("modules", NULL);
3892 	return 0;
3893 }
3894 module_init(module_debugfs_init);
3895 #endif
3896