xref: /linux/fs/proc/generic.c (revision 260f6f4fda93c8485c8037865c941b42b9cba5d2)
1 // SPDX-License-Identifier: GPL-2.0-only
2 /*
3  * proc/fs/generic.c --- generic routines for the proc-fs
4  *
5  * This file contains generic proc-fs routines for handling
6  * directories and files.
7  *
8  * Copyright (C) 1991, 1992 Linus Torvalds.
9  * Copyright (C) 1997 Theodore Ts'o
10  */
11 
12 #include <linux/cache.h>
13 #include <linux/errno.h>
14 #include <linux/time.h>
15 #include <linux/proc_fs.h>
16 #include <linux/stat.h>
17 #include <linux/mm.h>
18 #include <linux/module.h>
19 #include <linux/namei.h>
20 #include <linux/slab.h>
21 #include <linux/printk.h>
22 #include <linux/mount.h>
23 #include <linux/init.h>
24 #include <linux/idr.h>
25 #include <linux/bitops.h>
26 #include <linux/spinlock.h>
27 #include <linux/completion.h>
28 #include <linux/uaccess.h>
29 #include <linux/seq_file.h>
30 
31 #include "internal.h"
32 
33 static DEFINE_RWLOCK(proc_subdir_lock);
34 
35 struct kmem_cache *proc_dir_entry_cache __ro_after_init;
36 
37 void pde_free(struct proc_dir_entry *pde)
38 {
39 	if (S_ISLNK(pde->mode))
40 		kfree(pde->data);
41 	if (pde->name != pde->inline_name)
42 		kfree(pde->name);
43 	kmem_cache_free(proc_dir_entry_cache, pde);
44 }
45 
46 static int proc_match(const char *name, struct proc_dir_entry *de, unsigned int len)
47 {
48 	if (len < de->namelen)
49 		return -1;
50 	if (len > de->namelen)
51 		return 1;
52 
53 	return memcmp(name, de->name, len);
54 }
55 
56 static struct proc_dir_entry *pde_subdir_first(struct proc_dir_entry *dir)
57 {
58 	return rb_entry_safe(rb_first(&dir->subdir), struct proc_dir_entry,
59 			     subdir_node);
60 }
61 
62 static struct proc_dir_entry *pde_subdir_next(struct proc_dir_entry *dir)
63 {
64 	return rb_entry_safe(rb_next(&dir->subdir_node), struct proc_dir_entry,
65 			     subdir_node);
66 }
67 
68 static struct proc_dir_entry *pde_subdir_find(struct proc_dir_entry *dir,
69 					      const char *name,
70 					      unsigned int len)
71 {
72 	struct rb_node *node = dir->subdir.rb_node;
73 
74 	while (node) {
75 		struct proc_dir_entry *de = rb_entry(node,
76 						     struct proc_dir_entry,
77 						     subdir_node);
78 		int result = proc_match(name, de, len);
79 
80 		if (result < 0)
81 			node = node->rb_left;
82 		else if (result > 0)
83 			node = node->rb_right;
84 		else
85 			return de;
86 	}
87 	return NULL;
88 }
89 
90 static bool pde_subdir_insert(struct proc_dir_entry *dir,
91 			      struct proc_dir_entry *de)
92 {
93 	struct rb_root *root = &dir->subdir;
94 	struct rb_node **new = &root->rb_node, *parent = NULL;
95 
96 	/* Figure out where to put new node */
97 	while (*new) {
98 		struct proc_dir_entry *this = rb_entry(*new,
99 						       struct proc_dir_entry,
100 						       subdir_node);
101 		int result = proc_match(de->name, this, de->namelen);
102 
103 		parent = *new;
104 		if (result < 0)
105 			new = &(*new)->rb_left;
106 		else if (result > 0)
107 			new = &(*new)->rb_right;
108 		else
109 			return false;
110 	}
111 
112 	/* Add new node and rebalance tree. */
113 	rb_link_node(&de->subdir_node, parent, new);
114 	rb_insert_color(&de->subdir_node, root);
115 	return true;
116 }
117 
118 static int proc_notify_change(struct mnt_idmap *idmap,
119 			      struct dentry *dentry, struct iattr *iattr)
120 {
121 	struct inode *inode = d_inode(dentry);
122 	struct proc_dir_entry *de = PDE(inode);
123 	int error;
124 
125 	error = setattr_prepare(&nop_mnt_idmap, dentry, iattr);
126 	if (error)
127 		return error;
128 
129 	setattr_copy(&nop_mnt_idmap, inode, iattr);
130 
131 	proc_set_user(de, inode->i_uid, inode->i_gid);
132 	de->mode = inode->i_mode;
133 	return 0;
134 }
135 
136 static int proc_getattr(struct mnt_idmap *idmap,
137 			const struct path *path, struct kstat *stat,
138 			u32 request_mask, unsigned int query_flags)
139 {
140 	struct inode *inode = d_inode(path->dentry);
141 	struct proc_dir_entry *de = PDE(inode);
142 	if (de) {
143 		nlink_t nlink = READ_ONCE(de->nlink);
144 		if (nlink > 0) {
145 			set_nlink(inode, nlink);
146 		}
147 	}
148 
149 	generic_fillattr(&nop_mnt_idmap, request_mask, inode, stat);
150 	return 0;
151 }
152 
153 static const struct inode_operations proc_file_inode_operations = {
154 	.setattr	= proc_notify_change,
155 };
156 
157 /*
158  * This function parses a name such as "tty/driver/serial", and
159  * returns the struct proc_dir_entry for "/proc/tty/driver", and
160  * returns "serial" in residual.
161  */
162 static int __xlate_proc_name(const char *name, struct proc_dir_entry **ret,
163 			     const char **residual)
164 {
165 	const char     		*cp = name, *next;
166 	struct proc_dir_entry	*de;
167 
168 	de = *ret ?: &proc_root;
169 	while ((next = strchr(cp, '/')) != NULL) {
170 		de = pde_subdir_find(de, cp, next - cp);
171 		if (!de) {
172 			WARN(1, "name '%s'\n", name);
173 			return -ENOENT;
174 		}
175 		cp = next + 1;
176 	}
177 	*residual = cp;
178 	*ret = de;
179 	return 0;
180 }
181 
182 static int xlate_proc_name(const char *name, struct proc_dir_entry **ret,
183 			   const char **residual)
184 {
185 	int rv;
186 
187 	read_lock(&proc_subdir_lock);
188 	rv = __xlate_proc_name(name, ret, residual);
189 	read_unlock(&proc_subdir_lock);
190 	return rv;
191 }
192 
/* ID allocator behind proc_alloc_inum() / proc_free_inum(). */
static DEFINE_IDA(proc_inum_ida);

/* Offset added to an allocated ID to form the inode number. */
#define PROC_DYNAMIC_FIRST 0xF0000000U
196 
197 /*
198  * Return an inode number between PROC_DYNAMIC_FIRST and
199  * 0xffffffff, or zero on failure.
200  */
201 int proc_alloc_inum(unsigned int *inum)
202 {
203 	int i;
204 
205 	i = ida_alloc_max(&proc_inum_ida, UINT_MAX - PROC_DYNAMIC_FIRST,
206 			  GFP_KERNEL);
207 	if (i < 0)
208 		return i;
209 
210 	*inum = PROC_DYNAMIC_FIRST + (unsigned int)i;
211 	return 0;
212 }
213 
214 void proc_free_inum(unsigned int inum)
215 {
216 	ida_free(&proc_inum_ida, inum - PROC_DYNAMIC_FIRST);
217 }
218 
219 static int proc_misc_d_revalidate(struct inode *dir, const struct qstr *name,
220 				  struct dentry *dentry, unsigned int flags)
221 {
222 	if (flags & LOOKUP_RCU)
223 		return -ECHILD;
224 
225 	if (atomic_read(&PDE(d_inode(dentry))->in_use) < 0)
226 		return 0; /* revalidate */
227 	return 1;
228 }
229 
230 static int proc_misc_d_delete(const struct dentry *dentry)
231 {
232 	return atomic_read(&PDE(d_inode(dentry))->in_use) < 0;
233 }
234 
235 static const struct dentry_operations proc_misc_dentry_ops = {
236 	.d_revalidate	= proc_misc_d_revalidate,
237 	.d_delete	= proc_misc_d_delete,
238 };
239 
240 /*
241  * Don't create negative dentries here, return -ENOENT by hand
242  * instead.
243  */
244 struct dentry *proc_lookup_de(struct inode *dir, struct dentry *dentry,
245 			      struct proc_dir_entry *de)
246 {
247 	struct inode *inode;
248 
249 	read_lock(&proc_subdir_lock);
250 	de = pde_subdir_find(de, dentry->d_name.name, dentry->d_name.len);
251 	if (de) {
252 		pde_get(de);
253 		read_unlock(&proc_subdir_lock);
254 		inode = proc_get_inode(dir->i_sb, de);
255 		if (!inode)
256 			return ERR_PTR(-ENOMEM);
257 		if (de->flags & PROC_ENTRY_FORCE_LOOKUP)
258 			return d_splice_alias_ops(inode, dentry,
259 						  &proc_net_dentry_ops);
260 		return d_splice_alias_ops(inode, dentry,
261 					  &proc_misc_dentry_ops);
262 	}
263 	read_unlock(&proc_subdir_lock);
264 	return ERR_PTR(-ENOENT);
265 }
266 
267 struct dentry *proc_lookup(struct inode *dir, struct dentry *dentry,
268 		unsigned int flags)
269 {
270 	struct proc_fs_info *fs_info = proc_sb_info(dir->i_sb);
271 
272 	if (fs_info->pidonly == PROC_PIDONLY_ON)
273 		return ERR_PTR(-ENOENT);
274 
275 	return proc_lookup_de(dir, dentry, PDE(dir));
276 }
277 
278 /*
279  * This returns non-zero if at EOF, so that the /proc
280  * root directory can use this and check if it should
281  * continue with the <pid> entries..
282  *
283  * Note that the VFS-layer doesn't care about the return
284  * value of the readdir() call, as long as it's non-negative
285  * for success..
286  */
287 int proc_readdir_de(struct file *file, struct dir_context *ctx,
288 		    struct proc_dir_entry *de)
289 {
290 	int i;
291 
292 	if (!dir_emit_dots(file, ctx))
293 		return 0;
294 
295 	i = ctx->pos - 2;
296 	read_lock(&proc_subdir_lock);
297 	de = pde_subdir_first(de);
298 	for (;;) {
299 		if (!de) {
300 			read_unlock(&proc_subdir_lock);
301 			return 0;
302 		}
303 		if (!i)
304 			break;
305 		de = pde_subdir_next(de);
306 		i--;
307 	}
308 
309 	do {
310 		struct proc_dir_entry *next;
311 		pde_get(de);
312 		read_unlock(&proc_subdir_lock);
313 		if (!dir_emit(ctx, de->name, de->namelen,
314 			    de->low_ino, de->mode >> 12)) {
315 			pde_put(de);
316 			return 0;
317 		}
318 		ctx->pos++;
319 		read_lock(&proc_subdir_lock);
320 		next = pde_subdir_next(de);
321 		pde_put(de);
322 		de = next;
323 	} while (de);
324 	read_unlock(&proc_subdir_lock);
325 	return 1;
326 }
327 
328 int proc_readdir(struct file *file, struct dir_context *ctx)
329 {
330 	struct inode *inode = file_inode(file);
331 	struct proc_fs_info *fs_info = proc_sb_info(inode->i_sb);
332 
333 	if (fs_info->pidonly == PROC_PIDONLY_ON)
334 		return 1;
335 
336 	return proc_readdir_de(file, ctx, PDE(inode));
337 }
338 
339 /*
340  * These are the generic /proc directory operations. They
341  * use the in-memory "struct proc_dir_entry" tree to parse
342  * the /proc directory.
343  */
344 static const struct file_operations proc_dir_operations = {
345 	.llseek			= generic_file_llseek,
346 	.read			= generic_read_dir,
347 	.iterate_shared		= proc_readdir,
348 };
349 
/*
 * ->d_revalidate for PROC_ENTRY_FORCE_LOOKUP entries: unconditionally
 * returns 0, the value proc_misc_d_revalidate() uses for "revalidate".
 * None of the arguments is inspected.
 */
static int proc_net_d_revalidate(struct inode *dir, const struct qstr *name,
				 struct dentry *dentry, unsigned int flags)
{
	return 0;
}
355 
356 const struct dentry_operations proc_net_dentry_ops = {
357 	.d_revalidate	= proc_net_d_revalidate,
358 	.d_delete	= always_delete_dentry,
359 };
360 
361 /*
362  * proc directories can do almost nothing..
363  */
364 static const struct inode_operations proc_dir_inode_operations = {
365 	.lookup		= proc_lookup,
366 	.getattr	= proc_getattr,
367 	.setattr	= proc_notify_change,
368 };
369 
370 /* returns the registered entry, or frees dp and returns NULL on failure */
371 struct proc_dir_entry *proc_register(struct proc_dir_entry *dir,
372 		struct proc_dir_entry *dp)
373 {
374 	if (proc_alloc_inum(&dp->low_ino))
375 		goto out_free_entry;
376 
377 	write_lock(&proc_subdir_lock);
378 	dp->parent = dir;
379 	if (pde_subdir_insert(dir, dp) == false) {
380 		WARN(1, "proc_dir_entry '%s/%s' already registered\n",
381 		     dir->name, dp->name);
382 		write_unlock(&proc_subdir_lock);
383 		goto out_free_inum;
384 	}
385 	dir->nlink++;
386 	write_unlock(&proc_subdir_lock);
387 
388 	return dp;
389 out_free_inum:
390 	proc_free_inum(dp->low_ino);
391 out_free_entry:
392 	pde_free(dp);
393 	return NULL;
394 }
395 
396 static struct proc_dir_entry *__proc_create(struct proc_dir_entry **parent,
397 					  const char *name,
398 					  umode_t mode,
399 					  nlink_t nlink)
400 {
401 	struct proc_dir_entry *ent = NULL;
402 	const char *fn;
403 	struct qstr qstr;
404 
405 	if (xlate_proc_name(name, parent, &fn) != 0)
406 		goto out;
407 	qstr.name = fn;
408 	qstr.len = strlen(fn);
409 	if (qstr.len == 0 || qstr.len >= 256) {
410 		WARN(1, "name len %u\n", qstr.len);
411 		return NULL;
412 	}
413 	if (qstr.len == 1 && fn[0] == '.') {
414 		WARN(1, "name '.'\n");
415 		return NULL;
416 	}
417 	if (qstr.len == 2 && fn[0] == '.' && fn[1] == '.') {
418 		WARN(1, "name '..'\n");
419 		return NULL;
420 	}
421 	if (*parent == &proc_root && name_to_int(&qstr) != ~0U) {
422 		WARN(1, "create '/proc/%s' by hand\n", qstr.name);
423 		return NULL;
424 	}
425 	if (is_empty_pde(*parent)) {
426 		WARN(1, "attempt to add to permanently empty directory");
427 		return NULL;
428 	}
429 
430 	ent = kmem_cache_zalloc(proc_dir_entry_cache, GFP_KERNEL);
431 	if (!ent)
432 		goto out;
433 
434 	if (qstr.len + 1 <= SIZEOF_PDE_INLINE_NAME) {
435 		ent->name = ent->inline_name;
436 	} else {
437 		ent->name = kmalloc(qstr.len + 1, GFP_KERNEL);
438 		if (!ent->name) {
439 			pde_free(ent);
440 			return NULL;
441 		}
442 	}
443 
444 	memcpy(ent->name, fn, qstr.len + 1);
445 	ent->namelen = qstr.len;
446 	ent->mode = mode;
447 	ent->nlink = nlink;
448 	ent->subdir = RB_ROOT;
449 	refcount_set(&ent->refcnt, 1);
450 	spin_lock_init(&ent->pde_unload_lock);
451 	INIT_LIST_HEAD(&ent->pde_openers);
452 	proc_set_user(ent, (*parent)->uid, (*parent)->gid);
453 
454 	/* Revalidate everything under /proc/${pid}/net */
455 	if ((*parent)->flags & PROC_ENTRY_FORCE_LOOKUP)
456 		pde_force_lookup(ent);
457 
458 out:
459 	return ent;
460 }
461 
462 struct proc_dir_entry *proc_symlink(const char *name,
463 		struct proc_dir_entry *parent, const char *dest)
464 {
465 	struct proc_dir_entry *ent;
466 
467 	ent = __proc_create(&parent, name,
468 			  (S_IFLNK | S_IRUGO | S_IWUGO | S_IXUGO),1);
469 
470 	if (ent) {
471 		ent->size = strlen(dest);
472 		ent->data = kmemdup(dest, ent->size + 1, GFP_KERNEL);
473 		if (ent->data) {
474 			ent->proc_iops = &proc_link_inode_operations;
475 			ent = proc_register(parent, ent);
476 		} else {
477 			pde_free(ent);
478 			ent = NULL;
479 		}
480 	}
481 	return ent;
482 }
483 EXPORT_SYMBOL(proc_symlink);
484 
485 struct proc_dir_entry *_proc_mkdir(const char *name, umode_t mode,
486 		struct proc_dir_entry *parent, void *data, bool force_lookup)
487 {
488 	struct proc_dir_entry *ent;
489 
490 	if (mode == 0)
491 		mode = S_IRUGO | S_IXUGO;
492 
493 	ent = __proc_create(&parent, name, S_IFDIR | mode, 2);
494 	if (ent) {
495 		ent->data = data;
496 		ent->proc_dir_ops = &proc_dir_operations;
497 		ent->proc_iops = &proc_dir_inode_operations;
498 		if (force_lookup) {
499 			pde_force_lookup(ent);
500 		}
501 		ent = proc_register(parent, ent);
502 	}
503 	return ent;
504 }
505 EXPORT_SYMBOL_GPL(_proc_mkdir);
506 
507 struct proc_dir_entry *proc_mkdir_data(const char *name, umode_t mode,
508 		struct proc_dir_entry *parent, void *data)
509 {
510 	return _proc_mkdir(name, mode, parent, data, false);
511 }
512 EXPORT_SYMBOL_GPL(proc_mkdir_data);
513 
514 struct proc_dir_entry *proc_mkdir_mode(const char *name, umode_t mode,
515 				       struct proc_dir_entry *parent)
516 {
517 	return proc_mkdir_data(name, mode, parent, NULL);
518 }
519 EXPORT_SYMBOL(proc_mkdir_mode);
520 
521 struct proc_dir_entry *proc_mkdir(const char *name,
522 		struct proc_dir_entry *parent)
523 {
524 	return proc_mkdir_data(name, 0, parent, NULL);
525 }
526 EXPORT_SYMBOL(proc_mkdir);
527 
528 struct proc_dir_entry *proc_create_mount_point(const char *name)
529 {
530 	umode_t mode = S_IFDIR | S_IRUGO | S_IXUGO;
531 	struct proc_dir_entry *ent, *parent = NULL;
532 
533 	ent = __proc_create(&parent, name, mode, 2);
534 	if (ent) {
535 		ent->data = NULL;
536 		ent->proc_dir_ops = NULL;
537 		ent->proc_iops = NULL;
538 		ent = proc_register(parent, ent);
539 	}
540 	return ent;
541 }
542 EXPORT_SYMBOL(proc_create_mount_point);
543 
544 struct proc_dir_entry *proc_create_reg(const char *name, umode_t mode,
545 		struct proc_dir_entry **parent, void *data)
546 {
547 	struct proc_dir_entry *p;
548 
549 	if ((mode & S_IFMT) == 0)
550 		mode |= S_IFREG;
551 	if ((mode & S_IALLUGO) == 0)
552 		mode |= S_IRUGO;
553 	if (WARN_ON_ONCE(!S_ISREG(mode)))
554 		return NULL;
555 
556 	p = __proc_create(parent, name, mode, 1);
557 	if (p) {
558 		p->proc_iops = &proc_file_inode_operations;
559 		p->data = data;
560 	}
561 	return p;
562 }
563 
564 static void pde_set_flags(struct proc_dir_entry *pde)
565 {
566 	if (pde->proc_ops->proc_flags & PROC_ENTRY_PERMANENT)
567 		pde->flags |= PROC_ENTRY_PERMANENT;
568 	if (pde->proc_ops->proc_read_iter)
569 		pde->flags |= PROC_ENTRY_proc_read_iter;
570 #ifdef CONFIG_COMPAT
571 	if (pde->proc_ops->proc_compat_ioctl)
572 		pde->flags |= PROC_ENTRY_proc_compat_ioctl;
573 #endif
574 }
575 
576 struct proc_dir_entry *proc_create_data(const char *name, umode_t mode,
577 		struct proc_dir_entry *parent,
578 		const struct proc_ops *proc_ops, void *data)
579 {
580 	struct proc_dir_entry *p;
581 
582 	p = proc_create_reg(name, mode, &parent, data);
583 	if (!p)
584 		return NULL;
585 	p->proc_ops = proc_ops;
586 	pde_set_flags(p);
587 	return proc_register(parent, p);
588 }
589 EXPORT_SYMBOL(proc_create_data);
590 
591 struct proc_dir_entry *proc_create(const char *name, umode_t mode,
592 				   struct proc_dir_entry *parent,
593 				   const struct proc_ops *proc_ops)
594 {
595 	return proc_create_data(name, mode, parent, proc_ops, NULL);
596 }
597 EXPORT_SYMBOL(proc_create);
598 
599 static int proc_seq_open(struct inode *inode, struct file *file)
600 {
601 	struct proc_dir_entry *de = PDE(inode);
602 
603 	if (de->state_size)
604 		return seq_open_private(file, de->seq_ops, de->state_size);
605 	return seq_open(file, de->seq_ops);
606 }
607 
608 static int proc_seq_release(struct inode *inode, struct file *file)
609 {
610 	struct proc_dir_entry *de = PDE(inode);
611 
612 	if (de->state_size)
613 		return seq_release_private(inode, file);
614 	return seq_release(inode, file);
615 }
616 
617 static const struct proc_ops proc_seq_ops = {
618 	/* not permanent -- can call into arbitrary seq_operations */
619 	.proc_open	= proc_seq_open,
620 	.proc_read_iter	= seq_read_iter,
621 	.proc_lseek	= seq_lseek,
622 	.proc_release	= proc_seq_release,
623 };
624 
625 struct proc_dir_entry *proc_create_seq_private(const char *name, umode_t mode,
626 		struct proc_dir_entry *parent, const struct seq_operations *ops,
627 		unsigned int state_size, void *data)
628 {
629 	struct proc_dir_entry *p;
630 
631 	p = proc_create_reg(name, mode, &parent, data);
632 	if (!p)
633 		return NULL;
634 	p->proc_ops = &proc_seq_ops;
635 	p->seq_ops = ops;
636 	p->state_size = state_size;
637 	pde_set_flags(p);
638 	return proc_register(parent, p);
639 }
640 EXPORT_SYMBOL(proc_create_seq_private);
641 
642 static int proc_single_open(struct inode *inode, struct file *file)
643 {
644 	struct proc_dir_entry *de = PDE(inode);
645 
646 	return single_open(file, de->single_show, de->data);
647 }
648 
649 static const struct proc_ops proc_single_ops = {
650 	/* not permanent -- can call into arbitrary ->single_show */
651 	.proc_open	= proc_single_open,
652 	.proc_read_iter = seq_read_iter,
653 	.proc_lseek	= seq_lseek,
654 	.proc_release	= single_release,
655 };
656 
657 struct proc_dir_entry *proc_create_single_data(const char *name, umode_t mode,
658 		struct proc_dir_entry *parent,
659 		int (*show)(struct seq_file *, void *), void *data)
660 {
661 	struct proc_dir_entry *p;
662 
663 	p = proc_create_reg(name, mode, &parent, data);
664 	if (!p)
665 		return NULL;
666 	p->proc_ops = &proc_single_ops;
667 	p->single_show = show;
668 	pde_set_flags(p);
669 	return proc_register(parent, p);
670 }
671 EXPORT_SYMBOL(proc_create_single_data);
672 
673 void proc_set_size(struct proc_dir_entry *de, loff_t size)
674 {
675 	de->size = size;
676 }
677 EXPORT_SYMBOL(proc_set_size);
678 
679 void proc_set_user(struct proc_dir_entry *de, kuid_t uid, kgid_t gid)
680 {
681 	de->uid = uid;
682 	de->gid = gid;
683 }
684 EXPORT_SYMBOL(proc_set_user);
685 
686 void pde_put(struct proc_dir_entry *pde)
687 {
688 	if (refcount_dec_and_test(&pde->refcnt)) {
689 		proc_free_inum(pde->low_ino);
690 		pde_free(pde);
691 	}
692 }
693 
694 /*
695  * Remove a /proc entry and free it if it's not currently in use.
696  */
697 void remove_proc_entry(const char *name, struct proc_dir_entry *parent)
698 {
699 	struct proc_dir_entry *de = NULL;
700 	const char *fn = name;
701 	unsigned int len;
702 
703 	write_lock(&proc_subdir_lock);
704 	if (__xlate_proc_name(name, &parent, &fn) != 0) {
705 		write_unlock(&proc_subdir_lock);
706 		return;
707 	}
708 	len = strlen(fn);
709 
710 	de = pde_subdir_find(parent, fn, len);
711 	if (de) {
712 		if (unlikely(pde_is_permanent(de))) {
713 			WARN(1, "removing permanent /proc entry '%s'", de->name);
714 			de = NULL;
715 		} else {
716 			rb_erase(&de->subdir_node, &parent->subdir);
717 			if (S_ISDIR(de->mode))
718 				parent->nlink--;
719 		}
720 	}
721 	write_unlock(&proc_subdir_lock);
722 	if (!de) {
723 		WARN(1, "name '%s'\n", name);
724 		return;
725 	}
726 
727 	proc_entry_rundown(de);
728 
729 	WARN(pde_subdir_first(de),
730 	     "%s: removing non-empty directory '%s/%s', leaking at least '%s'\n",
731 	     __func__, de->parent->name, de->name, pde_subdir_first(de)->name);
732 	pde_put(de);
733 }
734 EXPORT_SYMBOL(remove_proc_entry);
735 
736 int remove_proc_subtree(const char *name, struct proc_dir_entry *parent)
737 {
738 	struct proc_dir_entry *root = NULL, *de, *next;
739 	const char *fn = name;
740 	unsigned int len;
741 
742 	write_lock(&proc_subdir_lock);
743 	if (__xlate_proc_name(name, &parent, &fn) != 0) {
744 		write_unlock(&proc_subdir_lock);
745 		return -ENOENT;
746 	}
747 	len = strlen(fn);
748 
749 	root = pde_subdir_find(parent, fn, len);
750 	if (!root) {
751 		write_unlock(&proc_subdir_lock);
752 		return -ENOENT;
753 	}
754 	if (unlikely(pde_is_permanent(root))) {
755 		write_unlock(&proc_subdir_lock);
756 		WARN(1, "removing permanent /proc entry '%s/%s'",
757 			root->parent->name, root->name);
758 		return -EINVAL;
759 	}
760 	rb_erase(&root->subdir_node, &parent->subdir);
761 
762 	de = root;
763 	while (1) {
764 		next = pde_subdir_first(de);
765 		if (next) {
766 			if (unlikely(pde_is_permanent(next))) {
767 				write_unlock(&proc_subdir_lock);
768 				WARN(1, "removing permanent /proc entry '%s/%s'",
769 					next->parent->name, next->name);
770 				return -EINVAL;
771 			}
772 			rb_erase(&next->subdir_node, &de->subdir);
773 			de = next;
774 			continue;
775 		}
776 		next = de->parent;
777 		if (S_ISDIR(de->mode))
778 			next->nlink--;
779 		write_unlock(&proc_subdir_lock);
780 
781 		proc_entry_rundown(de);
782 		if (de == root)
783 			break;
784 		pde_put(de);
785 
786 		write_lock(&proc_subdir_lock);
787 		de = next;
788 	}
789 	pde_put(root);
790 	return 0;
791 }
792 EXPORT_SYMBOL(remove_proc_subtree);
793 
794 void *proc_get_parent_data(const struct inode *inode)
795 {
796 	struct proc_dir_entry *de = PDE(inode);
797 	return de->parent->data;
798 }
799 EXPORT_SYMBOL_GPL(proc_get_parent_data);
800 
801 void proc_remove(struct proc_dir_entry *de)
802 {
803 	if (de)
804 		remove_proc_subtree(de->name, de->parent);
805 }
806 EXPORT_SYMBOL(proc_remove);
807 
808 /*
809  * Pull a user buffer into memory and pass it to the file's write handler if
810  * one is supplied.  The ->write() method is permitted to modify the
811  * kernel-side buffer.
812  */
813 ssize_t proc_simple_write(struct file *f, const char __user *ubuf, size_t size,
814 			  loff_t *_pos)
815 {
816 	struct proc_dir_entry *pde = PDE(file_inode(f));
817 	char *buf;
818 	int ret;
819 
820 	if (!pde->write)
821 		return -EACCES;
822 	if (size == 0 || size > PAGE_SIZE - 1)
823 		return -EINVAL;
824 	buf = memdup_user_nul(ubuf, size);
825 	if (IS_ERR(buf))
826 		return PTR_ERR(buf);
827 	ret = pde->write(f, buf, size);
828 	kfree(buf);
829 	return ret == 0 ? size : ret;
830 }
831