]> git.proxmox.com Git - mirror_ubuntu-artful-kernel.git/blame - fs/proc/generic.c
Merge tag 'audit-pr-20170816' of git://git.kernel.org/pub/scm/linux/kernel/git/pcmoor...
[mirror_ubuntu-artful-kernel.git] / fs / proc / generic.c
CommitLineData
1da177e4
LT
1/*
2 * proc/fs/generic.c --- generic routines for the proc-fs
3 *
4 * This file contains generic proc-fs routines for handling
5 * directories and files.
6 *
7 * Copyright (C) 1991, 1992 Linus Torvalds.
8 * Copyright (C) 1997 Theodore Ts'o
9 */
10
11#include <linux/errno.h>
12#include <linux/time.h>
13#include <linux/proc_fs.h>
14#include <linux/stat.h>
1025774c 15#include <linux/mm.h>
1da177e4 16#include <linux/module.h>
5a0e3ad6 17#include <linux/slab.h>
87ebdc00 18#include <linux/printk.h>
1da177e4 19#include <linux/mount.h>
1da177e4
LT
20#include <linux/init.h>
21#include <linux/idr.h>
1da177e4 22#include <linux/bitops.h>
64a07bd8 23#include <linux/spinlock.h>
786d7e16 24#include <linux/completion.h>
7c0f6ba6 25#include <linux/uaccess.h>
1da177e4 26
fee781e6
AB
27#include "internal.h"
28
/*
 * Guards the ->subdir trees handled in this file: taken for reading by
 * the lookup/readdir paths and for writing when entries are inserted
 * or erased.
 */
static DEFINE_RWLOCK(proc_subdir_lock);
64a07bd8 30
312ec7e5 31static int proc_match(unsigned int len, const char *name, struct proc_dir_entry *de)
1da177e4 32{
710585d4
ND
33 if (len < de->namelen)
34 return -1;
35 if (len > de->namelen)
36 return 1;
37
38 return memcmp(name, de->name, len);
39}
40
41static struct proc_dir_entry *pde_subdir_first(struct proc_dir_entry *dir)
42{
2fc1e948
ND
43 return rb_entry_safe(rb_first(&dir->subdir), struct proc_dir_entry,
44 subdir_node);
710585d4
ND
45}
46
47static struct proc_dir_entry *pde_subdir_next(struct proc_dir_entry *dir)
48{
2fc1e948
ND
49 return rb_entry_safe(rb_next(&dir->subdir_node), struct proc_dir_entry,
50 subdir_node);
710585d4
ND
51}
52
53static struct proc_dir_entry *pde_subdir_find(struct proc_dir_entry *dir,
54 const char *name,
55 unsigned int len)
56{
57 struct rb_node *node = dir->subdir.rb_node;
58
59 while (node) {
4e4a7fb7
GT
60 struct proc_dir_entry *de = rb_entry(node,
61 struct proc_dir_entry,
62 subdir_node);
710585d4
ND
63 int result = proc_match(len, name, de);
64
65 if (result < 0)
66 node = node->rb_left;
67 else if (result > 0)
68 node = node->rb_right;
69 else
70 return de;
71 }
72 return NULL;
73}
74
75static bool pde_subdir_insert(struct proc_dir_entry *dir,
76 struct proc_dir_entry *de)
77{
78 struct rb_root *root = &dir->subdir;
79 struct rb_node **new = &root->rb_node, *parent = NULL;
80
81 /* Figure out where to put new node */
82 while (*new) {
4e4a7fb7
GT
83 struct proc_dir_entry *this = rb_entry(*new,
84 struct proc_dir_entry,
85 subdir_node);
710585d4
ND
86 int result = proc_match(de->namelen, de->name, this);
87
88 parent = *new;
89 if (result < 0)
90 new = &(*new)->rb_left;
91 else if (result > 0)
92 new = &(*new)->rb_right;
93 else
94 return false;
95 }
96
97 /* Add new node and rebalance tree. */
98 rb_link_node(&de->subdir_node, parent, new);
99 rb_insert_color(&de->subdir_node, root);
100 return true;
1da177e4
LT
101}
102
1da177e4
LT
103static int proc_notify_change(struct dentry *dentry, struct iattr *iattr)
104{
2b0143b5 105 struct inode *inode = d_inode(dentry);
1da177e4
LT
106 struct proc_dir_entry *de = PDE(inode);
107 int error;
108
31051c85 109 error = setattr_prepare(dentry, iattr);
1da177e4 110 if (error)
1025774c 111 return error;
1da177e4 112
1025774c
CH
113 setattr_copy(inode, iattr);
114 mark_inode_dirty(inode);
46f69557 115
cdf7e8dd 116 proc_set_user(de, inode->i_uid, inode->i_gid);
1da177e4 117 de->mode = inode->i_mode;
1025774c 118 return 0;
1da177e4
LT
119}
120
a528d35e
DH
121static int proc_getattr(const struct path *path, struct kstat *stat,
122 u32 request_mask, unsigned int query_flags)
2b579bee 123{
a528d35e 124 struct inode *inode = d_inode(path->dentry);
6bee55f9 125 struct proc_dir_entry *de = PDE(inode);
2b579bee 126 if (de && de->nlink)
bfe86848 127 set_nlink(inode, de->nlink);
2b579bee
MS
128
129 generic_fillattr(inode, stat);
130 return 0;
131}
132
c5ef1c42 133static const struct inode_operations proc_file_inode_operations = {
1da177e4
LT
134 .setattr = proc_notify_change,
135};
136
137/*
138 * This function parses a name such as "tty/driver/serial", and
139 * returns the struct proc_dir_entry for "/proc/tty/driver", and
140 * returns "serial" in residual.
141 */
e17a5765
AD
142static int __xlate_proc_name(const char *name, struct proc_dir_entry **ret,
143 const char **residual)
1da177e4
LT
144{
145 const char *cp = name, *next;
146 struct proc_dir_entry *de;
312ec7e5 147 unsigned int len;
1da177e4 148
7cee4e00
AD
149 de = *ret;
150 if (!de)
151 de = &proc_root;
152
1da177e4
LT
153 while (1) {
154 next = strchr(cp, '/');
155 if (!next)
156 break;
157
158 len = next - cp;
710585d4 159 de = pde_subdir_find(de, cp, len);
12bac0d9
AD
160 if (!de) {
161 WARN(1, "name '%s'\n", name);
e17a5765 162 return -ENOENT;
12bac0d9 163 }
1da177e4
LT
164 cp += len + 1;
165 }
166 *residual = cp;
167 *ret = de;
e17a5765
AD
168 return 0;
169}
170
171static int xlate_proc_name(const char *name, struct proc_dir_entry **ret,
172 const char **residual)
173{
174 int rv;
175
ecf1a3df 176 read_lock(&proc_subdir_lock);
e17a5765 177 rv = __xlate_proc_name(name, ret, residual);
ecf1a3df 178 read_unlock(&proc_subdir_lock);
e17a5765 179 return rv;
1da177e4
LT
180}
181
/* Lowest inode number handed out by proc_alloc_inum(). */
#define PROC_DYNAMIC_FIRST 0xF0000000U

/* ID allocator backing proc_alloc_inum() / proc_free_inum(). */
static DEFINE_IDA(proc_inum_ida);
1da177e4
LT
185
186/*
187 * Return an inode number between PROC_DYNAMIC_FIRST and
188 * 0xffffffff, or zero on failure.
189 */
33d6dce6 190int proc_alloc_inum(unsigned int *inum)
1da177e4 191{
cde1b693 192 int i;
1da177e4 193
cde1b693
HK
194 i = ida_simple_get(&proc_inum_ida, 0, UINT_MAX - PROC_DYNAMIC_FIRST + 1,
195 GFP_KERNEL);
196 if (i < 0)
197 return i;
1da177e4 198
cde1b693 199 *inum = PROC_DYNAMIC_FIRST + (unsigned int)i;
33d6dce6 200 return 0;
1da177e4
LT
201}
202
33d6dce6 203void proc_free_inum(unsigned int inum)
1da177e4 204{
cde1b693 205 ida_simple_remove(&proc_inum_ida, inum - PROC_DYNAMIC_FIRST);
1da177e4
LT
206}
207
1da177e4
LT
208/*
209 * Don't create negative dentries here, return -ENOENT by hand
210 * instead.
211 */
e9720acd
PE
212struct dentry *proc_lookup_de(struct proc_dir_entry *de, struct inode *dir,
213 struct dentry *dentry)
1da177e4 214{
d3d009cb 215 struct inode *inode;
1da177e4 216
ecf1a3df 217 read_lock(&proc_subdir_lock);
710585d4
ND
218 de = pde_subdir_find(de, dentry->d_name.name, dentry->d_name.len);
219 if (de) {
220 pde_get(de);
ecf1a3df 221 read_unlock(&proc_subdir_lock);
710585d4
ND
222 inode = proc_get_inode(dir->i_sb, de);
223 if (!inode)
224 return ERR_PTR(-ENOMEM);
225 d_set_d_op(dentry, &simple_dentry_operations);
226 d_add(dentry, inode);
227 return NULL;
1da177e4 228 }
ecf1a3df 229 read_unlock(&proc_subdir_lock);
d3d009cb 230 return ERR_PTR(-ENOENT);
1da177e4
LT
231}
232
/* ->lookup handler: search the proc entry that backs @dir. */
struct dentry *proc_lookup(struct inode *dir, struct dentry *dentry,
			   unsigned int flags)
{
	struct proc_dir_entry *pde = PDE(dir);

	return proc_lookup_de(pde, dir, dentry);
}
238
1da177e4
LT
239/*
240 * This returns non-zero if at EOF, so that the /proc
241 * root directory can use this and check if it should
242 * continue with the <pid> entries..
243 *
244 * Note that the VFS-layer doesn't care about the return
245 * value of the readdir() call, as long as it's non-negative
246 * for success..
247 */
f0c3b509
AV
248int proc_readdir_de(struct proc_dir_entry *de, struct file *file,
249 struct dir_context *ctx)
1da177e4 250{
1da177e4 251 int i;
f0c3b509
AV
252
253 if (!dir_emit_dots(file, ctx))
254 return 0;
255
ecf1a3df 256 read_lock(&proc_subdir_lock);
710585d4 257 de = pde_subdir_first(de);
f0c3b509
AV
258 i = ctx->pos - 2;
259 for (;;) {
260 if (!de) {
ecf1a3df 261 read_unlock(&proc_subdir_lock);
f0c3b509
AV
262 return 0;
263 }
264 if (!i)
265 break;
710585d4 266 de = pde_subdir_next(de);
f0c3b509 267 i--;
1da177e4 268 }
f0c3b509
AV
269
270 do {
271 struct proc_dir_entry *next;
272 pde_get(de);
ecf1a3df 273 read_unlock(&proc_subdir_lock);
f0c3b509
AV
274 if (!dir_emit(ctx, de->name, de->namelen,
275 de->low_ino, de->mode >> 12)) {
276 pde_put(de);
277 return 0;
278 }
ecf1a3df 279 read_lock(&proc_subdir_lock);
f0c3b509 280 ctx->pos++;
710585d4 281 next = pde_subdir_next(de);
f0c3b509
AV
282 pde_put(de);
283 de = next;
284 } while (de);
ecf1a3df 285 read_unlock(&proc_subdir_lock);
fd3930f7 286 return 1;
1da177e4
LT
287}
288
/* Directory iteration handler: list the proc entry behind @file's inode. */
int proc_readdir(struct file *file, struct dir_context *ctx)
{
	struct proc_dir_entry *pde = PDE(file_inode(file));

	return proc_readdir_de(pde, file, ctx);
}
295
1da177e4
LT
296/*
297 * These are the generic /proc directory operations. They
298 * use the in-memory "struct proc_dir_entry" tree to parse
299 * the /proc directory.
300 */
00977a59 301static const struct file_operations proc_dir_operations = {
b4df2b92 302 .llseek = generic_file_llseek,
1da177e4 303 .read = generic_read_dir,
f50752ea 304 .iterate_shared = proc_readdir,
1da177e4
LT
305};
306
307/*
308 * proc directories can do almost nothing..
309 */
c5ef1c42 310static const struct inode_operations proc_dir_inode_operations = {
1da177e4 311 .lookup = proc_lookup,
2b579bee 312 .getattr = proc_getattr,
1da177e4
LT
313 .setattr = proc_notify_change,
314};
315
316static int proc_register(struct proc_dir_entry * dir, struct proc_dir_entry * dp)
317{
33d6dce6 318 int ret;
710585d4 319
33d6dce6
EB
320 ret = proc_alloc_inum(&dp->low_ino);
321 if (ret)
322 return ret;
64a07bd8 323
ecf1a3df 324 write_lock(&proc_subdir_lock);
99fc06df 325 dp->parent = dir;
b208d54b 326 if (pde_subdir_insert(dir, dp) == false) {
710585d4
ND
327 WARN(1, "proc_dir_entry '%s/%s' already registered\n",
328 dir->name, dp->name);
ecf1a3df 329 write_unlock(&proc_subdir_lock);
b208d54b
DB
330 proc_free_inum(dp->low_ino);
331 return -EEXIST;
332 }
ecf1a3df 333 write_unlock(&proc_subdir_lock);
99fc06df 334
1da177e4
LT
335 return 0;
336}
337
2d3a4e36 338static struct proc_dir_entry *__proc_create(struct proc_dir_entry **parent,
1da177e4 339 const char *name,
d161a13f 340 umode_t mode,
1da177e4
LT
341 nlink_t nlink)
342{
343 struct proc_dir_entry *ent = NULL;
dbcdb504
AD
344 const char *fn;
345 struct qstr qstr;
1da177e4 346
7cee4e00 347 if (xlate_proc_name(name, parent, &fn) != 0)
1da177e4 348 goto out;
dbcdb504
AD
349 qstr.name = fn;
350 qstr.len = strlen(fn);
351 if (qstr.len == 0 || qstr.len >= 256) {
352 WARN(1, "name len %u\n", qstr.len);
353 return NULL;
354 }
355 if (*parent == &proc_root && name_to_int(&qstr) != ~0U) {
356 WARN(1, "create '/proc/%s' by hand\n", qstr.name);
357 return NULL;
358 }
eb6d38d5
EB
359 if (is_empty_pde(*parent)) {
360 WARN(1, "attempt to add to permanently empty directory");
361 return NULL;
362 }
1da177e4 363
dbcdb504 364 ent = kzalloc(sizeof(struct proc_dir_entry) + qstr.len + 1, GFP_KERNEL);
17baa2a2 365 if (!ent)
366 goto out;
1da177e4 367
dbcdb504
AD
368 memcpy(ent->name, fn, qstr.len + 1);
369 ent->namelen = qstr.len;
1da177e4
LT
370 ent->mode = mode;
371 ent->nlink = nlink;
710585d4 372 ent->subdir = RB_ROOT;
5a622f2d 373 atomic_set(&ent->count, 1);
786d7e16 374 spin_lock_init(&ent->pde_unload_lock);
881adb85 375 INIT_LIST_HEAD(&ent->pde_openers);
c110486f
DT
376 proc_set_user(ent, (*parent)->uid, (*parent)->gid);
377
17baa2a2 378out:
1da177e4
LT
379 return ent;
380}
381
382struct proc_dir_entry *proc_symlink(const char *name,
383 struct proc_dir_entry *parent, const char *dest)
384{
385 struct proc_dir_entry *ent;
386
2d3a4e36 387 ent = __proc_create(&parent, name,
1da177e4
LT
388 (S_IFLNK | S_IRUGO | S_IWUGO | S_IXUGO),1);
389
390 if (ent) {
391 ent->data = kmalloc((ent->size=strlen(dest))+1, GFP_KERNEL);
392 if (ent->data) {
393 strcpy((char*)ent->data,dest);
d443b9fd 394 ent->proc_iops = &proc_link_inode_operations;
1da177e4
LT
395 if (proc_register(parent, ent) < 0) {
396 kfree(ent->data);
397 kfree(ent);
398 ent = NULL;
399 }
400 } else {
401 kfree(ent);
402 ent = NULL;
403 }
404 }
405 return ent;
406}
587d4a17 407EXPORT_SYMBOL(proc_symlink);
1da177e4 408
270b5ac2
DH
409struct proc_dir_entry *proc_mkdir_data(const char *name, umode_t mode,
410 struct proc_dir_entry *parent, void *data)
1da177e4
LT
411{
412 struct proc_dir_entry *ent;
413
270b5ac2
DH
414 if (mode == 0)
415 mode = S_IRUGO | S_IXUGO;
416
2d3a4e36 417 ent = __proc_create(&parent, name, S_IFDIR | mode, 2);
1da177e4 418 if (ent) {
270b5ac2 419 ent->data = data;
d443b9fd
AV
420 ent->proc_fops = &proc_dir_operations;
421 ent->proc_iops = &proc_dir_inode_operations;
422 parent->nlink++;
1da177e4
LT
423 if (proc_register(parent, ent) < 0) {
424 kfree(ent);
d443b9fd 425 parent->nlink--;
1da177e4
LT
426 ent = NULL;
427 }
428 }
429 return ent;
430}
270b5ac2 431EXPORT_SYMBOL_GPL(proc_mkdir_data);
1da177e4 432
270b5ac2
DH
433struct proc_dir_entry *proc_mkdir_mode(const char *name, umode_t mode,
434 struct proc_dir_entry *parent)
78e92b99 435{
270b5ac2 436 return proc_mkdir_data(name, mode, parent, NULL);
78e92b99 437}
270b5ac2 438EXPORT_SYMBOL(proc_mkdir_mode);
78e92b99 439
1da177e4
LT
440struct proc_dir_entry *proc_mkdir(const char *name,
441 struct proc_dir_entry *parent)
442{
270b5ac2 443 return proc_mkdir_data(name, 0, parent, NULL);
1da177e4 444}
587d4a17 445EXPORT_SYMBOL(proc_mkdir);
1da177e4 446
eb6d38d5
EB
447struct proc_dir_entry *proc_create_mount_point(const char *name)
448{
449 umode_t mode = S_IFDIR | S_IRUGO | S_IXUGO;
450 struct proc_dir_entry *ent, *parent = NULL;
451
452 ent = __proc_create(&parent, name, mode, 2);
453 if (ent) {
454 ent->data = NULL;
455 ent->proc_fops = NULL;
456 ent->proc_iops = NULL;
d66bb160 457 parent->nlink++;
eb6d38d5
EB
458 if (proc_register(parent, ent) < 0) {
459 kfree(ent);
460 parent->nlink--;
461 ent = NULL;
462 }
463 }
464 return ent;
465}
f97df70b 466EXPORT_SYMBOL(proc_create_mount_point);
eb6d38d5 467
d161a13f 468struct proc_dir_entry *proc_create_data(const char *name, umode_t mode,
59b74351
DL
469 struct proc_dir_entry *parent,
470 const struct file_operations *proc_fops,
471 void *data)
2d3a4e36
AD
472{
473 struct proc_dir_entry *pde;
b6cdc731
AV
474 if ((mode & S_IFMT) == 0)
475 mode |= S_IFREG;
2d3a4e36 476
b6cdc731
AV
477 if (!S_ISREG(mode)) {
478 WARN_ON(1); /* use proc_mkdir() */
479 return NULL;
2d3a4e36
AD
480 }
481
d443b9fd
AV
482 BUG_ON(proc_fops == NULL);
483
b6cdc731
AV
484 if ((mode & S_IALLUGO) == 0)
485 mode |= S_IRUGO;
486 pde = __proc_create(&parent, name, mode, 1);
2d3a4e36
AD
487 if (!pde)
488 goto out;
489 pde->proc_fops = proc_fops;
59b74351 490 pde->data = data;
d443b9fd 491 pde->proc_iops = &proc_file_inode_operations;
2d3a4e36
AD
492 if (proc_register(parent, pde) < 0)
493 goto out_free;
494 return pde;
495out_free:
496 kfree(pde);
497out:
498 return NULL;
499}
587d4a17 500EXPORT_SYMBOL(proc_create_data);
271a15ea
DH
501
502void proc_set_size(struct proc_dir_entry *de, loff_t size)
503{
504 de->size = size;
505}
506EXPORT_SYMBOL(proc_set_size);
507
508void proc_set_user(struct proc_dir_entry *de, kuid_t uid, kgid_t gid)
509{
510 de->uid = uid;
511 de->gid = gid;
512}
513EXPORT_SYMBOL(proc_set_user);
2d3a4e36 514
135d5655 515static void free_proc_entry(struct proc_dir_entry *de)
1da177e4 516{
33d6dce6 517 proc_free_inum(de->low_ino);
1da177e4 518
fd2cbe48 519 if (S_ISLNK(de->mode))
1da177e4
LT
520 kfree(de->data);
521 kfree(de);
522}
523
135d5655
AD
524void pde_put(struct proc_dir_entry *pde)
525{
526 if (atomic_dec_and_test(&pde->count))
527 free_proc_entry(pde);
528}
529
8ce584c7
AV
530/*
531 * Remove a /proc entry and free it if it's not currently in use.
532 */
533void remove_proc_entry(const char *name, struct proc_dir_entry *parent)
534{
8ce584c7
AV
535 struct proc_dir_entry *de = NULL;
536 const char *fn = name;
537 unsigned int len;
538
ecf1a3df 539 write_lock(&proc_subdir_lock);
8ce584c7 540 if (__xlate_proc_name(name, &parent, &fn) != 0) {
ecf1a3df 541 write_unlock(&proc_subdir_lock);
8ce584c7
AV
542 return;
543 }
544 len = strlen(fn);
545
710585d4
ND
546 de = pde_subdir_find(parent, fn, len);
547 if (de)
548 rb_erase(&de->subdir_node, &parent->subdir);
ecf1a3df 549 write_unlock(&proc_subdir_lock);
8ce584c7
AV
550 if (!de) {
551 WARN(1, "name '%s'\n", name);
552 return;
553 }
554
866ad9a7 555 proc_entry_rundown(de);
881adb85 556
f649d6d3
AD
557 if (S_ISDIR(de->mode))
558 parent->nlink--;
559 de->nlink = 0;
710585d4
ND
560 WARN(pde_subdir_first(de),
561 "%s: removing non-empty directory '%s/%s', leaking at least '%s'\n",
562 __func__, de->parent->name, de->name, pde_subdir_first(de)->name);
135d5655 563 pde_put(de);
1da177e4 564}
587d4a17 565EXPORT_SYMBOL(remove_proc_entry);
8ce584c7
AV
566
567int remove_proc_subtree(const char *name, struct proc_dir_entry *parent)
568{
8ce584c7
AV
569 struct proc_dir_entry *root = NULL, *de, *next;
570 const char *fn = name;
571 unsigned int len;
572
ecf1a3df 573 write_lock(&proc_subdir_lock);
8ce584c7 574 if (__xlate_proc_name(name, &parent, &fn) != 0) {
ecf1a3df 575 write_unlock(&proc_subdir_lock);
8ce584c7
AV
576 return -ENOENT;
577 }
578 len = strlen(fn);
579
710585d4 580 root = pde_subdir_find(parent, fn, len);
8ce584c7 581 if (!root) {
ecf1a3df 582 write_unlock(&proc_subdir_lock);
8ce584c7
AV
583 return -ENOENT;
584 }
710585d4
ND
585 rb_erase(&root->subdir_node, &parent->subdir);
586
8ce584c7
AV
587 de = root;
588 while (1) {
710585d4 589 next = pde_subdir_first(de);
8ce584c7 590 if (next) {
710585d4 591 rb_erase(&next->subdir_node, &de->subdir);
8ce584c7
AV
592 de = next;
593 continue;
594 }
ecf1a3df 595 write_unlock(&proc_subdir_lock);
8ce584c7 596
866ad9a7 597 proc_entry_rundown(de);
8ce584c7
AV
598 next = de->parent;
599 if (S_ISDIR(de->mode))
600 next->nlink--;
601 de->nlink = 0;
602 if (de == root)
603 break;
604 pde_put(de);
605
ecf1a3df 606 write_lock(&proc_subdir_lock);
8ce584c7
AV
607 de = next;
608 }
609 pde_put(root);
610 return 0;
611}
612EXPORT_SYMBOL(remove_proc_subtree);
4a520d27
DH
613
614void *proc_get_parent_data(const struct inode *inode)
615{
616 struct proc_dir_entry *de = PDE(inode);
617 return de->parent->data;
618}
619EXPORT_SYMBOL_GPL(proc_get_parent_data);
a8ca16ea
DH
620
621void proc_remove(struct proc_dir_entry *de)
622{
623 if (de)
624 remove_proc_subtree(de->name, de->parent);
625}
626EXPORT_SYMBOL(proc_remove);
c30480b9
DH
627
/* Exported wrapper around __PDE_DATA(). */
void *PDE_DATA(const struct inode *inode)
{
	void *data = __PDE_DATA(inode);

	return data;
}
EXPORT_SYMBOL(PDE_DATA);