1 /*
2 * kernfs.h - pseudo filesystem decoupled from vfs locking
3 *
4 * This file is released under the GPLv2.
5 */
6
7 #ifndef __LINUX_KERNFS_H
8 #define __LINUX_KERNFS_H
9
10 #include <linux/kernel.h>
11 #include <linux/err.h>
12 #include <linux/list.h>
13 #include <linux/mutex.h>
14 #include <linux/idr.h>
15 #include <linux/lockdep.h>
16 #include <linux/rbtree.h>
17 #include <linux/atomic.h>
18 #include <linux/wait.h>
19
20 struct file;
21 struct dentry;
22 struct iattr;
23 struct seq_file;
24 struct vm_area_struct;
25 struct super_block;
26 struct file_system_type;
27 struct poll_table_struct;
28
29 struct kernfs_open_node;
30 struct kernfs_iattrs;
31
/*
 * Node type constants.  Each type occupies its own bit; all three fall
 * inside the 0x000f range.
 */
enum kernfs_node_type {
	KERNFS_DIR	= 1 << 0,
	KERNFS_FILE	= 1 << 1,
	KERNFS_LINK	= 1 << 2,
};
37
/*
 * Bit masks splitting a flags word into the node-type bits (low nibble)
 * and everything above it.  The complement is parenthesized so that the
 * macro expands as a single operand wherever it is used.
 */
#define KERNFS_TYPE_MASK	0x000f
#define KERNFS_FLAG_MASK	(~KERNFS_TYPE_MASK)
40
/*
 * Per-node flag bits.  All values are >= 0x0010, i.e. above the low
 * nibble.  Bit 9 (0x0200) is not assigned here.
 */
enum kernfs_node_flag {
	KERNFS_ACTIVATED	= 1 << 4,
	KERNFS_NS		= 1 << 5,
	KERNFS_HAS_SEQ_SHOW	= 1 << 6,
	KERNFS_HAS_MMAP		= 1 << 7,
	KERNFS_LOCKDEP		= 1 << 8,
	KERNFS_SUICIDAL		= 1 << 10,
	KERNFS_SUICIDED		= 1 << 11,
	KERNFS_EMPTY_DIR	= 1 << 12,
	KERNFS_HAS_RELEASE	= 1 << 13,
};
52
/* @flags for kernfs_create_root() */
enum kernfs_root_flag {
	/*
	 * Nodes are created deactivated and invisible, and only become
	 * visible after an explicit kernfs_activate().  This lets a group
	 * of related nodes appear atomically once all of them have been
	 * created successfully.
	 */
	KERNFS_ROOT_CREATE_DEACTIVATED		= 1 << 0,

	/*
	 * For regular files, an opener with CAP_DAC_OVERRIDE normally
	 * succeeds in open(2) regardless of the RW permissions.  sysfs had
	 * an extra layer of enforcement: open(2) fails with -EACCES, even
	 * with CAP_DAC_OVERRIDE, if the permission bits grant no read or
	 * write access at all (none of S_IRUGO or S_IWUGO respectively) or
	 * if the respective operation isn't implemented.  This flag
	 * enables that behavior.
	 */
	KERNFS_ROOT_EXTRA_OPEN_PERM_CHECK	= 1 << 1,

	/*
	 * The filesystem supports exportfs operations, so userspace can
	 * use an fhandle to access nodes of the fs.
	 */
	KERNFS_ROOT_SUPPORT_EXPORTOP		= 1 << 2,
};
80
81 /* type-specific structures for kernfs_node union members */
82 struct kernfs_elem_dir {
83 unsigned long subdirs;
84 /* children rbtree starts here and goes through kn->rb */
85 struct rb_root children;
86
87 /*
88 * The kernfs hierarchy this directory belongs to. This fits
89 * better directly in kernfs_node but is here to save space.
90 */
91 struct kernfs_root *root;
92 };
93
/* symlink variant of the type-specific kernfs_node union members */
struct kernfs_elem_symlink {
	struct kernfs_node	*target_kn;
};
97
98 struct kernfs_elem_attr {
99 const struct kernfs_ops *ops;
100 struct kernfs_open_node *open;
101 loff_t size;
102 struct kernfs_node *notify_next; /* for kernfs_notify() */
103 };
104
105 /* represent a kernfs node */
106 union kernfs_node_id {
107 struct {
108 /*
109 * blktrace will export this struct as a simplified 'struct
110 * fid' (which is a big data struction), so userspace can use
111 * it to find kernfs node. The layout must match the first two
112 * fields of 'struct fid' exactly.
113 */
114 u32 ino;
115 u32 generation;
116 };
117 u64 id;
118 };
119
120 /*
121 * kernfs_node - the building block of kernfs hierarchy. Each and every
122 * kernfs node is represented by single kernfs_node. Most fields are
123 * private to kernfs and shouldn't be accessed directly by kernfs users.
124 *
125 * As long as s_count reference is held, the kernfs_node itself is
126 * accessible. Dereferencing elem or any other outer entity requires
127 * active reference.
128 */
129 struct kernfs_node {
130 atomic_t count;
131 atomic_t active;
132 #ifdef CONFIG_DEBUG_LOCK_ALLOC
133 struct lockdep_map dep_map;
134 #endif
135 /*
136 * Use kernfs_get_parent() and kernfs_name/path() instead of
137 * accessing the following two fields directly. If the node is
138 * never moved to a different parent, it is safe to access the
139 * parent directly.
140 */
141 struct kernfs_node *parent;
142 const char *name;
143
144 struct rb_node rb;
145
146 const void *ns; /* namespace tag */
147 unsigned int hash; /* ns + name hash */
148 union {
149 struct kernfs_elem_dir dir;
150 struct kernfs_elem_symlink symlink;
151 struct kernfs_elem_attr attr;
152 };
153
154 void *priv;
155
156 union kernfs_node_id id;
157 unsigned short flags;
158 umode_t mode;
159 struct kernfs_iattrs *iattr;
160 };
161
162 /*
163 * kernfs_syscall_ops may be specified on kernfs_create_root() to support
164 * syscalls. These optional callbacks are invoked on the matching syscalls
165 * and can perform any kernfs operations which don't necessarily have to be
166 * the exact operation requested. An active reference is held for each
167 * kernfs_node parameter.
168 */
169 struct kernfs_syscall_ops {
170 int (*remount_fs)(struct kernfs_root *root, int *flags, char *data);
171 int (*show_options)(struct seq_file *sf, struct kernfs_root *root);
172
173 int (*mkdir)(struct kernfs_node *parent, const char *name,
174 umode_t mode);
175 int (*rmdir)(struct kernfs_node *kn);
176 int (*rename)(struct kernfs_node *kn, struct kernfs_node *new_parent,
177 const char *new_name);
178 int (*show_path)(struct seq_file *sf, struct kernfs_node *kn,
179 struct kernfs_root *root);
180 };
181
182 struct kernfs_root {
183 /* published fields */
184 struct kernfs_node *kn;
185 unsigned int flags; /* KERNFS_ROOT_* flags */
186
187 /* private fields, do not use outside kernfs proper */
188 struct idr ino_idr;
189 u32 last_ino;
190 u32 next_generation;
191 struct kernfs_syscall_ops *syscall_ops;
192
193 /* list of kernfs_super_info of this root, protected by kernfs_mutex */
194 struct list_head supers;
195
196 wait_queue_head_t deactivate_waitq;
197 };
198
199 struct kernfs_open_file {
200 /* published fields */
201 struct kernfs_node *kn;
202 struct file *file;
203 struct seq_file *seq_file;
204 void *priv;
205
206 /* private fields, do not use outside kernfs proper */
207 struct mutex mutex;
208 struct mutex prealloc_mutex;
209 int event;
210 struct list_head list;
211 char *prealloc_buf;
212
213 size_t atomic_write_len;
214 bool mmapped:1;
215 bool released:1;
216 const struct vm_operations_struct *vm_ops;
217 };
218
219 struct kernfs_ops {
220 /*
221 * Optional open/release methods. Both are called with
222 * @of->seq_file populated.
223 */
224 int (*open)(struct kernfs_open_file *of);
225 void (*release)(struct kernfs_open_file *of);
226
227 /*
228 * Read is handled by either seq_file or raw_read().
229 *
230 * If seq_show() is present, seq_file path is active. Other seq
231 * operations are optional and if not implemented, the behavior is
232 * equivalent to single_open(). @sf->private points to the
233 * associated kernfs_open_file.
234 *
235 * read() is bounced through kernel buffer and a read larger than
236 * PAGE_SIZE results in partial operation of PAGE_SIZE.
237 */
238 int (*seq_show)(struct seq_file *sf, void *v);
239
240 void *(*seq_start)(struct seq_file *sf, loff_t *ppos);
241 void *(*seq_next)(struct seq_file *sf, void *v, loff_t *ppos);
242 void (*seq_stop)(struct seq_file *sf, void *v);
243
244 ssize_t (*read)(struct kernfs_open_file *of, char *buf, size_t bytes,
245 loff_t off);
246
247 /*
248 * write() is bounced through kernel buffer. If atomic_write_len
249 * is not set, a write larger than PAGE_SIZE results in partial
250 * operations of PAGE_SIZE chunks. If atomic_write_len is set,
251 * writes upto the specified size are executed atomically but
252 * larger ones are rejected with -E2BIG.
253 */
254 size_t atomic_write_len;
255 /*
256 * "prealloc" causes a buffer to be allocated at open for
257 * all read/write requests. As ->seq_show uses seq_read()
258 * which does its own allocation, it is incompatible with
259 * ->prealloc. Provide ->read and ->write with ->prealloc.
260 */
261 bool prealloc;
262 ssize_t (*write)(struct kernfs_open_file *of, char *buf, size_t bytes,
263 loff_t off);
264
265 unsigned int (*poll)(struct kernfs_open_file *of,
266 struct poll_table_struct *pt);
267
268 int (*mmap)(struct kernfs_open_file *of, struct vm_area_struct *vma);
269
270 #ifdef CONFIG_DEBUG_LOCK_ALLOC
271 struct lock_class_key lockdep_key;
272 #endif
273 };
274
275 #ifdef CONFIG_KERNFS
276
kernfs_type(struct kernfs_node * kn)277 static inline enum kernfs_node_type kernfs_type(struct kernfs_node *kn)
278 {
279 return kn->flags & KERNFS_TYPE_MASK;
280 }
281
282 /**
283 * kernfs_enable_ns - enable namespace under a directory
284 * @kn: directory of interest, should be empty
285 *
286 * This is to be called right after @kn is created to enable namespace
287 * under it. All children of @kn must have non-NULL namespace tags and
288 * only the ones which match the super_block's tag will be visible.
289 */
kernfs_enable_ns(struct kernfs_node * kn)290 static inline void kernfs_enable_ns(struct kernfs_node *kn)
291 {
292 WARN_ON_ONCE(kernfs_type(kn) != KERNFS_DIR);
293 WARN_ON_ONCE(!RB_EMPTY_ROOT(&kn->dir.children));
294 kn->flags |= KERNFS_NS;
295 }
296
297 /**
298 * kernfs_ns_enabled - test whether namespace is enabled
299 * @kn: the node to test
300 *
301 * Test whether namespace filtering is enabled for the children of @ns.
302 */
kernfs_ns_enabled(struct kernfs_node * kn)303 static inline bool kernfs_ns_enabled(struct kernfs_node *kn)
304 {
305 return kn->flags & KERNFS_NS;
306 }
307
308 int kernfs_name(struct kernfs_node *kn, char *buf, size_t buflen);
309 int kernfs_path_from_node(struct kernfs_node *root_kn, struct kernfs_node *kn,
310 char *buf, size_t buflen);
311 void pr_cont_kernfs_name(struct kernfs_node *kn);
312 void pr_cont_kernfs_path(struct kernfs_node *kn);
313 struct kernfs_node *kernfs_get_parent(struct kernfs_node *kn);
314 struct kernfs_node *kernfs_find_and_get_ns(struct kernfs_node *parent,
315 const char *name, const void *ns);
316 struct kernfs_node *kernfs_walk_and_get_ns(struct kernfs_node *parent,
317 const char *path, const void *ns);
318 void kernfs_get(struct kernfs_node *kn);
319 void kernfs_put(struct kernfs_node *kn);
320
321 struct kernfs_node *kernfs_node_from_dentry(struct dentry *dentry);
322 struct kernfs_root *kernfs_root_from_sb(struct super_block *sb);
323 struct inode *kernfs_get_inode(struct super_block *sb, struct kernfs_node *kn);
324
325 struct dentry *kernfs_node_dentry(struct kernfs_node *kn,
326 struct super_block *sb);
327 struct kernfs_root *kernfs_create_root(struct kernfs_syscall_ops *scops,
328 unsigned int flags, void *priv);
329 void kernfs_destroy_root(struct kernfs_root *root);
330
331 struct kernfs_node *kernfs_create_dir_ns(struct kernfs_node *parent,
332 const char *name, umode_t mode,
333 void *priv, const void *ns);
334 struct kernfs_node *kernfs_create_empty_dir(struct kernfs_node *parent,
335 const char *name);
336 struct kernfs_node *__kernfs_create_file(struct kernfs_node *parent,
337 const char *name,
338 umode_t mode, loff_t size,
339 const struct kernfs_ops *ops,
340 void *priv, const void *ns,
341 struct lock_class_key *key);
342 struct kernfs_node *kernfs_create_link(struct kernfs_node *parent,
343 const char *name,
344 struct kernfs_node *target);
345 void kernfs_activate(struct kernfs_node *kn);
346 void kernfs_remove(struct kernfs_node *kn);
347 void kernfs_break_active_protection(struct kernfs_node *kn);
348 void kernfs_unbreak_active_protection(struct kernfs_node *kn);
349 bool kernfs_remove_self(struct kernfs_node *kn);
350 int kernfs_remove_by_name_ns(struct kernfs_node *parent, const char *name,
351 const void *ns);
352 int kernfs_rename_ns(struct kernfs_node *kn, struct kernfs_node *new_parent,
353 const char *new_name, const void *new_ns);
354 int kernfs_setattr(struct kernfs_node *kn, const struct iattr *iattr);
355 unsigned int kernfs_generic_poll(struct kernfs_open_file *of,
356 struct poll_table_struct *pt);
357 void kernfs_notify(struct kernfs_node *kn);
358
359 const void *kernfs_super_ns(struct super_block *sb);
360 struct dentry *kernfs_mount_ns(struct file_system_type *fs_type, int flags,
361 struct kernfs_root *root, unsigned long magic,
362 bool *new_sb_created, const void *ns);
363 void kernfs_kill_sb(struct super_block *sb);
364 struct super_block *kernfs_pin_sb(struct kernfs_root *root, const void *ns);
365
366 void kernfs_init(void);
367
368 struct kernfs_node *kernfs_get_node_by_id(struct kernfs_root *root,
369 const union kernfs_node_id *id);
370 #else /* CONFIG_KERNFS */
371
kernfs_type(struct kernfs_node * kn)372 static inline enum kernfs_node_type kernfs_type(struct kernfs_node *kn)
373 { return 0; } /* whatever */
374
/* !CONFIG_KERNFS stub: does nothing. */
static inline void kernfs_enable_ns(struct kernfs_node *kn)
{
}
376
kernfs_ns_enabled(struct kernfs_node * kn)377 static inline bool kernfs_ns_enabled(struct kernfs_node *kn)
378 { return false; }
379
/* !CONFIG_KERNFS stub: @buf is left untouched; always returns -ENOSYS. */
static inline int kernfs_name(struct kernfs_node *kn, char *buf, size_t buflen)
{
	return -ENOSYS;
}
382
/* !CONFIG_KERNFS stub: @buf is left untouched; always returns -ENOSYS. */
static inline int
kernfs_path_from_node(struct kernfs_node *root_kn, struct kernfs_node *kn,
		      char *buf, size_t buflen)
{
	return -ENOSYS;
}
387
/* !CONFIG_KERNFS stub: does nothing. */
static inline void pr_cont_kernfs_name(struct kernfs_node *kn)
{
}
/* !CONFIG_KERNFS stub: does nothing. */
static inline void pr_cont_kernfs_path(struct kernfs_node *kn)
{
}
390
kernfs_get_parent(struct kernfs_node * kn)391 static inline struct kernfs_node *kernfs_get_parent(struct kernfs_node *kn)
392 { return NULL; }
393
394 static inline struct kernfs_node *
kernfs_find_and_get_ns(struct kernfs_node * parent,const char * name,const void * ns)395 kernfs_find_and_get_ns(struct kernfs_node *parent, const char *name,
396 const void *ns)
397 { return NULL; }
398 static inline struct kernfs_node *
kernfs_walk_and_get_ns(struct kernfs_node * parent,const char * path,const void * ns)399 kernfs_walk_and_get_ns(struct kernfs_node *parent, const char *path,
400 const void *ns)
401 { return NULL; }
402
/* !CONFIG_KERNFS stub: does nothing. */
static inline void kernfs_get(struct kernfs_node *kn)
{
}
/* !CONFIG_KERNFS stub: does nothing. */
static inline void kernfs_put(struct kernfs_node *kn)
{
}
405
kernfs_node_from_dentry(struct dentry * dentry)406 static inline struct kernfs_node *kernfs_node_from_dentry(struct dentry *dentry)
407 { return NULL; }
408
kernfs_root_from_sb(struct super_block * sb)409 static inline struct kernfs_root *kernfs_root_from_sb(struct super_block *sb)
410 { return NULL; }
411
412 static inline struct inode *
kernfs_get_inode(struct super_block * sb,struct kernfs_node * kn)413 kernfs_get_inode(struct super_block *sb, struct kernfs_node *kn)
414 { return NULL; }
415
416 static inline struct kernfs_root *
kernfs_create_root(struct kernfs_syscall_ops * scops,unsigned int flags,void * priv)417 kernfs_create_root(struct kernfs_syscall_ops *scops, unsigned int flags,
418 void *priv)
419 { return ERR_PTR(-ENOSYS); }
420
/* !CONFIG_KERNFS stub: does nothing. */
static inline void kernfs_destroy_root(struct kernfs_root *root)
{
}
422
423 static inline struct kernfs_node *
kernfs_create_dir_ns(struct kernfs_node * parent,const char * name,umode_t mode,void * priv,const void * ns)424 kernfs_create_dir_ns(struct kernfs_node *parent, const char *name,
425 umode_t mode, void *priv, const void *ns)
426 { return ERR_PTR(-ENOSYS); }
427
428 static inline struct kernfs_node *
__kernfs_create_file(struct kernfs_node * parent,const char * name,umode_t mode,loff_t size,const struct kernfs_ops * ops,void * priv,const void * ns,struct lock_class_key * key)429 __kernfs_create_file(struct kernfs_node *parent, const char *name,
430 umode_t mode, loff_t size, const struct kernfs_ops *ops,
431 void *priv, const void *ns, struct lock_class_key *key)
432 { return ERR_PTR(-ENOSYS); }
433
434 static inline struct kernfs_node *
kernfs_create_link(struct kernfs_node * parent,const char * name,struct kernfs_node * target)435 kernfs_create_link(struct kernfs_node *parent, const char *name,
436 struct kernfs_node *target)
437 { return ERR_PTR(-ENOSYS); }
438
/* !CONFIG_KERNFS stub: does nothing. */
static inline void kernfs_activate(struct kernfs_node *kn)
{
}
440
/* !CONFIG_KERNFS stub: does nothing. */
static inline void kernfs_remove(struct kernfs_node *kn)
{
}
442
kernfs_remove_self(struct kernfs_node * kn)443 static inline bool kernfs_remove_self(struct kernfs_node *kn)
444 { return false; }
445
kernfs_remove_by_name_ns(struct kernfs_node * kn,const char * name,const void * ns)446 static inline int kernfs_remove_by_name_ns(struct kernfs_node *kn,
447 const char *name, const void *ns)
448 { return -ENOSYS; }
449
kernfs_rename_ns(struct kernfs_node * kn,struct kernfs_node * new_parent,const char * new_name,const void * new_ns)450 static inline int kernfs_rename_ns(struct kernfs_node *kn,
451 struct kernfs_node *new_parent,
452 const char *new_name, const void *new_ns)
453 { return -ENOSYS; }
454
kernfs_setattr(struct kernfs_node * kn,const struct iattr * iattr)455 static inline int kernfs_setattr(struct kernfs_node *kn,
456 const struct iattr *iattr)
457 { return -ENOSYS; }
458
/* !CONFIG_KERNFS stub: does nothing. */
static inline void kernfs_notify(struct kernfs_node *kn)
{
}
460
kernfs_super_ns(struct super_block * sb)461 static inline const void *kernfs_super_ns(struct super_block *sb)
462 { return NULL; }
463
464 static inline struct dentry *
kernfs_mount_ns(struct file_system_type * fs_type,int flags,struct kernfs_root * root,unsigned long magic,bool * new_sb_created,const void * ns)465 kernfs_mount_ns(struct file_system_type *fs_type, int flags,
466 struct kernfs_root *root, unsigned long magic,
467 bool *new_sb_created, const void *ns)
468 { return ERR_PTR(-ENOSYS); }
469
/* !CONFIG_KERNFS stub: does nothing. */
static inline void kernfs_kill_sb(struct super_block *sb)
{
}
471
/* !CONFIG_KERNFS stub: does nothing. */
static inline void kernfs_init(void)
{
}
473
474 #endif /* CONFIG_KERNFS */
475
476 /**
477 * kernfs_path - build full path of a given node
478 * @kn: kernfs_node of interest
479 * @buf: buffer to copy @kn's name into
480 * @buflen: size of @buf
481 *
482 * Builds and returns the full path of @kn in @buf of @buflen bytes. The
483 * path is built from the end of @buf so the returned pointer usually
484 * doesn't match @buf. If @buf isn't long enough, @buf is nul terminated
485 * and %NULL is returned.
486 */
kernfs_path(struct kernfs_node * kn,char * buf,size_t buflen)487 static inline int kernfs_path(struct kernfs_node *kn, char *buf, size_t buflen)
488 {
489 return kernfs_path_from_node(kn, NULL, buf, buflen);
490 }
491
492 static inline struct kernfs_node *
kernfs_find_and_get(struct kernfs_node * kn,const char * name)493 kernfs_find_and_get(struct kernfs_node *kn, const char *name)
494 {
495 return kernfs_find_and_get_ns(kn, name, NULL);
496 }
497
498 static inline struct kernfs_node *
kernfs_walk_and_get(struct kernfs_node * kn,const char * path)499 kernfs_walk_and_get(struct kernfs_node *kn, const char *path)
500 {
501 return kernfs_walk_and_get_ns(kn, path, NULL);
502 }
503
504 static inline struct kernfs_node *
kernfs_create_dir(struct kernfs_node * parent,const char * name,umode_t mode,void * priv)505 kernfs_create_dir(struct kernfs_node *parent, const char *name, umode_t mode,
506 void *priv)
507 {
508 return kernfs_create_dir_ns(parent, name, mode, priv, NULL);
509 }
510
511 static inline struct kernfs_node *
kernfs_create_file_ns(struct kernfs_node * parent,const char * name,umode_t mode,loff_t size,const struct kernfs_ops * ops,void * priv,const void * ns)512 kernfs_create_file_ns(struct kernfs_node *parent, const char *name,
513 umode_t mode, loff_t size, const struct kernfs_ops *ops,
514 void *priv, const void *ns)
515 {
516 struct lock_class_key *key = NULL;
517
518 #ifdef CONFIG_DEBUG_LOCK_ALLOC
519 key = (struct lock_class_key *)&ops->lockdep_key;
520 #endif
521 return __kernfs_create_file(parent, name, mode, size, ops, priv, ns,
522 key);
523 }
524
525 static inline struct kernfs_node *
kernfs_create_file(struct kernfs_node * parent,const char * name,umode_t mode,loff_t size,const struct kernfs_ops * ops,void * priv)526 kernfs_create_file(struct kernfs_node *parent, const char *name, umode_t mode,
527 loff_t size, const struct kernfs_ops *ops, void *priv)
528 {
529 return kernfs_create_file_ns(parent, name, mode, size, ops, priv, NULL);
530 }
531
kernfs_remove_by_name(struct kernfs_node * parent,const char * name)532 static inline int kernfs_remove_by_name(struct kernfs_node *parent,
533 const char *name)
534 {
535 return kernfs_remove_by_name_ns(parent, name, NULL);
536 }
537
kernfs_rename(struct kernfs_node * kn,struct kernfs_node * new_parent,const char * new_name)538 static inline int kernfs_rename(struct kernfs_node *kn,
539 struct kernfs_node *new_parent,
540 const char *new_name)
541 {
542 return kernfs_rename_ns(kn, new_parent, new_name, NULL);
543 }
544
545 static inline struct dentry *
kernfs_mount(struct file_system_type * fs_type,int flags,struct kernfs_root * root,unsigned long magic,bool * new_sb_created)546 kernfs_mount(struct file_system_type *fs_type, int flags,
547 struct kernfs_root *root, unsigned long magic,
548 bool *new_sb_created)
549 {
550 return kernfs_mount_ns(fs_type, flags, root,
551 magic, new_sb_created, NULL);
552 }
553
554 #endif /* __LINUX_KERNFS_H */
555