162306a36Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0 262306a36Sopenharmony_ci/* 362306a36Sopenharmony_ci * /proc/sys support 462306a36Sopenharmony_ci */ 562306a36Sopenharmony_ci#include <linux/init.h> 662306a36Sopenharmony_ci#include <linux/sysctl.h> 762306a36Sopenharmony_ci#include <linux/poll.h> 862306a36Sopenharmony_ci#include <linux/proc_fs.h> 962306a36Sopenharmony_ci#include <linux/printk.h> 1062306a36Sopenharmony_ci#include <linux/security.h> 1162306a36Sopenharmony_ci#include <linux/sched.h> 1262306a36Sopenharmony_ci#include <linux/cred.h> 1362306a36Sopenharmony_ci#include <linux/namei.h> 1462306a36Sopenharmony_ci#include <linux/mm.h> 1562306a36Sopenharmony_ci#include <linux/uio.h> 1662306a36Sopenharmony_ci#include <linux/module.h> 1762306a36Sopenharmony_ci#include <linux/bpf-cgroup.h> 1862306a36Sopenharmony_ci#include <linux/mount.h> 1962306a36Sopenharmony_ci#include <linux/kmemleak.h> 2062306a36Sopenharmony_ci#include "internal.h" 2162306a36Sopenharmony_ci 2262306a36Sopenharmony_ci#define list_for_each_table_entry(entry, header) \ 2362306a36Sopenharmony_ci entry = header->ctl_table; \ 2462306a36Sopenharmony_ci for (size_t i = 0 ; i < header->ctl_table_size && entry->procname; ++i, entry++) 2562306a36Sopenharmony_ci 2662306a36Sopenharmony_cistatic const struct dentry_operations proc_sys_dentry_operations; 2762306a36Sopenharmony_cistatic const struct file_operations proc_sys_file_operations; 2862306a36Sopenharmony_cistatic const struct inode_operations proc_sys_inode_operations; 2962306a36Sopenharmony_cistatic const struct file_operations proc_sys_dir_file_operations; 3062306a36Sopenharmony_cistatic const struct inode_operations proc_sys_dir_operations; 3162306a36Sopenharmony_ci 3262306a36Sopenharmony_ci/* Support for permanently empty directories */ 3362306a36Sopenharmony_cistatic struct ctl_table sysctl_mount_point[] = { 3462306a36Sopenharmony_ci {.type = SYSCTL_TABLE_TYPE_PERMANENTLY_EMPTY } 3562306a36Sopenharmony_ci}; 3662306a36Sopenharmony_ci 3762306a36Sopenharmony_ci/** 3862306a36Sopenharmony_ci * register_sysctl_mount_point() - registers a sysctl mount point 3962306a36Sopenharmony_ci * @path: path for the mount point 4062306a36Sopenharmony_ci * 4162306a36Sopenharmony_ci * Used to create a permanently empty directory to serve as mount point. 4262306a36Sopenharmony_ci * There are some subtle but important permission checks this allows in the 4362306a36Sopenharmony_ci * case of unprivileged mounts. 4462306a36Sopenharmony_ci */ 4562306a36Sopenharmony_cistruct ctl_table_header *register_sysctl_mount_point(const char *path) 4662306a36Sopenharmony_ci{ 4762306a36Sopenharmony_ci return register_sysctl(path, sysctl_mount_point); 4862306a36Sopenharmony_ci} 4962306a36Sopenharmony_ciEXPORT_SYMBOL(register_sysctl_mount_point); 5062306a36Sopenharmony_ci 5162306a36Sopenharmony_ci#define sysctl_is_perm_empty_ctl_table(tptr) \ 5262306a36Sopenharmony_ci (tptr[0].type == SYSCTL_TABLE_TYPE_PERMANENTLY_EMPTY) 5362306a36Sopenharmony_ci#define sysctl_is_perm_empty_ctl_header(hptr) \ 5462306a36Sopenharmony_ci (sysctl_is_perm_empty_ctl_table(hptr->ctl_table)) 5562306a36Sopenharmony_ci#define sysctl_set_perm_empty_ctl_header(hptr) \ 5662306a36Sopenharmony_ci (hptr->ctl_table[0].type = SYSCTL_TABLE_TYPE_PERMANENTLY_EMPTY) 5762306a36Sopenharmony_ci#define sysctl_clear_perm_empty_ctl_header(hptr) \ 5862306a36Sopenharmony_ci (hptr->ctl_table[0].type = SYSCTL_TABLE_TYPE_DEFAULT) 5962306a36Sopenharmony_ci 6062306a36Sopenharmony_civoid proc_sys_poll_notify(struct ctl_table_poll *poll) 6162306a36Sopenharmony_ci{ 6262306a36Sopenharmony_ci if (!poll) 6362306a36Sopenharmony_ci return; 6462306a36Sopenharmony_ci 6562306a36Sopenharmony_ci atomic_inc(&poll->event); 6662306a36Sopenharmony_ci wake_up_interruptible(&poll->wait); 6762306a36Sopenharmony_ci} 6862306a36Sopenharmony_ci 6962306a36Sopenharmony_cistatic struct ctl_table root_table[] = { 7062306a36Sopenharmony_ci { 7162306a36Sopenharmony_ci .procname = "", 7262306a36Sopenharmony_ci .mode = S_IFDIR|S_IRUGO|S_IXUGO, 7362306a36Sopenharmony_ci }, 7462306a36Sopenharmony_ci { } 7562306a36Sopenharmony_ci}; 7662306a36Sopenharmony_cistatic struct ctl_table_root sysctl_table_root = { 7762306a36Sopenharmony_ci .default_set.dir.header = { 7862306a36Sopenharmony_ci {{.count = 1, 7962306a36Sopenharmony_ci .nreg = 1, 8062306a36Sopenharmony_ci .ctl_table = root_table }}, 8162306a36Sopenharmony_ci .ctl_table_arg = root_table, 8262306a36Sopenharmony_ci .root = &sysctl_table_root, 8362306a36Sopenharmony_ci .set = &sysctl_table_root.default_set, 8462306a36Sopenharmony_ci }, 8562306a36Sopenharmony_ci}; 8662306a36Sopenharmony_ci 8762306a36Sopenharmony_cistatic DEFINE_SPINLOCK(sysctl_lock); 8862306a36Sopenharmony_ci 8962306a36Sopenharmony_cistatic void drop_sysctl_table(struct ctl_table_header *header); 9062306a36Sopenharmony_cistatic int sysctl_follow_link(struct ctl_table_header **phead, 9162306a36Sopenharmony_ci struct ctl_table **pentry); 9262306a36Sopenharmony_cistatic int insert_links(struct ctl_table_header *head); 9362306a36Sopenharmony_cistatic void put_links(struct ctl_table_header *header); 9462306a36Sopenharmony_ci 9562306a36Sopenharmony_cistatic void sysctl_print_dir(struct ctl_dir *dir) 9662306a36Sopenharmony_ci{ 9762306a36Sopenharmony_ci if (dir->header.parent) 9862306a36Sopenharmony_ci sysctl_print_dir(dir->header.parent); 9962306a36Sopenharmony_ci pr_cont("%s/", dir->header.ctl_table[0].procname); 10062306a36Sopenharmony_ci} 10162306a36Sopenharmony_ci 10262306a36Sopenharmony_cistatic int namecmp(const char *name1, int len1, const char *name2, int len2) 10362306a36Sopenharmony_ci{ 10462306a36Sopenharmony_ci int cmp; 10562306a36Sopenharmony_ci 10662306a36Sopenharmony_ci cmp = memcmp(name1, name2, min(len1, len2)); 10762306a36Sopenharmony_ci if (cmp == 0) 10862306a36Sopenharmony_ci cmp = len1 - len2; 10962306a36Sopenharmony_ci return cmp; 11062306a36Sopenharmony_ci} 11162306a36Sopenharmony_ci 11262306a36Sopenharmony_ci/* Called under sysctl_lock */ 11362306a36Sopenharmony_cistatic struct ctl_table *find_entry(struct ctl_table_header **phead, 11462306a36Sopenharmony_ci struct ctl_dir *dir, const char *name, int namelen) 11562306a36Sopenharmony_ci{ 11662306a36Sopenharmony_ci struct ctl_table_header *head; 11762306a36Sopenharmony_ci struct ctl_table *entry; 11862306a36Sopenharmony_ci struct rb_node *node = dir->root.rb_node; 11962306a36Sopenharmony_ci 12062306a36Sopenharmony_ci while (node) 12162306a36Sopenharmony_ci { 12262306a36Sopenharmony_ci struct ctl_node *ctl_node; 12362306a36Sopenharmony_ci const char *procname; 12462306a36Sopenharmony_ci int cmp; 12562306a36Sopenharmony_ci 12662306a36Sopenharmony_ci ctl_node = rb_entry(node, struct ctl_node, node); 12762306a36Sopenharmony_ci head = ctl_node->header; 12862306a36Sopenharmony_ci entry = &head->ctl_table[ctl_node - head->node]; 12962306a36Sopenharmony_ci procname = entry->procname; 13062306a36Sopenharmony_ci 13162306a36Sopenharmony_ci cmp = namecmp(name, namelen, procname, strlen(procname)); 13262306a36Sopenharmony_ci if (cmp < 0) 13362306a36Sopenharmony_ci node = node->rb_left; 13462306a36Sopenharmony_ci else if (cmp > 0) 13562306a36Sopenharmony_ci node = node->rb_right; 13662306a36Sopenharmony_ci else { 13762306a36Sopenharmony_ci *phead = head; 13862306a36Sopenharmony_ci return entry; 13962306a36Sopenharmony_ci } 14062306a36Sopenharmony_ci } 14162306a36Sopenharmony_ci return NULL; 14262306a36Sopenharmony_ci} 14362306a36Sopenharmony_ci 14462306a36Sopenharmony_cistatic int insert_entry(struct ctl_table_header *head, struct ctl_table *entry) 14562306a36Sopenharmony_ci{ 14662306a36Sopenharmony_ci struct rb_node *node = &head->node[entry - head->ctl_table].node; 14762306a36Sopenharmony_ci struct rb_node **p = &head->parent->root.rb_node; 14862306a36Sopenharmony_ci struct rb_node *parent = NULL; 14962306a36Sopenharmony_ci const char *name = entry->procname; 15062306a36Sopenharmony_ci int namelen = strlen(name); 15162306a36Sopenharmony_ci 15262306a36Sopenharmony_ci while (*p) { 15362306a36Sopenharmony_ci struct ctl_table_header *parent_head; 15462306a36Sopenharmony_ci struct ctl_table *parent_entry; 15562306a36Sopenharmony_ci struct ctl_node *parent_node; 15662306a36Sopenharmony_ci const char *parent_name; 15762306a36Sopenharmony_ci int cmp; 15862306a36Sopenharmony_ci 15962306a36Sopenharmony_ci parent = *p; 16062306a36Sopenharmony_ci parent_node = rb_entry(parent, struct ctl_node, node); 16162306a36Sopenharmony_ci parent_head = parent_node->header; 16262306a36Sopenharmony_ci parent_entry = &parent_head->ctl_table[parent_node - parent_head->node]; 16362306a36Sopenharmony_ci parent_name = parent_entry->procname; 16462306a36Sopenharmony_ci 16562306a36Sopenharmony_ci cmp = namecmp(name, namelen, parent_name, strlen(parent_name)); 16662306a36Sopenharmony_ci if (cmp < 0) 16762306a36Sopenharmony_ci p = &(*p)->rb_left; 16862306a36Sopenharmony_ci else if (cmp > 0) 16962306a36Sopenharmony_ci p = &(*p)->rb_right; 17062306a36Sopenharmony_ci else { 17162306a36Sopenharmony_ci pr_err("sysctl duplicate entry: "); 17262306a36Sopenharmony_ci sysctl_print_dir(head->parent); 17362306a36Sopenharmony_ci pr_cont("%s\n", entry->procname); 17462306a36Sopenharmony_ci return -EEXIST; 17562306a36Sopenharmony_ci } 17662306a36Sopenharmony_ci } 17762306a36Sopenharmony_ci 17862306a36Sopenharmony_ci rb_link_node(node, parent, p); 17962306a36Sopenharmony_ci rb_insert_color(node, &head->parent->root); 18062306a36Sopenharmony_ci return 0; 18162306a36Sopenharmony_ci} 18262306a36Sopenharmony_ci 18362306a36Sopenharmony_cistatic void erase_entry(struct ctl_table_header *head, struct ctl_table *entry) 18462306a36Sopenharmony_ci{ 18562306a36Sopenharmony_ci struct rb_node *node = &head->node[entry - head->ctl_table].node; 18662306a36Sopenharmony_ci 18762306a36Sopenharmony_ci rb_erase(node, &head->parent->root); 18862306a36Sopenharmony_ci} 18962306a36Sopenharmony_ci 19062306a36Sopenharmony_cistatic void init_header(struct ctl_table_header *head, 19162306a36Sopenharmony_ci struct ctl_table_root *root, struct ctl_table_set *set, 19262306a36Sopenharmony_ci struct ctl_node *node, struct ctl_table *table, size_t table_size) 19362306a36Sopenharmony_ci{ 19462306a36Sopenharmony_ci head->ctl_table = table; 19562306a36Sopenharmony_ci head->ctl_table_size = table_size; 19662306a36Sopenharmony_ci head->ctl_table_arg = table; 19762306a36Sopenharmony_ci head->used = 0; 19862306a36Sopenharmony_ci head->count = 1; 19962306a36Sopenharmony_ci head->nreg = 1; 20062306a36Sopenharmony_ci head->unregistering = NULL; 20162306a36Sopenharmony_ci head->root = root; 20262306a36Sopenharmony_ci head->set = set; 20362306a36Sopenharmony_ci head->parent = NULL; 20462306a36Sopenharmony_ci head->node = node; 20562306a36Sopenharmony_ci INIT_HLIST_HEAD(&head->inodes); 20662306a36Sopenharmony_ci if (node) { 20762306a36Sopenharmony_ci struct ctl_table *entry; 20862306a36Sopenharmony_ci 20962306a36Sopenharmony_ci list_for_each_table_entry(entry, head) { 21062306a36Sopenharmony_ci node->header = head; 21162306a36Sopenharmony_ci node++; 21262306a36Sopenharmony_ci } 21362306a36Sopenharmony_ci } 21462306a36Sopenharmony_ci} 21562306a36Sopenharmony_ci 21662306a36Sopenharmony_cistatic void erase_header(struct ctl_table_header *head) 21762306a36Sopenharmony_ci{ 21862306a36Sopenharmony_ci struct ctl_table *entry; 21962306a36Sopenharmony_ci 22062306a36Sopenharmony_ci list_for_each_table_entry(entry, head) 22162306a36Sopenharmony_ci erase_entry(head, entry); 22262306a36Sopenharmony_ci} 22362306a36Sopenharmony_ci 22462306a36Sopenharmony_cistatic int insert_header(struct ctl_dir *dir, struct ctl_table_header *header) 22562306a36Sopenharmony_ci{ 22662306a36Sopenharmony_ci struct ctl_table *entry; 22762306a36Sopenharmony_ci struct ctl_table_header *dir_h = &dir->header; 22862306a36Sopenharmony_ci int err; 22962306a36Sopenharmony_ci 23062306a36Sopenharmony_ci 23162306a36Sopenharmony_ci /* Is this a permanently empty directory? */ 23262306a36Sopenharmony_ci if (sysctl_is_perm_empty_ctl_header(dir_h)) 23362306a36Sopenharmony_ci return -EROFS; 23462306a36Sopenharmony_ci 23562306a36Sopenharmony_ci /* Am I creating a permanently empty directory? */ 23662306a36Sopenharmony_ci if (header->ctl_table_size > 0 && 23762306a36Sopenharmony_ci sysctl_is_perm_empty_ctl_table(header->ctl_table)) { 23862306a36Sopenharmony_ci if (!RB_EMPTY_ROOT(&dir->root)) 23962306a36Sopenharmony_ci return -EINVAL; 24062306a36Sopenharmony_ci sysctl_set_perm_empty_ctl_header(dir_h); 24162306a36Sopenharmony_ci } 24262306a36Sopenharmony_ci 24362306a36Sopenharmony_ci dir_h->nreg++; 24462306a36Sopenharmony_ci header->parent = dir; 24562306a36Sopenharmony_ci err = insert_links(header); 24662306a36Sopenharmony_ci if (err) 24762306a36Sopenharmony_ci goto fail_links; 24862306a36Sopenharmony_ci list_for_each_table_entry(entry, header) { 24962306a36Sopenharmony_ci err = insert_entry(header, entry); 25062306a36Sopenharmony_ci if (err) 25162306a36Sopenharmony_ci goto fail; 25262306a36Sopenharmony_ci } 25362306a36Sopenharmony_ci return 0; 25462306a36Sopenharmony_cifail: 25562306a36Sopenharmony_ci erase_header(header); 25662306a36Sopenharmony_ci put_links(header); 25762306a36Sopenharmony_cifail_links: 25862306a36Sopenharmony_ci if (header->ctl_table == sysctl_mount_point) 25962306a36Sopenharmony_ci sysctl_clear_perm_empty_ctl_header(dir_h); 26062306a36Sopenharmony_ci header->parent = NULL; 26162306a36Sopenharmony_ci drop_sysctl_table(dir_h); 26262306a36Sopenharmony_ci return err; 26362306a36Sopenharmony_ci} 26462306a36Sopenharmony_ci 26562306a36Sopenharmony_ci/* called under sysctl_lock */ 26662306a36Sopenharmony_cistatic int use_table(struct ctl_table_header *p) 26762306a36Sopenharmony_ci{ 26862306a36Sopenharmony_ci if (unlikely(p->unregistering)) 26962306a36Sopenharmony_ci return 0; 27062306a36Sopenharmony_ci p->used++; 27162306a36Sopenharmony_ci return 1; 27262306a36Sopenharmony_ci} 27362306a36Sopenharmony_ci 27462306a36Sopenharmony_ci/* called under sysctl_lock */ 27562306a36Sopenharmony_cistatic void unuse_table(struct ctl_table_header *p) 27662306a36Sopenharmony_ci{ 27762306a36Sopenharmony_ci if (!--p->used) 27862306a36Sopenharmony_ci if (unlikely(p->unregistering)) 27962306a36Sopenharmony_ci complete(p->unregistering); 28062306a36Sopenharmony_ci} 28162306a36Sopenharmony_ci 28262306a36Sopenharmony_cistatic void proc_sys_invalidate_dcache(struct ctl_table_header *head) 28362306a36Sopenharmony_ci{ 28462306a36Sopenharmony_ci proc_invalidate_siblings_dcache(&head->inodes, &sysctl_lock); 28562306a36Sopenharmony_ci} 28662306a36Sopenharmony_ci 28762306a36Sopenharmony_ci/* called under sysctl_lock, will reacquire if has to wait */ 28862306a36Sopenharmony_cistatic void start_unregistering(struct ctl_table_header *p) 28962306a36Sopenharmony_ci{ 29062306a36Sopenharmony_ci /* 29162306a36Sopenharmony_ci * if p->used is 0, nobody will ever touch that entry again; 29262306a36Sopenharmony_ci * we'll eliminate all paths to it before dropping sysctl_lock 29362306a36Sopenharmony_ci */ 29462306a36Sopenharmony_ci if (unlikely(p->used)) { 29562306a36Sopenharmony_ci struct completion wait; 29662306a36Sopenharmony_ci init_completion(&wait); 29762306a36Sopenharmony_ci p->unregistering = &wait; 29862306a36Sopenharmony_ci spin_unlock(&sysctl_lock); 29962306a36Sopenharmony_ci wait_for_completion(&wait); 30062306a36Sopenharmony_ci } else { 30162306a36Sopenharmony_ci /* anything non-NULL; we'll never dereference it */ 30262306a36Sopenharmony_ci p->unregistering = ERR_PTR(-EINVAL); 30362306a36Sopenharmony_ci spin_unlock(&sysctl_lock); 30462306a36Sopenharmony_ci } 30562306a36Sopenharmony_ci /* 30662306a36Sopenharmony_ci * Invalidate dentries for unregistered sysctls: namespaced sysctls 30762306a36Sopenharmony_ci * can have duplicate names and contaminate dcache very badly. 30862306a36Sopenharmony_ci */ 30962306a36Sopenharmony_ci proc_sys_invalidate_dcache(p); 31062306a36Sopenharmony_ci /* 31162306a36Sopenharmony_ci * do not remove from the list until nobody holds it; walking the 31262306a36Sopenharmony_ci * list in do_sysctl() relies on that. 31362306a36Sopenharmony_ci */ 31462306a36Sopenharmony_ci spin_lock(&sysctl_lock); 31562306a36Sopenharmony_ci erase_header(p); 31662306a36Sopenharmony_ci} 31762306a36Sopenharmony_ci 31862306a36Sopenharmony_cistatic struct ctl_table_header *sysctl_head_grab(struct ctl_table_header *head) 31962306a36Sopenharmony_ci{ 32062306a36Sopenharmony_ci BUG_ON(!head); 32162306a36Sopenharmony_ci spin_lock(&sysctl_lock); 32262306a36Sopenharmony_ci if (!use_table(head)) 32362306a36Sopenharmony_ci head = ERR_PTR(-ENOENT); 32462306a36Sopenharmony_ci spin_unlock(&sysctl_lock); 32562306a36Sopenharmony_ci return head; 32662306a36Sopenharmony_ci} 32762306a36Sopenharmony_ci 32862306a36Sopenharmony_cistatic void sysctl_head_finish(struct ctl_table_header *head) 32962306a36Sopenharmony_ci{ 33062306a36Sopenharmony_ci if (!head) 33162306a36Sopenharmony_ci return; 33262306a36Sopenharmony_ci spin_lock(&sysctl_lock); 33362306a36Sopenharmony_ci unuse_table(head); 33462306a36Sopenharmony_ci spin_unlock(&sysctl_lock); 33562306a36Sopenharmony_ci} 33662306a36Sopenharmony_ci 33762306a36Sopenharmony_cistatic struct ctl_table_set * 33862306a36Sopenharmony_cilookup_header_set(struct ctl_table_root *root) 33962306a36Sopenharmony_ci{ 34062306a36Sopenharmony_ci struct ctl_table_set *set = &root->default_set; 34162306a36Sopenharmony_ci if (root->lookup) 34262306a36Sopenharmony_ci set = root->lookup(root); 34362306a36Sopenharmony_ci return set; 34462306a36Sopenharmony_ci} 34562306a36Sopenharmony_ci 34662306a36Sopenharmony_cistatic struct ctl_table *lookup_entry(struct ctl_table_header **phead, 34762306a36Sopenharmony_ci struct ctl_dir *dir, 34862306a36Sopenharmony_ci const char *name, int namelen) 34962306a36Sopenharmony_ci{ 35062306a36Sopenharmony_ci struct ctl_table_header *head; 35162306a36Sopenharmony_ci struct ctl_table *entry; 35262306a36Sopenharmony_ci 35362306a36Sopenharmony_ci spin_lock(&sysctl_lock); 35462306a36Sopenharmony_ci entry = find_entry(&head, dir, name, namelen); 35562306a36Sopenharmony_ci if (entry && use_table(head)) 35662306a36Sopenharmony_ci *phead = head; 35762306a36Sopenharmony_ci else 35862306a36Sopenharmony_ci entry = NULL; 35962306a36Sopenharmony_ci spin_unlock(&sysctl_lock); 36062306a36Sopenharmony_ci return entry; 36162306a36Sopenharmony_ci} 36262306a36Sopenharmony_ci 36362306a36Sopenharmony_cistatic struct ctl_node *first_usable_entry(struct rb_node *node) 36462306a36Sopenharmony_ci{ 36562306a36Sopenharmony_ci struct ctl_node *ctl_node; 36662306a36Sopenharmony_ci 36762306a36Sopenharmony_ci for (;node; node = rb_next(node)) { 36862306a36Sopenharmony_ci ctl_node = rb_entry(node, struct ctl_node, node); 36962306a36Sopenharmony_ci if (use_table(ctl_node->header)) 37062306a36Sopenharmony_ci return ctl_node; 37162306a36Sopenharmony_ci } 37262306a36Sopenharmony_ci return NULL; 37362306a36Sopenharmony_ci} 37462306a36Sopenharmony_ci 37562306a36Sopenharmony_cistatic void first_entry(struct ctl_dir *dir, 37662306a36Sopenharmony_ci struct ctl_table_header **phead, struct ctl_table **pentry) 37762306a36Sopenharmony_ci{ 37862306a36Sopenharmony_ci struct ctl_table_header *head = NULL; 37962306a36Sopenharmony_ci struct ctl_table *entry = NULL; 38062306a36Sopenharmony_ci struct ctl_node *ctl_node; 38162306a36Sopenharmony_ci 38262306a36Sopenharmony_ci spin_lock(&sysctl_lock); 38362306a36Sopenharmony_ci ctl_node = first_usable_entry(rb_first(&dir->root)); 38462306a36Sopenharmony_ci spin_unlock(&sysctl_lock); 38562306a36Sopenharmony_ci if (ctl_node) { 38662306a36Sopenharmony_ci head = ctl_node->header; 38762306a36Sopenharmony_ci entry = &head->ctl_table[ctl_node - head->node]; 38862306a36Sopenharmony_ci } 38962306a36Sopenharmony_ci *phead = head; 39062306a36Sopenharmony_ci *pentry = entry; 39162306a36Sopenharmony_ci} 39262306a36Sopenharmony_ci 39362306a36Sopenharmony_cistatic void next_entry(struct ctl_table_header **phead, struct ctl_table **pentry) 39462306a36Sopenharmony_ci{ 39562306a36Sopenharmony_ci struct ctl_table_header *head = *phead; 39662306a36Sopenharmony_ci struct ctl_table *entry = *pentry; 39762306a36Sopenharmony_ci struct ctl_node *ctl_node = &head->node[entry - head->ctl_table]; 39862306a36Sopenharmony_ci 39962306a36Sopenharmony_ci spin_lock(&sysctl_lock); 40062306a36Sopenharmony_ci unuse_table(head); 40162306a36Sopenharmony_ci 40262306a36Sopenharmony_ci ctl_node = first_usable_entry(rb_next(&ctl_node->node)); 40362306a36Sopenharmony_ci spin_unlock(&sysctl_lock); 40462306a36Sopenharmony_ci head = NULL; 40562306a36Sopenharmony_ci if (ctl_node) { 40662306a36Sopenharmony_ci head = ctl_node->header; 40762306a36Sopenharmony_ci entry = &head->ctl_table[ctl_node - head->node]; 40862306a36Sopenharmony_ci } 40962306a36Sopenharmony_ci *phead = head; 41062306a36Sopenharmony_ci *pentry = entry; 41162306a36Sopenharmony_ci} 41262306a36Sopenharmony_ci 41362306a36Sopenharmony_ci/* 41462306a36Sopenharmony_ci * sysctl_perm does NOT grant the superuser all rights automatically, because 41562306a36Sopenharmony_ci * some sysctl variables are readonly even to root. 41662306a36Sopenharmony_ci */ 41762306a36Sopenharmony_ci 41862306a36Sopenharmony_cistatic int test_perm(int mode, int op) 41962306a36Sopenharmony_ci{ 42062306a36Sopenharmony_ci if (uid_eq(current_euid(), GLOBAL_ROOT_UID)) 42162306a36Sopenharmony_ci mode >>= 6; 42262306a36Sopenharmony_ci else if (in_egroup_p(GLOBAL_ROOT_GID)) 42362306a36Sopenharmony_ci mode >>= 3; 42462306a36Sopenharmony_ci if ((op & ~mode & (MAY_READ|MAY_WRITE|MAY_EXEC)) == 0) 42562306a36Sopenharmony_ci return 0; 42662306a36Sopenharmony_ci return -EACCES; 42762306a36Sopenharmony_ci} 42862306a36Sopenharmony_ci 42962306a36Sopenharmony_cistatic int sysctl_perm(struct ctl_table_header *head, struct ctl_table *table, int op) 43062306a36Sopenharmony_ci{ 43162306a36Sopenharmony_ci struct ctl_table_root *root = head->root; 43262306a36Sopenharmony_ci int mode; 43362306a36Sopenharmony_ci 43462306a36Sopenharmony_ci if (root->permissions) 43562306a36Sopenharmony_ci mode = root->permissions(head, table); 43662306a36Sopenharmony_ci else 43762306a36Sopenharmony_ci mode = table->mode; 43862306a36Sopenharmony_ci 43962306a36Sopenharmony_ci return test_perm(mode, op); 44062306a36Sopenharmony_ci} 44162306a36Sopenharmony_ci 44262306a36Sopenharmony_cistatic struct inode *proc_sys_make_inode(struct super_block *sb, 44362306a36Sopenharmony_ci struct ctl_table_header *head, struct ctl_table *table) 44462306a36Sopenharmony_ci{ 44562306a36Sopenharmony_ci struct ctl_table_root *root = head->root; 44662306a36Sopenharmony_ci struct inode *inode; 44762306a36Sopenharmony_ci struct proc_inode *ei; 44862306a36Sopenharmony_ci 44962306a36Sopenharmony_ci inode = new_inode(sb); 45062306a36Sopenharmony_ci if (!inode) 45162306a36Sopenharmony_ci return ERR_PTR(-ENOMEM); 45262306a36Sopenharmony_ci 45362306a36Sopenharmony_ci inode->i_ino = get_next_ino(); 45462306a36Sopenharmony_ci 45562306a36Sopenharmony_ci ei = PROC_I(inode); 45662306a36Sopenharmony_ci 45762306a36Sopenharmony_ci spin_lock(&sysctl_lock); 45862306a36Sopenharmony_ci if (unlikely(head->unregistering)) { 45962306a36Sopenharmony_ci spin_unlock(&sysctl_lock); 46062306a36Sopenharmony_ci iput(inode); 46162306a36Sopenharmony_ci return ERR_PTR(-ENOENT); 46262306a36Sopenharmony_ci } 46362306a36Sopenharmony_ci ei->sysctl = head; 46462306a36Sopenharmony_ci ei->sysctl_entry = table; 46562306a36Sopenharmony_ci hlist_add_head_rcu(&ei->sibling_inodes, &head->inodes); 46662306a36Sopenharmony_ci head->count++; 46762306a36Sopenharmony_ci spin_unlock(&sysctl_lock); 46862306a36Sopenharmony_ci 46962306a36Sopenharmony_ci inode->i_mtime = inode->i_atime = inode_set_ctime_current(inode); 47062306a36Sopenharmony_ci inode->i_mode = table->mode; 47162306a36Sopenharmony_ci if (!S_ISDIR(table->mode)) { 47262306a36Sopenharmony_ci inode->i_mode |= S_IFREG; 47362306a36Sopenharmony_ci inode->i_op = &proc_sys_inode_operations; 47462306a36Sopenharmony_ci inode->i_fop = &proc_sys_file_operations; 47562306a36Sopenharmony_ci } else { 47662306a36Sopenharmony_ci inode->i_mode |= S_IFDIR; 47762306a36Sopenharmony_ci inode->i_op = &proc_sys_dir_operations; 47862306a36Sopenharmony_ci inode->i_fop = &proc_sys_dir_file_operations; 47962306a36Sopenharmony_ci if (sysctl_is_perm_empty_ctl_header(head)) 48062306a36Sopenharmony_ci make_empty_dir_inode(inode); 48162306a36Sopenharmony_ci } 48262306a36Sopenharmony_ci 48362306a36Sopenharmony_ci if (root->set_ownership) 48462306a36Sopenharmony_ci root->set_ownership(head, table, &inode->i_uid, &inode->i_gid); 48562306a36Sopenharmony_ci else { 48662306a36Sopenharmony_ci inode->i_uid = GLOBAL_ROOT_UID; 48762306a36Sopenharmony_ci inode->i_gid = GLOBAL_ROOT_GID; 48862306a36Sopenharmony_ci } 48962306a36Sopenharmony_ci 49062306a36Sopenharmony_ci return inode; 49162306a36Sopenharmony_ci} 49262306a36Sopenharmony_ci 49362306a36Sopenharmony_civoid proc_sys_evict_inode(struct inode *inode, struct ctl_table_header *head) 49462306a36Sopenharmony_ci{ 49562306a36Sopenharmony_ci spin_lock(&sysctl_lock); 49662306a36Sopenharmony_ci hlist_del_init_rcu(&PROC_I(inode)->sibling_inodes); 49762306a36Sopenharmony_ci if (!--head->count) 49862306a36Sopenharmony_ci kfree_rcu(head, rcu); 49962306a36Sopenharmony_ci spin_unlock(&sysctl_lock); 50062306a36Sopenharmony_ci} 50162306a36Sopenharmony_ci 50262306a36Sopenharmony_cistatic struct ctl_table_header *grab_header(struct inode *inode) 50362306a36Sopenharmony_ci{ 50462306a36Sopenharmony_ci struct ctl_table_header *head = PROC_I(inode)->sysctl; 50562306a36Sopenharmony_ci if (!head) 50662306a36Sopenharmony_ci head = &sysctl_table_root.default_set.dir.header; 50762306a36Sopenharmony_ci return sysctl_head_grab(head); 50862306a36Sopenharmony_ci} 50962306a36Sopenharmony_ci 51062306a36Sopenharmony_cistatic struct dentry *proc_sys_lookup(struct inode *dir, struct dentry *dentry, 51162306a36Sopenharmony_ci unsigned int flags) 51262306a36Sopenharmony_ci{ 51362306a36Sopenharmony_ci struct ctl_table_header *head = grab_header(dir); 51462306a36Sopenharmony_ci struct ctl_table_header *h = NULL; 51562306a36Sopenharmony_ci const struct qstr *name = &dentry->d_name; 51662306a36Sopenharmony_ci struct ctl_table *p; 51762306a36Sopenharmony_ci struct inode *inode; 51862306a36Sopenharmony_ci struct dentry *err = ERR_PTR(-ENOENT); 51962306a36Sopenharmony_ci struct ctl_dir *ctl_dir; 52062306a36Sopenharmony_ci int ret; 52162306a36Sopenharmony_ci 52262306a36Sopenharmony_ci if (IS_ERR(head)) 52362306a36Sopenharmony_ci return ERR_CAST(head); 52462306a36Sopenharmony_ci 52562306a36Sopenharmony_ci ctl_dir = container_of(head, struct ctl_dir, header); 52662306a36Sopenharmony_ci 52762306a36Sopenharmony_ci p = lookup_entry(&h, ctl_dir, name->name, name->len); 52862306a36Sopenharmony_ci if (!p) 52962306a36Sopenharmony_ci goto out; 53062306a36Sopenharmony_ci 53162306a36Sopenharmony_ci if (S_ISLNK(p->mode)) { 53262306a36Sopenharmony_ci ret = sysctl_follow_link(&h, &p); 53362306a36Sopenharmony_ci err = ERR_PTR(ret); 53462306a36Sopenharmony_ci if (ret) 53562306a36Sopenharmony_ci goto out; 53662306a36Sopenharmony_ci } 53762306a36Sopenharmony_ci 53862306a36Sopenharmony_ci inode = proc_sys_make_inode(dir->i_sb, h ? h : head, p); 53962306a36Sopenharmony_ci if (IS_ERR(inode)) { 54062306a36Sopenharmony_ci err = ERR_CAST(inode); 54162306a36Sopenharmony_ci goto out; 54262306a36Sopenharmony_ci } 54362306a36Sopenharmony_ci 54462306a36Sopenharmony_ci d_set_d_op(dentry, &proc_sys_dentry_operations); 54562306a36Sopenharmony_ci err = d_splice_alias(inode, dentry); 54662306a36Sopenharmony_ci 54762306a36Sopenharmony_ciout: 54862306a36Sopenharmony_ci if (h) 54962306a36Sopenharmony_ci sysctl_head_finish(h); 55062306a36Sopenharmony_ci sysctl_head_finish(head); 55162306a36Sopenharmony_ci return err; 55262306a36Sopenharmony_ci} 55362306a36Sopenharmony_ci 55462306a36Sopenharmony_cistatic ssize_t proc_sys_call_handler(struct kiocb *iocb, struct iov_iter *iter, 55562306a36Sopenharmony_ci int write) 55662306a36Sopenharmony_ci{ 55762306a36Sopenharmony_ci struct inode *inode = file_inode(iocb->ki_filp); 55862306a36Sopenharmony_ci struct ctl_table_header *head = grab_header(inode); 55962306a36Sopenharmony_ci struct ctl_table *table = PROC_I(inode)->sysctl_entry; 56062306a36Sopenharmony_ci size_t count = iov_iter_count(iter); 56162306a36Sopenharmony_ci char *kbuf; 56262306a36Sopenharmony_ci ssize_t error; 56362306a36Sopenharmony_ci 56462306a36Sopenharmony_ci if (IS_ERR(head)) 56562306a36Sopenharmony_ci return PTR_ERR(head); 56662306a36Sopenharmony_ci 56762306a36Sopenharmony_ci /* 56862306a36Sopenharmony_ci * At this point we know that the sysctl was not unregistered 56962306a36Sopenharmony_ci * and won't be until we finish. 57062306a36Sopenharmony_ci */ 57162306a36Sopenharmony_ci error = -EPERM; 57262306a36Sopenharmony_ci if (sysctl_perm(head, table, write ? MAY_WRITE : MAY_READ)) 57362306a36Sopenharmony_ci goto out; 57462306a36Sopenharmony_ci 57562306a36Sopenharmony_ci /* if that can happen at all, it should be -EINVAL, not -EISDIR */ 57662306a36Sopenharmony_ci error = -EINVAL; 57762306a36Sopenharmony_ci if (!table->proc_handler) 57862306a36Sopenharmony_ci goto out; 57962306a36Sopenharmony_ci 58062306a36Sopenharmony_ci /* don't even try if the size is too large */ 58162306a36Sopenharmony_ci error = -ENOMEM; 58262306a36Sopenharmony_ci if (count >= KMALLOC_MAX_SIZE) 58362306a36Sopenharmony_ci goto out; 58462306a36Sopenharmony_ci kbuf = kvzalloc(count + 1, GFP_KERNEL); 58562306a36Sopenharmony_ci if (!kbuf) 58662306a36Sopenharmony_ci goto out; 58762306a36Sopenharmony_ci 58862306a36Sopenharmony_ci if (write) { 58962306a36Sopenharmony_ci error = -EFAULT; 59062306a36Sopenharmony_ci if (!copy_from_iter_full(kbuf, count, iter)) 59162306a36Sopenharmony_ci goto out_free_buf; 59262306a36Sopenharmony_ci kbuf[count] = '\0'; 59362306a36Sopenharmony_ci } 59462306a36Sopenharmony_ci 59562306a36Sopenharmony_ci error = BPF_CGROUP_RUN_PROG_SYSCTL(head, table, write, &kbuf, &count, 59662306a36Sopenharmony_ci &iocb->ki_pos); 59762306a36Sopenharmony_ci if (error) 59862306a36Sopenharmony_ci goto out_free_buf; 59962306a36Sopenharmony_ci 60062306a36Sopenharmony_ci /* careful: calling conventions are nasty here */ 60162306a36Sopenharmony_ci error = table->proc_handler(table, write, kbuf, &count, &iocb->ki_pos); 60262306a36Sopenharmony_ci if (error) 60362306a36Sopenharmony_ci goto out_free_buf; 60462306a36Sopenharmony_ci 60562306a36Sopenharmony_ci if (!write) { 60662306a36Sopenharmony_ci error = -EFAULT; 60762306a36Sopenharmony_ci if (copy_to_iter(kbuf, count, iter) < count) 60862306a36Sopenharmony_ci goto out_free_buf; 60962306a36Sopenharmony_ci } 61062306a36Sopenharmony_ci 61162306a36Sopenharmony_ci error = count; 61262306a36Sopenharmony_ciout_free_buf: 61362306a36Sopenharmony_ci kvfree(kbuf); 61462306a36Sopenharmony_ciout: 61562306a36Sopenharmony_ci sysctl_head_finish(head); 61662306a36Sopenharmony_ci 61762306a36Sopenharmony_ci return error; 61862306a36Sopenharmony_ci} 61962306a36Sopenharmony_ci 62062306a36Sopenharmony_cistatic ssize_t proc_sys_read(struct kiocb *iocb, struct iov_iter *iter) 62162306a36Sopenharmony_ci{ 62262306a36Sopenharmony_ci return proc_sys_call_handler(iocb, iter, 0); 62362306a36Sopenharmony_ci} 62462306a36Sopenharmony_ci 62562306a36Sopenharmony_cistatic ssize_t proc_sys_write(struct kiocb *iocb, struct iov_iter *iter) 62662306a36Sopenharmony_ci{ 62762306a36Sopenharmony_ci return proc_sys_call_handler(iocb, iter, 1); 62862306a36Sopenharmony_ci} 62962306a36Sopenharmony_ci 63062306a36Sopenharmony_cistatic int proc_sys_open(struct inode *inode, struct file *filp) 63162306a36Sopenharmony_ci{ 63262306a36Sopenharmony_ci struct ctl_table_header *head = grab_header(inode); 63362306a36Sopenharmony_ci struct ctl_table *table = PROC_I(inode)->sysctl_entry; 63462306a36Sopenharmony_ci 63562306a36Sopenharmony_ci /* sysctl was unregistered */ 63662306a36Sopenharmony_ci if (IS_ERR(head)) 63762306a36Sopenharmony_ci return PTR_ERR(head); 63862306a36Sopenharmony_ci 63962306a36Sopenharmony_ci if (table->poll) 64062306a36Sopenharmony_ci filp->private_data = proc_sys_poll_event(table->poll); 64162306a36Sopenharmony_ci 64262306a36Sopenharmony_ci sysctl_head_finish(head); 64362306a36Sopenharmony_ci 64462306a36Sopenharmony_ci return 0; 64562306a36Sopenharmony_ci} 64662306a36Sopenharmony_ci 64762306a36Sopenharmony_cistatic __poll_t proc_sys_poll(struct file *filp, poll_table *wait) 64862306a36Sopenharmony_ci{ 64962306a36Sopenharmony_ci struct inode *inode = file_inode(filp); 65062306a36Sopenharmony_ci struct ctl_table_header *head = grab_header(inode); 65162306a36Sopenharmony_ci struct ctl_table *table = PROC_I(inode)->sysctl_entry; 65262306a36Sopenharmony_ci __poll_t ret = DEFAULT_POLLMASK; 65362306a36Sopenharmony_ci unsigned long event; 65462306a36Sopenharmony_ci 65562306a36Sopenharmony_ci /* sysctl was unregistered */ 65662306a36Sopenharmony_ci if (IS_ERR(head)) 65762306a36Sopenharmony_ci return EPOLLERR | EPOLLHUP; 65862306a36Sopenharmony_ci 65962306a36Sopenharmony_ci if (!table->proc_handler) 66062306a36Sopenharmony_ci goto out; 66162306a36Sopenharmony_ci 66262306a36Sopenharmony_ci if (!table->poll) 66362306a36Sopenharmony_ci goto out; 66462306a36Sopenharmony_ci 66562306a36Sopenharmony_ci event = (unsigned long)filp->private_data; 66662306a36Sopenharmony_ci poll_wait(filp, &table->poll->wait, wait); 66762306a36Sopenharmony_ci 66862306a36Sopenharmony_ci if (event != atomic_read(&table->poll->event)) { 66962306a36Sopenharmony_ci filp->private_data = proc_sys_poll_event(table->poll); 67062306a36Sopenharmony_ci ret = EPOLLIN | EPOLLRDNORM | EPOLLERR | EPOLLPRI; 67162306a36Sopenharmony_ci } 67262306a36Sopenharmony_ci 67362306a36Sopenharmony_ciout: 67462306a36Sopenharmony_ci sysctl_head_finish(head); 67562306a36Sopenharmony_ci 67662306a36Sopenharmony_ci return ret; 67762306a36Sopenharmony_ci} 67862306a36Sopenharmony_ci 67962306a36Sopenharmony_cistatic bool proc_sys_fill_cache(struct file *file, 68062306a36Sopenharmony_ci struct dir_context *ctx, 68162306a36Sopenharmony_ci struct ctl_table_header *head, 68262306a36Sopenharmony_ci struct ctl_table *table) 68362306a36Sopenharmony_ci{ 68462306a36Sopenharmony_ci struct dentry *child, *dir = file->f_path.dentry; 68562306a36Sopenharmony_ci struct inode *inode; 68662306a36Sopenharmony_ci struct qstr qname; 68762306a36Sopenharmony_ci ino_t ino = 0; 68862306a36Sopenharmony_ci unsigned type = DT_UNKNOWN; 68962306a36Sopenharmony_ci 69062306a36Sopenharmony_ci qname.name = table->procname; 69162306a36Sopenharmony_ci qname.len = strlen(table->procname); 69262306a36Sopenharmony_ci qname.hash = full_name_hash(dir, qname.name, qname.len); 69362306a36Sopenharmony_ci 69462306a36Sopenharmony_ci child = d_lookup(dir, &qname); 69562306a36Sopenharmony_ci if (!child) { 69662306a36Sopenharmony_ci DECLARE_WAIT_QUEUE_HEAD_ONSTACK(wq); 69762306a36Sopenharmony_ci child = d_alloc_parallel(dir, &qname, &wq); 69862306a36Sopenharmony_ci if (IS_ERR(child)) 69962306a36Sopenharmony_ci return false; 70062306a36Sopenharmony_ci if (d_in_lookup(child)) { 70162306a36Sopenharmony_ci struct dentry *res; 70262306a36Sopenharmony_ci inode = proc_sys_make_inode(dir->d_sb, head, table); 70362306a36Sopenharmony_ci if (IS_ERR(inode)) { 70462306a36Sopenharmony_ci d_lookup_done(child); 70562306a36Sopenharmony_ci dput(child); 70662306a36Sopenharmony_ci return false; 70762306a36Sopenharmony_ci } 70862306a36Sopenharmony_ci d_set_d_op(child, &proc_sys_dentry_operations); 70962306a36Sopenharmony_ci res = d_splice_alias(inode, child); 71062306a36Sopenharmony_ci d_lookup_done(child); 71162306a36Sopenharmony_ci if (unlikely(res)) { 71262306a36Sopenharmony_ci if (IS_ERR(res)) { 71362306a36Sopenharmony_ci dput(child); 71462306a36Sopenharmony_ci return false; 71562306a36Sopenharmony_ci } 71662306a36Sopenharmony_ci dput(child); 71762306a36Sopenharmony_ci child = res; 71862306a36Sopenharmony_ci } 71962306a36Sopenharmony_ci } 72062306a36Sopenharmony_ci } 72162306a36Sopenharmony_ci inode = d_inode(child); 72262306a36Sopenharmony_ci ino = inode->i_ino; 72362306a36Sopenharmony_ci type = inode->i_mode >> 12; 72462306a36Sopenharmony_ci dput(child); 72562306a36Sopenharmony_ci return dir_emit(ctx, qname.name, qname.len, ino, type); 72662306a36Sopenharmony_ci} 72762306a36Sopenharmony_ci 72862306a36Sopenharmony_cistatic bool proc_sys_link_fill_cache(struct file *file, 72962306a36Sopenharmony_ci struct dir_context *ctx, 73062306a36Sopenharmony_ci struct ctl_table_header *head, 73162306a36Sopenharmony_ci struct ctl_table *table) 73262306a36Sopenharmony_ci{ 73362306a36Sopenharmony_ci bool ret = true; 73462306a36Sopenharmony_ci 73562306a36Sopenharmony_ci head = sysctl_head_grab(head); 73662306a36Sopenharmony_ci if (IS_ERR(head)) 73762306a36Sopenharmony_ci return false; 73862306a36Sopenharmony_ci 73962306a36Sopenharmony_ci /* It is not an error if we can not follow the link ignore it */ 74062306a36Sopenharmony_ci if (sysctl_follow_link(&head, &table)) 74162306a36Sopenharmony_ci goto out; 74262306a36Sopenharmony_ci 74362306a36Sopenharmony_ci ret = proc_sys_fill_cache(file, ctx, head, table); 74462306a36Sopenharmony_ciout: 74562306a36Sopenharmony_ci sysctl_head_finish(head); 74662306a36Sopenharmony_ci return ret; 74762306a36Sopenharmony_ci} 74862306a36Sopenharmony_ci 74962306a36Sopenharmony_cistatic int scan(struct ctl_table_header *head, struct ctl_table *table, 75062306a36Sopenharmony_ci unsigned long *pos, struct file *file, 75162306a36Sopenharmony_ci struct dir_context *ctx) 75262306a36Sopenharmony_ci{ 75362306a36Sopenharmony_ci bool res; 75462306a36Sopenharmony_ci 75562306a36Sopenharmony_ci if ((*pos)++ < ctx->pos) 75662306a36Sopenharmony_ci return true; 75762306a36Sopenharmony_ci 75862306a36Sopenharmony_ci if (unlikely(S_ISLNK(table->mode))) 75962306a36Sopenharmony_ci res = proc_sys_link_fill_cache(file, ctx, head, table); 76062306a36Sopenharmony_ci else 76162306a36Sopenharmony_ci res = proc_sys_fill_cache(file, ctx, head, table); 76262306a36Sopenharmony_ci 76362306a36Sopenharmony_ci if (res) 76462306a36Sopenharmony_ci ctx->pos = *pos; 76562306a36Sopenharmony_ci 76662306a36Sopenharmony_ci return res; 76762306a36Sopenharmony_ci} 76862306a36Sopenharmony_ci 76962306a36Sopenharmony_cistatic int proc_sys_readdir(struct file *file, struct dir_context *ctx) 77062306a36Sopenharmony_ci{ 77162306a36Sopenharmony_ci struct ctl_table_header *head = grab_header(file_inode(file)); 77262306a36Sopenharmony_ci struct ctl_table_header *h = NULL; 77362306a36Sopenharmony_ci struct ctl_table *entry; 77462306a36Sopenharmony_ci struct ctl_dir *ctl_dir; 77562306a36Sopenharmony_ci unsigned long pos; 77662306a36Sopenharmony_ci 77762306a36Sopenharmony_ci if (IS_ERR(head)) 77862306a36Sopenharmony_ci return PTR_ERR(head); 77962306a36Sopenharmony_ci 78062306a36Sopenharmony_ci ctl_dir = container_of(head, struct ctl_dir, header); 78162306a36Sopenharmony_ci 78262306a36Sopenharmony_ci if (!dir_emit_dots(file, ctx)) 78362306a36Sopenharmony_ci goto out; 78462306a36Sopenharmony_ci 78562306a36Sopenharmony_ci pos = 2; 78662306a36Sopenharmony_ci 78762306a36Sopenharmony_ci for (first_entry(ctl_dir, &h, &entry); h; next_entry(&h, &entry)) { 78862306a36Sopenharmony_ci if (!scan(h, entry, &pos, file, ctx)) { 78962306a36Sopenharmony_ci sysctl_head_finish(h); 79062306a36Sopenharmony_ci break; 79162306a36Sopenharmony_ci } 79262306a36Sopenharmony_ci } 79362306a36Sopenharmony_ciout: 79462306a36Sopenharmony_ci sysctl_head_finish(head); 79562306a36Sopenharmony_ci return 0; 79662306a36Sopenharmony_ci} 79762306a36Sopenharmony_ci 79862306a36Sopenharmony_cistatic int proc_sys_permission(struct mnt_idmap *idmap, 79962306a36Sopenharmony_ci struct inode *inode, int mask) 80062306a36Sopenharmony_ci{ 80162306a36Sopenharmony_ci /* 80262306a36Sopenharmony_ci * sysctl entries that are not writeable, 80362306a36Sopenharmony_ci * are _NOT_ writeable, capabilities or not. 80462306a36Sopenharmony_ci */ 80562306a36Sopenharmony_ci struct ctl_table_header *head; 80662306a36Sopenharmony_ci struct ctl_table *table; 80762306a36Sopenharmony_ci int error; 80862306a36Sopenharmony_ci 80962306a36Sopenharmony_ci /* Executable files are not allowed under /proc/sys/ */ 81062306a36Sopenharmony_ci if ((mask & MAY_EXEC) && S_ISREG(inode->i_mode)) 81162306a36Sopenharmony_ci return -EACCES; 81262306a36Sopenharmony_ci 81362306a36Sopenharmony_ci head = grab_header(inode); 81462306a36Sopenharmony_ci if (IS_ERR(head)) 81562306a36Sopenharmony_ci return PTR_ERR(head); 81662306a36Sopenharmony_ci 81762306a36Sopenharmony_ci table = PROC_I(inode)->sysctl_entry; 81862306a36Sopenharmony_ci if (!table) /* global root - r-xr-xr-x */ 81962306a36Sopenharmony_ci error = mask & MAY_WRITE ? -EACCES : 0; 82062306a36Sopenharmony_ci else /* Use the permissions on the sysctl table entry */ 82162306a36Sopenharmony_ci error = sysctl_perm(head, table, mask & ~MAY_NOT_BLOCK); 82262306a36Sopenharmony_ci 82362306a36Sopenharmony_ci sysctl_head_finish(head); 82462306a36Sopenharmony_ci return error; 82562306a36Sopenharmony_ci} 82662306a36Sopenharmony_ci 82762306a36Sopenharmony_cistatic int proc_sys_setattr(struct mnt_idmap *idmap, 82862306a36Sopenharmony_ci struct dentry *dentry, struct iattr *attr) 82962306a36Sopenharmony_ci{ 83062306a36Sopenharmony_ci struct inode *inode = d_inode(dentry); 83162306a36Sopenharmony_ci int error; 83262306a36Sopenharmony_ci 83362306a36Sopenharmony_ci if (attr->ia_valid & (ATTR_MODE | ATTR_UID | ATTR_GID)) 83462306a36Sopenharmony_ci return -EPERM; 83562306a36Sopenharmony_ci 83662306a36Sopenharmony_ci error = setattr_prepare(&nop_mnt_idmap, dentry, attr); 83762306a36Sopenharmony_ci if (error) 83862306a36Sopenharmony_ci return error; 83962306a36Sopenharmony_ci 84062306a36Sopenharmony_ci setattr_copy(&nop_mnt_idmap, inode, attr); 84162306a36Sopenharmony_ci return 0; 84262306a36Sopenharmony_ci} 84362306a36Sopenharmony_ci 84462306a36Sopenharmony_cistatic int proc_sys_getattr(struct mnt_idmap *idmap, 84562306a36Sopenharmony_ci const struct path *path, struct kstat *stat, 84662306a36Sopenharmony_ci u32 request_mask, unsigned int query_flags) 84762306a36Sopenharmony_ci{ 84862306a36Sopenharmony_ci struct inode *inode = d_inode(path->dentry); 84962306a36Sopenharmony_ci struct ctl_table_header *head = grab_header(inode); 85062306a36Sopenharmony_ci struct ctl_table *table = PROC_I(inode)->sysctl_entry; 85162306a36Sopenharmony_ci 85262306a36Sopenharmony_ci if (IS_ERR(head)) 85362306a36Sopenharmony_ci return PTR_ERR(head); 85462306a36Sopenharmony_ci 85562306a36Sopenharmony_ci generic_fillattr(&nop_mnt_idmap, request_mask, inode, stat); 85662306a36Sopenharmony_ci if (table) 85762306a36Sopenharmony_ci stat->mode = (stat->mode & S_IFMT) | table->mode; 85862306a36Sopenharmony_ci 85962306a36Sopenharmony_ci sysctl_head_finish(head); 86062306a36Sopenharmony_ci return 0; 86162306a36Sopenharmony_ci} 86262306a36Sopenharmony_ci 86362306a36Sopenharmony_cistatic const struct file_operations proc_sys_file_operations = { 86462306a36Sopenharmony_ci .open = proc_sys_open, 86562306a36Sopenharmony_ci .poll = proc_sys_poll, 86662306a36Sopenharmony_ci .read_iter = proc_sys_read, 86762306a36Sopenharmony_ci .write_iter = proc_sys_write, 86862306a36Sopenharmony_ci .splice_read = copy_splice_read, 86962306a36Sopenharmony_ci .splice_write = iter_file_splice_write, 87062306a36Sopenharmony_ci .llseek = default_llseek, 87162306a36Sopenharmony_ci}; 87262306a36Sopenharmony_ci 87362306a36Sopenharmony_cistatic const struct file_operations proc_sys_dir_file_operations = { 87462306a36Sopenharmony_ci .read = generic_read_dir, 87562306a36Sopenharmony_ci .iterate_shared = proc_sys_readdir, 87662306a36Sopenharmony_ci .llseek = generic_file_llseek, 87762306a36Sopenharmony_ci}; 87862306a36Sopenharmony_ci 87962306a36Sopenharmony_cistatic const struct inode_operations proc_sys_inode_operations = { 88062306a36Sopenharmony_ci .permission = proc_sys_permission, 88162306a36Sopenharmony_ci .setattr = proc_sys_setattr, 88262306a36Sopenharmony_ci .getattr = proc_sys_getattr, 88362306a36Sopenharmony_ci}; 88462306a36Sopenharmony_ci 88562306a36Sopenharmony_cistatic const struct inode_operations proc_sys_dir_operations = { 88662306a36Sopenharmony_ci .lookup = proc_sys_lookup, 88762306a36Sopenharmony_ci .permission = proc_sys_permission, 88862306a36Sopenharmony_ci .setattr = proc_sys_setattr, 88962306a36Sopenharmony_ci .getattr = proc_sys_getattr, 89062306a36Sopenharmony_ci}; 89162306a36Sopenharmony_ci 89262306a36Sopenharmony_cistatic int proc_sys_revalidate(struct dentry *dentry, unsigned int flags) 89362306a36Sopenharmony_ci{ 89462306a36Sopenharmony_ci if (flags & LOOKUP_RCU) 89562306a36Sopenharmony_ci return -ECHILD; 89662306a36Sopenharmony_ci return !PROC_I(d_inode(dentry))->sysctl->unregistering; 89762306a36Sopenharmony_ci} 89862306a36Sopenharmony_ci 89962306a36Sopenharmony_cistatic int proc_sys_delete(const struct dentry *dentry) 90062306a36Sopenharmony_ci{ 90162306a36Sopenharmony_ci return !!PROC_I(d_inode(dentry))->sysctl->unregistering; 90262306a36Sopenharmony_ci} 90362306a36Sopenharmony_ci 90462306a36Sopenharmony_cistatic int sysctl_is_seen(struct ctl_table_header *p) 90562306a36Sopenharmony_ci{ 90662306a36Sopenharmony_ci struct ctl_table_set *set = p->set; 90762306a36Sopenharmony_ci int res; 90862306a36Sopenharmony_ci spin_lock(&sysctl_lock); 90962306a36Sopenharmony_ci if (p->unregistering) 91062306a36Sopenharmony_ci res = 0; 91162306a36Sopenharmony_ci else if (!set->is_seen) 91262306a36Sopenharmony_ci res = 1; 91362306a36Sopenharmony_ci else 91462306a36Sopenharmony_ci res = set->is_seen(set); 91562306a36Sopenharmony_ci spin_unlock(&sysctl_lock); 91662306a36Sopenharmony_ci return res; 91762306a36Sopenharmony_ci} 91862306a36Sopenharmony_ci 91962306a36Sopenharmony_cistatic int proc_sys_compare(const struct dentry *dentry, 92062306a36Sopenharmony_ci unsigned int len, const char *str, const struct qstr *name) 92162306a36Sopenharmony_ci{ 92262306a36Sopenharmony_ci struct ctl_table_header *head; 92362306a36Sopenharmony_ci struct inode *inode; 92462306a36Sopenharmony_ci 92562306a36Sopenharmony_ci /* Although proc doesn't have negative dentries, rcu-walk means 92662306a36Sopenharmony_ci * that inode here can be NULL */ 92762306a36Sopenharmony_ci /* AV: can it, indeed? */ 92862306a36Sopenharmony_ci inode = d_inode_rcu(dentry); 92962306a36Sopenharmony_ci if (!inode) 93062306a36Sopenharmony_ci return 1; 93162306a36Sopenharmony_ci if (name->len != len) 93262306a36Sopenharmony_ci return 1; 93362306a36Sopenharmony_ci if (memcmp(name->name, str, len)) 93462306a36Sopenharmony_ci return 1; 93562306a36Sopenharmony_ci head = rcu_dereference(PROC_I(inode)->sysctl); 93662306a36Sopenharmony_ci return !head || !sysctl_is_seen(head); 93762306a36Sopenharmony_ci} 93862306a36Sopenharmony_ci 93962306a36Sopenharmony_cistatic const struct dentry_operations proc_sys_dentry_operations = { 94062306a36Sopenharmony_ci .d_revalidate = proc_sys_revalidate, 94162306a36Sopenharmony_ci .d_delete = proc_sys_delete, 94262306a36Sopenharmony_ci .d_compare = proc_sys_compare, 94362306a36Sopenharmony_ci}; 94462306a36Sopenharmony_ci 94562306a36Sopenharmony_cistatic struct ctl_dir *find_subdir(struct ctl_dir *dir, 94662306a36Sopenharmony_ci const char *name, int namelen) 94762306a36Sopenharmony_ci{ 94862306a36Sopenharmony_ci struct ctl_table_header *head; 94962306a36Sopenharmony_ci struct ctl_table *entry; 95062306a36Sopenharmony_ci 95162306a36Sopenharmony_ci entry = find_entry(&head, dir, name, namelen); 95262306a36Sopenharmony_ci if (!entry) 95362306a36Sopenharmony_ci return ERR_PTR(-ENOENT); 95462306a36Sopenharmony_ci if (!S_ISDIR(entry->mode)) 95562306a36Sopenharmony_ci return ERR_PTR(-ENOTDIR); 95662306a36Sopenharmony_ci return container_of(head, struct ctl_dir, header); 95762306a36Sopenharmony_ci} 95862306a36Sopenharmony_ci 95962306a36Sopenharmony_cistatic struct ctl_dir *new_dir(struct ctl_table_set *set, 96062306a36Sopenharmony_ci const char *name, int namelen) 96162306a36Sopenharmony_ci{ 96262306a36Sopenharmony_ci struct ctl_table *table; 96362306a36Sopenharmony_ci struct ctl_dir *new; 96462306a36Sopenharmony_ci struct ctl_node *node; 96562306a36Sopenharmony_ci char *new_name; 96662306a36Sopenharmony_ci 96762306a36Sopenharmony_ci new = kzalloc(sizeof(*new) + sizeof(struct ctl_node) + 96862306a36Sopenharmony_ci sizeof(struct ctl_table)*2 + namelen + 1, 96962306a36Sopenharmony_ci GFP_KERNEL); 97062306a36Sopenharmony_ci if (!new) 97162306a36Sopenharmony_ci return NULL; 97262306a36Sopenharmony_ci 97362306a36Sopenharmony_ci node = (struct ctl_node *)(new + 1); 97462306a36Sopenharmony_ci table = (struct ctl_table *)(node + 1); 97562306a36Sopenharmony_ci new_name = (char *)(table + 2); 97662306a36Sopenharmony_ci memcpy(new_name, name, namelen); 97762306a36Sopenharmony_ci table[0].procname = new_name; 97862306a36Sopenharmony_ci table[0].mode = S_IFDIR|S_IRUGO|S_IXUGO; 97962306a36Sopenharmony_ci init_header(&new->header, set->dir.header.root, set, node, table, 1); 98062306a36Sopenharmony_ci 98162306a36Sopenharmony_ci return new; 98262306a36Sopenharmony_ci} 98362306a36Sopenharmony_ci 98462306a36Sopenharmony_ci/** 98562306a36Sopenharmony_ci * get_subdir - find or create a subdir with the specified name. 98662306a36Sopenharmony_ci * @dir: Directory to create the subdirectory in 98762306a36Sopenharmony_ci * @name: The name of the subdirectory to find or create 98862306a36Sopenharmony_ci * @namelen: The length of name 98962306a36Sopenharmony_ci * 99062306a36Sopenharmony_ci * Takes a directory with an elevated reference count so we know that 99162306a36Sopenharmony_ci * if we drop the lock the directory will not go away. Upon success 99262306a36Sopenharmony_ci * the reference is moved from @dir to the returned subdirectory. 99362306a36Sopenharmony_ci * Upon error an error code is returned and the reference on @dir is 99462306a36Sopenharmony_ci * simply dropped. 99562306a36Sopenharmony_ci */ 99662306a36Sopenharmony_cistatic struct ctl_dir *get_subdir(struct ctl_dir *dir, 99762306a36Sopenharmony_ci const char *name, int namelen) 99862306a36Sopenharmony_ci{ 99962306a36Sopenharmony_ci struct ctl_table_set *set = dir->header.set; 100062306a36Sopenharmony_ci struct ctl_dir *subdir, *new = NULL; 100162306a36Sopenharmony_ci int err; 100262306a36Sopenharmony_ci 100362306a36Sopenharmony_ci spin_lock(&sysctl_lock); 100462306a36Sopenharmony_ci subdir = find_subdir(dir, name, namelen); 100562306a36Sopenharmony_ci if (!IS_ERR(subdir)) 100662306a36Sopenharmony_ci goto found; 100762306a36Sopenharmony_ci if (PTR_ERR(subdir) != -ENOENT) 100862306a36Sopenharmony_ci goto failed; 100962306a36Sopenharmony_ci 101062306a36Sopenharmony_ci spin_unlock(&sysctl_lock); 101162306a36Sopenharmony_ci new = new_dir(set, name, namelen); 101262306a36Sopenharmony_ci spin_lock(&sysctl_lock); 101362306a36Sopenharmony_ci subdir = ERR_PTR(-ENOMEM); 101462306a36Sopenharmony_ci if (!new) 101562306a36Sopenharmony_ci goto failed; 101662306a36Sopenharmony_ci 101762306a36Sopenharmony_ci /* Was the subdir added while we dropped the lock? */ 101862306a36Sopenharmony_ci subdir = find_subdir(dir, name, namelen); 101962306a36Sopenharmony_ci if (!IS_ERR(subdir)) 102062306a36Sopenharmony_ci goto found; 102162306a36Sopenharmony_ci if (PTR_ERR(subdir) != -ENOENT) 102262306a36Sopenharmony_ci goto failed; 102362306a36Sopenharmony_ci 102462306a36Sopenharmony_ci /* Nope. Use the our freshly made directory entry. */ 102562306a36Sopenharmony_ci err = insert_header(dir, &new->header); 102662306a36Sopenharmony_ci subdir = ERR_PTR(err); 102762306a36Sopenharmony_ci if (err) 102862306a36Sopenharmony_ci goto failed; 102962306a36Sopenharmony_ci subdir = new; 103062306a36Sopenharmony_cifound: 103162306a36Sopenharmony_ci subdir->header.nreg++; 103262306a36Sopenharmony_cifailed: 103362306a36Sopenharmony_ci if (IS_ERR(subdir)) { 103462306a36Sopenharmony_ci pr_err("sysctl could not get directory: "); 103562306a36Sopenharmony_ci sysctl_print_dir(dir); 103662306a36Sopenharmony_ci pr_cont("%*.*s %ld\n", namelen, namelen, name, 103762306a36Sopenharmony_ci PTR_ERR(subdir)); 103862306a36Sopenharmony_ci } 103962306a36Sopenharmony_ci drop_sysctl_table(&dir->header); 104062306a36Sopenharmony_ci if (new) 104162306a36Sopenharmony_ci drop_sysctl_table(&new->header); 104262306a36Sopenharmony_ci spin_unlock(&sysctl_lock); 104362306a36Sopenharmony_ci return subdir; 104462306a36Sopenharmony_ci} 104562306a36Sopenharmony_ci 104662306a36Sopenharmony_cistatic struct ctl_dir *xlate_dir(struct ctl_table_set *set, struct ctl_dir *dir) 104762306a36Sopenharmony_ci{ 104862306a36Sopenharmony_ci struct ctl_dir *parent; 104962306a36Sopenharmony_ci const char *procname; 105062306a36Sopenharmony_ci if (!dir->header.parent) 105162306a36Sopenharmony_ci return &set->dir; 105262306a36Sopenharmony_ci parent = xlate_dir(set, dir->header.parent); 105362306a36Sopenharmony_ci if (IS_ERR(parent)) 105462306a36Sopenharmony_ci return parent; 105562306a36Sopenharmony_ci procname = dir->header.ctl_table[0].procname; 105662306a36Sopenharmony_ci return find_subdir(parent, procname, strlen(procname)); 105762306a36Sopenharmony_ci} 105862306a36Sopenharmony_ci 105962306a36Sopenharmony_cistatic int sysctl_follow_link(struct ctl_table_header **phead, 106062306a36Sopenharmony_ci struct ctl_table **pentry) 106162306a36Sopenharmony_ci{ 106262306a36Sopenharmony_ci struct ctl_table_header *head; 106362306a36Sopenharmony_ci struct ctl_table_root *root; 106462306a36Sopenharmony_ci struct ctl_table_set *set; 106562306a36Sopenharmony_ci struct ctl_table *entry; 106662306a36Sopenharmony_ci struct ctl_dir *dir; 106762306a36Sopenharmony_ci int ret; 106862306a36Sopenharmony_ci 106962306a36Sopenharmony_ci spin_lock(&sysctl_lock); 107062306a36Sopenharmony_ci root = (*pentry)->data; 107162306a36Sopenharmony_ci set = lookup_header_set(root); 107262306a36Sopenharmony_ci dir = xlate_dir(set, (*phead)->parent); 107362306a36Sopenharmony_ci if (IS_ERR(dir)) 107462306a36Sopenharmony_ci ret = PTR_ERR(dir); 107562306a36Sopenharmony_ci else { 107662306a36Sopenharmony_ci const char *procname = (*pentry)->procname; 107762306a36Sopenharmony_ci head = NULL; 107862306a36Sopenharmony_ci entry = find_entry(&head, dir, procname, strlen(procname)); 107962306a36Sopenharmony_ci ret = -ENOENT; 108062306a36Sopenharmony_ci if (entry && use_table(head)) { 108162306a36Sopenharmony_ci unuse_table(*phead); 108262306a36Sopenharmony_ci *phead = head; 108362306a36Sopenharmony_ci *pentry = entry; 108462306a36Sopenharmony_ci ret = 0; 108562306a36Sopenharmony_ci } 108662306a36Sopenharmony_ci } 108762306a36Sopenharmony_ci 108862306a36Sopenharmony_ci spin_unlock(&sysctl_lock); 108962306a36Sopenharmony_ci return ret; 109062306a36Sopenharmony_ci} 109162306a36Sopenharmony_ci 109262306a36Sopenharmony_cistatic int sysctl_err(const char *path, struct ctl_table *table, char *fmt, ...) 109362306a36Sopenharmony_ci{ 109462306a36Sopenharmony_ci struct va_format vaf; 109562306a36Sopenharmony_ci va_list args; 109662306a36Sopenharmony_ci 109762306a36Sopenharmony_ci va_start(args, fmt); 109862306a36Sopenharmony_ci vaf.fmt = fmt; 109962306a36Sopenharmony_ci vaf.va = &args; 110062306a36Sopenharmony_ci 110162306a36Sopenharmony_ci pr_err("sysctl table check failed: %s/%s %pV\n", 110262306a36Sopenharmony_ci path, table->procname, &vaf); 110362306a36Sopenharmony_ci 110462306a36Sopenharmony_ci va_end(args); 110562306a36Sopenharmony_ci return -EINVAL; 110662306a36Sopenharmony_ci} 110762306a36Sopenharmony_ci 110862306a36Sopenharmony_cistatic int sysctl_check_table_array(const char *path, struct ctl_table *table) 110962306a36Sopenharmony_ci{ 111062306a36Sopenharmony_ci int err = 0; 111162306a36Sopenharmony_ci 111262306a36Sopenharmony_ci if ((table->proc_handler == proc_douintvec) || 111362306a36Sopenharmony_ci (table->proc_handler == proc_douintvec_minmax)) { 111462306a36Sopenharmony_ci if (table->maxlen != sizeof(unsigned int)) 111562306a36Sopenharmony_ci err |= sysctl_err(path, table, "array not allowed"); 111662306a36Sopenharmony_ci } 111762306a36Sopenharmony_ci 111862306a36Sopenharmony_ci if (table->proc_handler == proc_dou8vec_minmax) { 111962306a36Sopenharmony_ci if (table->maxlen != sizeof(u8)) 112062306a36Sopenharmony_ci err |= sysctl_err(path, table, "array not allowed"); 112162306a36Sopenharmony_ci } 112262306a36Sopenharmony_ci 112362306a36Sopenharmony_ci if (table->proc_handler == proc_dobool) { 112462306a36Sopenharmony_ci if (table->maxlen != sizeof(bool)) 112562306a36Sopenharmony_ci err |= sysctl_err(path, table, "array not allowed"); 112662306a36Sopenharmony_ci } 112762306a36Sopenharmony_ci 112862306a36Sopenharmony_ci return err; 112962306a36Sopenharmony_ci} 113062306a36Sopenharmony_ci 113162306a36Sopenharmony_cistatic int sysctl_check_table(const char *path, struct ctl_table_header *header) 113262306a36Sopenharmony_ci{ 113362306a36Sopenharmony_ci struct ctl_table *entry; 113462306a36Sopenharmony_ci int err = 0; 113562306a36Sopenharmony_ci list_for_each_table_entry(entry, header) { 113662306a36Sopenharmony_ci if ((entry->proc_handler == proc_dostring) || 113762306a36Sopenharmony_ci (entry->proc_handler == proc_dobool) || 113862306a36Sopenharmony_ci (entry->proc_handler == proc_dointvec) || 113962306a36Sopenharmony_ci (entry->proc_handler == proc_douintvec) || 114062306a36Sopenharmony_ci (entry->proc_handler == proc_douintvec_minmax) || 114162306a36Sopenharmony_ci (entry->proc_handler == proc_dointvec_minmax) || 114262306a36Sopenharmony_ci (entry->proc_handler == proc_dou8vec_minmax) || 114362306a36Sopenharmony_ci (entry->proc_handler == proc_dointvec_jiffies) || 114462306a36Sopenharmony_ci (entry->proc_handler == proc_dointvec_userhz_jiffies) || 114562306a36Sopenharmony_ci (entry->proc_handler == proc_dointvec_ms_jiffies) || 114662306a36Sopenharmony_ci (entry->proc_handler == proc_doulongvec_minmax) || 114762306a36Sopenharmony_ci (entry->proc_handler == proc_doulongvec_ms_jiffies_minmax)) { 114862306a36Sopenharmony_ci if (!entry->data) 114962306a36Sopenharmony_ci err |= sysctl_err(path, entry, "No data"); 115062306a36Sopenharmony_ci if (!entry->maxlen) 115162306a36Sopenharmony_ci err |= sysctl_err(path, entry, "No maxlen"); 115262306a36Sopenharmony_ci else 115362306a36Sopenharmony_ci err |= sysctl_check_table_array(path, entry); 115462306a36Sopenharmony_ci } 115562306a36Sopenharmony_ci if (!entry->proc_handler) 115662306a36Sopenharmony_ci err |= sysctl_err(path, entry, "No proc_handler"); 115762306a36Sopenharmony_ci 115862306a36Sopenharmony_ci if ((entry->mode & (S_IRUGO|S_IWUGO)) != entry->mode) 115962306a36Sopenharmony_ci err |= sysctl_err(path, entry, "bogus .mode 0%o", 116062306a36Sopenharmony_ci entry->mode); 116162306a36Sopenharmony_ci } 116262306a36Sopenharmony_ci return err; 116362306a36Sopenharmony_ci} 116462306a36Sopenharmony_ci 116562306a36Sopenharmony_cistatic struct ctl_table_header *new_links(struct ctl_dir *dir, struct ctl_table_header *head) 116662306a36Sopenharmony_ci{ 116762306a36Sopenharmony_ci struct ctl_table *link_table, *entry, *link; 116862306a36Sopenharmony_ci struct ctl_table_header *links; 116962306a36Sopenharmony_ci struct ctl_node *node; 117062306a36Sopenharmony_ci char *link_name; 117162306a36Sopenharmony_ci int nr_entries, name_bytes; 117262306a36Sopenharmony_ci 117362306a36Sopenharmony_ci name_bytes = 0; 117462306a36Sopenharmony_ci nr_entries = 0; 117562306a36Sopenharmony_ci list_for_each_table_entry(entry, head) { 117662306a36Sopenharmony_ci nr_entries++; 117762306a36Sopenharmony_ci name_bytes += strlen(entry->procname) + 1; 117862306a36Sopenharmony_ci } 117962306a36Sopenharmony_ci 118062306a36Sopenharmony_ci links = kzalloc(sizeof(struct ctl_table_header) + 118162306a36Sopenharmony_ci sizeof(struct ctl_node)*nr_entries + 118262306a36Sopenharmony_ci sizeof(struct ctl_table)*(nr_entries + 1) + 118362306a36Sopenharmony_ci name_bytes, 118462306a36Sopenharmony_ci GFP_KERNEL); 118562306a36Sopenharmony_ci 118662306a36Sopenharmony_ci if (!links) 118762306a36Sopenharmony_ci return NULL; 118862306a36Sopenharmony_ci 118962306a36Sopenharmony_ci node = (struct ctl_node *)(links + 1); 119062306a36Sopenharmony_ci link_table = (struct ctl_table *)(node + nr_entries); 119162306a36Sopenharmony_ci link_name = (char *)&link_table[nr_entries + 1]; 119262306a36Sopenharmony_ci link = link_table; 119362306a36Sopenharmony_ci 119462306a36Sopenharmony_ci list_for_each_table_entry(entry, head) { 119562306a36Sopenharmony_ci int len = strlen(entry->procname) + 1; 119662306a36Sopenharmony_ci memcpy(link_name, entry->procname, len); 119762306a36Sopenharmony_ci link->procname = link_name; 119862306a36Sopenharmony_ci link->mode = S_IFLNK|S_IRWXUGO; 119962306a36Sopenharmony_ci link->data = head->root; 120062306a36Sopenharmony_ci link_name += len; 120162306a36Sopenharmony_ci link++; 120262306a36Sopenharmony_ci } 120362306a36Sopenharmony_ci init_header(links, dir->header.root, dir->header.set, node, link_table, 120462306a36Sopenharmony_ci head->ctl_table_size); 120562306a36Sopenharmony_ci links->nreg = nr_entries; 120662306a36Sopenharmony_ci 120762306a36Sopenharmony_ci return links; 120862306a36Sopenharmony_ci} 120962306a36Sopenharmony_ci 121062306a36Sopenharmony_cistatic bool get_links(struct ctl_dir *dir, 121162306a36Sopenharmony_ci struct ctl_table_header *header, 121262306a36Sopenharmony_ci struct ctl_table_root *link_root) 121362306a36Sopenharmony_ci{ 121462306a36Sopenharmony_ci struct ctl_table_header *tmp_head; 121562306a36Sopenharmony_ci struct ctl_table *entry, *link; 121662306a36Sopenharmony_ci 121762306a36Sopenharmony_ci if (header->ctl_table_size == 0 || 121862306a36Sopenharmony_ci sysctl_is_perm_empty_ctl_table(header->ctl_table)) 121962306a36Sopenharmony_ci return true; 122062306a36Sopenharmony_ci 122162306a36Sopenharmony_ci /* Are there links available for every entry in table? */ 122262306a36Sopenharmony_ci list_for_each_table_entry(entry, header) { 122362306a36Sopenharmony_ci const char *procname = entry->procname; 122462306a36Sopenharmony_ci link = find_entry(&tmp_head, dir, procname, strlen(procname)); 122562306a36Sopenharmony_ci if (!link) 122662306a36Sopenharmony_ci return false; 122762306a36Sopenharmony_ci if (S_ISDIR(link->mode) && S_ISDIR(entry->mode)) 122862306a36Sopenharmony_ci continue; 122962306a36Sopenharmony_ci if (S_ISLNK(link->mode) && (link->data == link_root)) 123062306a36Sopenharmony_ci continue; 123162306a36Sopenharmony_ci return false; 123262306a36Sopenharmony_ci } 123362306a36Sopenharmony_ci 123462306a36Sopenharmony_ci /* The checks passed. Increase the registration count on the links */ 123562306a36Sopenharmony_ci list_for_each_table_entry(entry, header) { 123662306a36Sopenharmony_ci const char *procname = entry->procname; 123762306a36Sopenharmony_ci link = find_entry(&tmp_head, dir, procname, strlen(procname)); 123862306a36Sopenharmony_ci tmp_head->nreg++; 123962306a36Sopenharmony_ci } 124062306a36Sopenharmony_ci return true; 124162306a36Sopenharmony_ci} 124262306a36Sopenharmony_ci 124362306a36Sopenharmony_cistatic int insert_links(struct ctl_table_header *head) 124462306a36Sopenharmony_ci{ 124562306a36Sopenharmony_ci struct ctl_table_set *root_set = &sysctl_table_root.default_set; 124662306a36Sopenharmony_ci struct ctl_dir *core_parent; 124762306a36Sopenharmony_ci struct ctl_table_header *links; 124862306a36Sopenharmony_ci int err; 124962306a36Sopenharmony_ci 125062306a36Sopenharmony_ci if (head->set == root_set) 125162306a36Sopenharmony_ci return 0; 125262306a36Sopenharmony_ci 125362306a36Sopenharmony_ci core_parent = xlate_dir(root_set, head->parent); 125462306a36Sopenharmony_ci if (IS_ERR(core_parent)) 125562306a36Sopenharmony_ci return 0; 125662306a36Sopenharmony_ci 125762306a36Sopenharmony_ci if (get_links(core_parent, head, head->root)) 125862306a36Sopenharmony_ci return 0; 125962306a36Sopenharmony_ci 126062306a36Sopenharmony_ci core_parent->header.nreg++; 126162306a36Sopenharmony_ci spin_unlock(&sysctl_lock); 126262306a36Sopenharmony_ci 126362306a36Sopenharmony_ci links = new_links(core_parent, head); 126462306a36Sopenharmony_ci 126562306a36Sopenharmony_ci spin_lock(&sysctl_lock); 126662306a36Sopenharmony_ci err = -ENOMEM; 126762306a36Sopenharmony_ci if (!links) 126862306a36Sopenharmony_ci goto out; 126962306a36Sopenharmony_ci 127062306a36Sopenharmony_ci err = 0; 127162306a36Sopenharmony_ci if (get_links(core_parent, head, head->root)) { 127262306a36Sopenharmony_ci kfree(links); 127362306a36Sopenharmony_ci goto out; 127462306a36Sopenharmony_ci } 127562306a36Sopenharmony_ci 127662306a36Sopenharmony_ci err = insert_header(core_parent, links); 127762306a36Sopenharmony_ci if (err) 127862306a36Sopenharmony_ci kfree(links); 127962306a36Sopenharmony_ciout: 128062306a36Sopenharmony_ci drop_sysctl_table(&core_parent->header); 128162306a36Sopenharmony_ci return err; 128262306a36Sopenharmony_ci} 128362306a36Sopenharmony_ci 128462306a36Sopenharmony_ci/* Find the directory for the ctl_table. If one is not found create it. */ 128562306a36Sopenharmony_cistatic struct ctl_dir *sysctl_mkdir_p(struct ctl_dir *dir, const char *path) 128662306a36Sopenharmony_ci{ 128762306a36Sopenharmony_ci const char *name, *nextname; 128862306a36Sopenharmony_ci 128962306a36Sopenharmony_ci for (name = path; name; name = nextname) { 129062306a36Sopenharmony_ci int namelen; 129162306a36Sopenharmony_ci nextname = strchr(name, '/'); 129262306a36Sopenharmony_ci if (nextname) { 129362306a36Sopenharmony_ci namelen = nextname - name; 129462306a36Sopenharmony_ci nextname++; 129562306a36Sopenharmony_ci } else { 129662306a36Sopenharmony_ci namelen = strlen(name); 129762306a36Sopenharmony_ci } 129862306a36Sopenharmony_ci if (namelen == 0) 129962306a36Sopenharmony_ci continue; 130062306a36Sopenharmony_ci 130162306a36Sopenharmony_ci /* 130262306a36Sopenharmony_ci * namelen ensures if name is "foo/bar/yay" only foo is 130362306a36Sopenharmony_ci * registered first. We traverse as if using mkdir -p and 130462306a36Sopenharmony_ci * return a ctl_dir for the last directory entry. 130562306a36Sopenharmony_ci */ 130662306a36Sopenharmony_ci dir = get_subdir(dir, name, namelen); 130762306a36Sopenharmony_ci if (IS_ERR(dir)) 130862306a36Sopenharmony_ci break; 130962306a36Sopenharmony_ci } 131062306a36Sopenharmony_ci return dir; 131162306a36Sopenharmony_ci} 131262306a36Sopenharmony_ci 131362306a36Sopenharmony_ci/** 131462306a36Sopenharmony_ci * __register_sysctl_table - register a leaf sysctl table 131562306a36Sopenharmony_ci * @set: Sysctl tree to register on 131662306a36Sopenharmony_ci * @path: The path to the directory the sysctl table is in. 131762306a36Sopenharmony_ci * @table: the top-level table structure without any child. This table 131862306a36Sopenharmony_ci * should not be free'd after registration. So it should not be 131962306a36Sopenharmony_ci * used on stack. It can either be a global or dynamically allocated 132062306a36Sopenharmony_ci * by the caller and free'd later after sysctl unregistration. 132162306a36Sopenharmony_ci * @table_size : The number of elements in table 132262306a36Sopenharmony_ci * 132362306a36Sopenharmony_ci * Register a sysctl table hierarchy. @table should be a filled in ctl_table 132462306a36Sopenharmony_ci * array. A completely 0 filled entry terminates the table. 132562306a36Sopenharmony_ci * 132662306a36Sopenharmony_ci * The members of the &struct ctl_table structure are used as follows: 132762306a36Sopenharmony_ci * 132862306a36Sopenharmony_ci * procname - the name of the sysctl file under /proc/sys. Set to %NULL to not 132962306a36Sopenharmony_ci * enter a sysctl file 133062306a36Sopenharmony_ci * 133162306a36Sopenharmony_ci * data - a pointer to data for use by proc_handler 133262306a36Sopenharmony_ci * 133362306a36Sopenharmony_ci * maxlen - the maximum size in bytes of the data 133462306a36Sopenharmony_ci * 133562306a36Sopenharmony_ci * mode - the file permissions for the /proc/sys file 133662306a36Sopenharmony_ci * 133762306a36Sopenharmony_ci * child - must be %NULL. 133862306a36Sopenharmony_ci * 133962306a36Sopenharmony_ci * proc_handler - the text handler routine (described below) 134062306a36Sopenharmony_ci * 134162306a36Sopenharmony_ci * extra1, extra2 - extra pointers usable by the proc handler routines 134262306a36Sopenharmony_ci * XXX: we should eventually modify these to use long min / max [0] 134362306a36Sopenharmony_ci * [0] https://lkml.kernel.org/87zgpte9o4.fsf@email.froward.int.ebiederm.org 134462306a36Sopenharmony_ci * 134562306a36Sopenharmony_ci * Leaf nodes in the sysctl tree will be represented by a single file 134662306a36Sopenharmony_ci * under /proc; non-leaf nodes (where child is not NULL) are not allowed, 134762306a36Sopenharmony_ci * sysctl_check_table() verifies this. 134862306a36Sopenharmony_ci * 134962306a36Sopenharmony_ci * There must be a proc_handler routine for any terminal nodes. 135062306a36Sopenharmony_ci * Several default handlers are available to cover common cases - 135162306a36Sopenharmony_ci * 135262306a36Sopenharmony_ci * proc_dostring(), proc_dointvec(), proc_dointvec_jiffies(), 135362306a36Sopenharmony_ci * proc_dointvec_userhz_jiffies(), proc_dointvec_minmax(), 135462306a36Sopenharmony_ci * proc_doulongvec_ms_jiffies_minmax(), proc_doulongvec_minmax() 135562306a36Sopenharmony_ci * 135662306a36Sopenharmony_ci * It is the handler's job to read the input buffer from user memory 135762306a36Sopenharmony_ci * and process it. The handler should return 0 on success. 135862306a36Sopenharmony_ci * 135962306a36Sopenharmony_ci * This routine returns %NULL on a failure to register, and a pointer 136062306a36Sopenharmony_ci * to the table header on success. 136162306a36Sopenharmony_ci */ 136262306a36Sopenharmony_cistruct ctl_table_header *__register_sysctl_table( 136362306a36Sopenharmony_ci struct ctl_table_set *set, 136462306a36Sopenharmony_ci const char *path, struct ctl_table *table, size_t table_size) 136562306a36Sopenharmony_ci{ 136662306a36Sopenharmony_ci struct ctl_table_root *root = set->dir.header.root; 136762306a36Sopenharmony_ci struct ctl_table_header *header; 136862306a36Sopenharmony_ci struct ctl_dir *dir; 136962306a36Sopenharmony_ci struct ctl_node *node; 137062306a36Sopenharmony_ci 137162306a36Sopenharmony_ci header = kzalloc(sizeof(struct ctl_table_header) + 137262306a36Sopenharmony_ci sizeof(struct ctl_node)*table_size, GFP_KERNEL_ACCOUNT); 137362306a36Sopenharmony_ci if (!header) 137462306a36Sopenharmony_ci return NULL; 137562306a36Sopenharmony_ci 137662306a36Sopenharmony_ci node = (struct ctl_node *)(header + 1); 137762306a36Sopenharmony_ci init_header(header, root, set, node, table, table_size); 137862306a36Sopenharmony_ci if (sysctl_check_table(path, header)) 137962306a36Sopenharmony_ci goto fail; 138062306a36Sopenharmony_ci 138162306a36Sopenharmony_ci spin_lock(&sysctl_lock); 138262306a36Sopenharmony_ci dir = &set->dir; 138362306a36Sopenharmony_ci /* Reference moved down the directory tree get_subdir */ 138462306a36Sopenharmony_ci dir->header.nreg++; 138562306a36Sopenharmony_ci spin_unlock(&sysctl_lock); 138662306a36Sopenharmony_ci 138762306a36Sopenharmony_ci dir = sysctl_mkdir_p(dir, path); 138862306a36Sopenharmony_ci if (IS_ERR(dir)) 138962306a36Sopenharmony_ci goto fail; 139062306a36Sopenharmony_ci spin_lock(&sysctl_lock); 139162306a36Sopenharmony_ci if (insert_header(dir, header)) 139262306a36Sopenharmony_ci goto fail_put_dir_locked; 139362306a36Sopenharmony_ci 139462306a36Sopenharmony_ci drop_sysctl_table(&dir->header); 139562306a36Sopenharmony_ci spin_unlock(&sysctl_lock); 139662306a36Sopenharmony_ci 139762306a36Sopenharmony_ci return header; 139862306a36Sopenharmony_ci 139962306a36Sopenharmony_cifail_put_dir_locked: 140062306a36Sopenharmony_ci drop_sysctl_table(&dir->header); 140162306a36Sopenharmony_ci spin_unlock(&sysctl_lock); 140262306a36Sopenharmony_cifail: 140362306a36Sopenharmony_ci kfree(header); 140462306a36Sopenharmony_ci return NULL; 140562306a36Sopenharmony_ci} 140662306a36Sopenharmony_ci 140762306a36Sopenharmony_ci/** 140862306a36Sopenharmony_ci * register_sysctl_sz - register a sysctl table 140962306a36Sopenharmony_ci * @path: The path to the directory the sysctl table is in. If the path 141062306a36Sopenharmony_ci * doesn't exist we will create it for you. 141162306a36Sopenharmony_ci * @table: the table structure. The calller must ensure the life of the @table 141262306a36Sopenharmony_ci * will be kept during the lifetime use of the syctl. It must not be freed 141362306a36Sopenharmony_ci * until unregister_sysctl_table() is called with the given returned table 141462306a36Sopenharmony_ci * with this registration. If your code is non modular then you don't need 141562306a36Sopenharmony_ci * to call unregister_sysctl_table() and can instead use something like 141662306a36Sopenharmony_ci * register_sysctl_init() which does not care for the result of the syctl 141762306a36Sopenharmony_ci * registration. 141862306a36Sopenharmony_ci * @table_size: The number of elements in table. 141962306a36Sopenharmony_ci * 142062306a36Sopenharmony_ci * Register a sysctl table. @table should be a filled in ctl_table 142162306a36Sopenharmony_ci * array. A completely 0 filled entry terminates the table. 142262306a36Sopenharmony_ci * 142362306a36Sopenharmony_ci * See __register_sysctl_table for more details. 142462306a36Sopenharmony_ci */ 142562306a36Sopenharmony_cistruct ctl_table_header *register_sysctl_sz(const char *path, struct ctl_table *table, 142662306a36Sopenharmony_ci size_t table_size) 142762306a36Sopenharmony_ci{ 142862306a36Sopenharmony_ci return __register_sysctl_table(&sysctl_table_root.default_set, 142962306a36Sopenharmony_ci path, table, table_size); 143062306a36Sopenharmony_ci} 143162306a36Sopenharmony_ciEXPORT_SYMBOL(register_sysctl_sz); 143262306a36Sopenharmony_ci 143362306a36Sopenharmony_ci/** 143462306a36Sopenharmony_ci * __register_sysctl_init() - register sysctl table to path 143562306a36Sopenharmony_ci * @path: path name for sysctl base. If that path doesn't exist we will create 143662306a36Sopenharmony_ci * it for you. 143762306a36Sopenharmony_ci * @table: This is the sysctl table that needs to be registered to the path. 143862306a36Sopenharmony_ci * The caller must ensure the life of the @table will be kept during the 143962306a36Sopenharmony_ci * lifetime use of the sysctl. 144062306a36Sopenharmony_ci * @table_name: The name of sysctl table, only used for log printing when 144162306a36Sopenharmony_ci * registration fails 144262306a36Sopenharmony_ci * @table_size: The number of elements in table 144362306a36Sopenharmony_ci * 144462306a36Sopenharmony_ci * The sysctl interface is used by userspace to query or modify at runtime 144562306a36Sopenharmony_ci * a predefined value set on a variable. These variables however have default 144662306a36Sopenharmony_ci * values pre-set. Code which depends on these variables will always work even 144762306a36Sopenharmony_ci * if register_sysctl() fails. If register_sysctl() fails you'd just loose the 144862306a36Sopenharmony_ci * ability to query or modify the sysctls dynamically at run time. Chances of 144962306a36Sopenharmony_ci * register_sysctl() failing on init are extremely low, and so for both reasons 145062306a36Sopenharmony_ci * this function does not return any error as it is used by initialization code. 145162306a36Sopenharmony_ci * 145262306a36Sopenharmony_ci * Context: if your base directory does not exist it will be created for you. 145362306a36Sopenharmony_ci */ 145462306a36Sopenharmony_civoid __init __register_sysctl_init(const char *path, struct ctl_table *table, 145562306a36Sopenharmony_ci const char *table_name, size_t table_size) 145662306a36Sopenharmony_ci{ 145762306a36Sopenharmony_ci struct ctl_table_header *hdr = register_sysctl_sz(path, table, table_size); 145862306a36Sopenharmony_ci 145962306a36Sopenharmony_ci if (unlikely(!hdr)) { 146062306a36Sopenharmony_ci pr_err("failed when register_sysctl_sz %s to %s\n", table_name, path); 146162306a36Sopenharmony_ci return; 146262306a36Sopenharmony_ci } 146362306a36Sopenharmony_ci kmemleak_not_leak(hdr); 146462306a36Sopenharmony_ci} 146562306a36Sopenharmony_ci 146662306a36Sopenharmony_cistatic void put_links(struct ctl_table_header *header) 146762306a36Sopenharmony_ci{ 146862306a36Sopenharmony_ci struct ctl_table_set *root_set = &sysctl_table_root.default_set; 146962306a36Sopenharmony_ci struct ctl_table_root *root = header->root; 147062306a36Sopenharmony_ci struct ctl_dir *parent = header->parent; 147162306a36Sopenharmony_ci struct ctl_dir *core_parent; 147262306a36Sopenharmony_ci struct ctl_table *entry; 147362306a36Sopenharmony_ci 147462306a36Sopenharmony_ci if (header->set == root_set) 147562306a36Sopenharmony_ci return; 147662306a36Sopenharmony_ci 147762306a36Sopenharmony_ci core_parent = xlate_dir(root_set, parent); 147862306a36Sopenharmony_ci if (IS_ERR(core_parent)) 147962306a36Sopenharmony_ci return; 148062306a36Sopenharmony_ci 148162306a36Sopenharmony_ci list_for_each_table_entry(entry, header) { 148262306a36Sopenharmony_ci struct ctl_table_header *link_head; 148362306a36Sopenharmony_ci struct ctl_table *link; 148462306a36Sopenharmony_ci const char *name = entry->procname; 148562306a36Sopenharmony_ci 148662306a36Sopenharmony_ci link = find_entry(&link_head, core_parent, name, strlen(name)); 148762306a36Sopenharmony_ci if (link && 148862306a36Sopenharmony_ci ((S_ISDIR(link->mode) && S_ISDIR(entry->mode)) || 148962306a36Sopenharmony_ci (S_ISLNK(link->mode) && (link->data == root)))) { 149062306a36Sopenharmony_ci drop_sysctl_table(link_head); 149162306a36Sopenharmony_ci } 149262306a36Sopenharmony_ci else { 149362306a36Sopenharmony_ci pr_err("sysctl link missing during unregister: "); 149462306a36Sopenharmony_ci sysctl_print_dir(parent); 149562306a36Sopenharmony_ci pr_cont("%s\n", name); 149662306a36Sopenharmony_ci } 149762306a36Sopenharmony_ci } 149862306a36Sopenharmony_ci} 149962306a36Sopenharmony_ci 150062306a36Sopenharmony_cistatic void drop_sysctl_table(struct ctl_table_header *header) 150162306a36Sopenharmony_ci{ 150262306a36Sopenharmony_ci struct ctl_dir *parent = header->parent; 150362306a36Sopenharmony_ci 150462306a36Sopenharmony_ci if (--header->nreg) 150562306a36Sopenharmony_ci return; 150662306a36Sopenharmony_ci 150762306a36Sopenharmony_ci if (parent) { 150862306a36Sopenharmony_ci put_links(header); 150962306a36Sopenharmony_ci start_unregistering(header); 151062306a36Sopenharmony_ci } 151162306a36Sopenharmony_ci 151262306a36Sopenharmony_ci if (!--header->count) 151362306a36Sopenharmony_ci kfree_rcu(header, rcu); 151462306a36Sopenharmony_ci 151562306a36Sopenharmony_ci if (parent) 151662306a36Sopenharmony_ci drop_sysctl_table(&parent->header); 151762306a36Sopenharmony_ci} 151862306a36Sopenharmony_ci 151962306a36Sopenharmony_ci/** 152062306a36Sopenharmony_ci * unregister_sysctl_table - unregister a sysctl table hierarchy 152162306a36Sopenharmony_ci * @header: the header returned from register_sysctl or __register_sysctl_table 152262306a36Sopenharmony_ci * 152362306a36Sopenharmony_ci * Unregisters the sysctl table and all children. proc entries may not 152462306a36Sopenharmony_ci * actually be removed until they are no longer used by anyone. 152562306a36Sopenharmony_ci */ 152662306a36Sopenharmony_civoid unregister_sysctl_table(struct ctl_table_header * header) 152762306a36Sopenharmony_ci{ 152862306a36Sopenharmony_ci might_sleep(); 152962306a36Sopenharmony_ci 153062306a36Sopenharmony_ci if (header == NULL) 153162306a36Sopenharmony_ci return; 153262306a36Sopenharmony_ci 153362306a36Sopenharmony_ci spin_lock(&sysctl_lock); 153462306a36Sopenharmony_ci drop_sysctl_table(header); 153562306a36Sopenharmony_ci spin_unlock(&sysctl_lock); 153662306a36Sopenharmony_ci} 153762306a36Sopenharmony_ciEXPORT_SYMBOL(unregister_sysctl_table); 153862306a36Sopenharmony_ci 153962306a36Sopenharmony_civoid setup_sysctl_set(struct ctl_table_set *set, 154062306a36Sopenharmony_ci struct ctl_table_root *root, 154162306a36Sopenharmony_ci int (*is_seen)(struct ctl_table_set *)) 154262306a36Sopenharmony_ci{ 154362306a36Sopenharmony_ci memset(set, 0, sizeof(*set)); 154462306a36Sopenharmony_ci set->is_seen = is_seen; 154562306a36Sopenharmony_ci init_header(&set->dir.header, root, set, NULL, root_table, 1); 154662306a36Sopenharmony_ci} 154762306a36Sopenharmony_ci 154862306a36Sopenharmony_civoid retire_sysctl_set(struct ctl_table_set *set) 154962306a36Sopenharmony_ci{ 155062306a36Sopenharmony_ci WARN_ON(!RB_EMPTY_ROOT(&set->dir.root)); 155162306a36Sopenharmony_ci} 155262306a36Sopenharmony_ci 155362306a36Sopenharmony_ciint __init proc_sys_init(void) 155462306a36Sopenharmony_ci{ 155562306a36Sopenharmony_ci struct proc_dir_entry *proc_sys_root; 155662306a36Sopenharmony_ci 155762306a36Sopenharmony_ci proc_sys_root = proc_mkdir("sys", NULL); 155862306a36Sopenharmony_ci proc_sys_root->proc_iops = &proc_sys_dir_operations; 155962306a36Sopenharmony_ci proc_sys_root->proc_dir_ops = &proc_sys_dir_file_operations; 156062306a36Sopenharmony_ci proc_sys_root->nlink = 0; 156162306a36Sopenharmony_ci 156262306a36Sopenharmony_ci return sysctl_init_bases(); 156362306a36Sopenharmony_ci} 156462306a36Sopenharmony_ci 156562306a36Sopenharmony_cistruct sysctl_alias { 156662306a36Sopenharmony_ci const char *kernel_param; 156762306a36Sopenharmony_ci const char *sysctl_param; 156862306a36Sopenharmony_ci}; 156962306a36Sopenharmony_ci 157062306a36Sopenharmony_ci/* 157162306a36Sopenharmony_ci * Historically some settings had both sysctl and a command line parameter. 157262306a36Sopenharmony_ci * With the generic sysctl. parameter support, we can handle them at a single 157362306a36Sopenharmony_ci * place and only keep the historical name for compatibility. This is not meant 157462306a36Sopenharmony_ci * to add brand new aliases. When adding existing aliases, consider whether 157562306a36Sopenharmony_ci * the possibly different moment of changing the value (e.g. from early_param 157662306a36Sopenharmony_ci * to the moment do_sysctl_args() is called) is an issue for the specific 157762306a36Sopenharmony_ci * parameter. 157862306a36Sopenharmony_ci */ 157962306a36Sopenharmony_cistatic const struct sysctl_alias sysctl_aliases[] = { 158062306a36Sopenharmony_ci {"hardlockup_all_cpu_backtrace", "kernel.hardlockup_all_cpu_backtrace" }, 158162306a36Sopenharmony_ci {"hung_task_panic", "kernel.hung_task_panic" }, 158262306a36Sopenharmony_ci {"numa_zonelist_order", "vm.numa_zonelist_order" }, 158362306a36Sopenharmony_ci {"softlockup_all_cpu_backtrace", "kernel.softlockup_all_cpu_backtrace" }, 158462306a36Sopenharmony_ci { } 158562306a36Sopenharmony_ci}; 158662306a36Sopenharmony_ci 158762306a36Sopenharmony_cistatic const char *sysctl_find_alias(char *param) 158862306a36Sopenharmony_ci{ 158962306a36Sopenharmony_ci const struct sysctl_alias *alias; 159062306a36Sopenharmony_ci 159162306a36Sopenharmony_ci for (alias = &sysctl_aliases[0]; alias->kernel_param != NULL; alias++) { 159262306a36Sopenharmony_ci if (strcmp(alias->kernel_param, param) == 0) 159362306a36Sopenharmony_ci return alias->sysctl_param; 159462306a36Sopenharmony_ci } 159562306a36Sopenharmony_ci 159662306a36Sopenharmony_ci return NULL; 159762306a36Sopenharmony_ci} 159862306a36Sopenharmony_ci 159962306a36Sopenharmony_cibool sysctl_is_alias(char *param) 160062306a36Sopenharmony_ci{ 160162306a36Sopenharmony_ci const char *alias = sysctl_find_alias(param); 160262306a36Sopenharmony_ci 160362306a36Sopenharmony_ci return alias != NULL; 160462306a36Sopenharmony_ci} 160562306a36Sopenharmony_ci 160662306a36Sopenharmony_ci/* Set sysctl value passed on kernel command line. */ 160762306a36Sopenharmony_cistatic int process_sysctl_arg(char *param, char *val, 160862306a36Sopenharmony_ci const char *unused, void *arg) 160962306a36Sopenharmony_ci{ 161062306a36Sopenharmony_ci char *path; 161162306a36Sopenharmony_ci struct vfsmount **proc_mnt = arg; 161262306a36Sopenharmony_ci struct file_system_type *proc_fs_type; 161362306a36Sopenharmony_ci struct file *file; 161462306a36Sopenharmony_ci int len; 161562306a36Sopenharmony_ci int err; 161662306a36Sopenharmony_ci loff_t pos = 0; 161762306a36Sopenharmony_ci ssize_t wret; 161862306a36Sopenharmony_ci 161962306a36Sopenharmony_ci if (strncmp(param, "sysctl", sizeof("sysctl") - 1) == 0) { 162062306a36Sopenharmony_ci param += sizeof("sysctl") - 1; 162162306a36Sopenharmony_ci 162262306a36Sopenharmony_ci if (param[0] != '/' && param[0] != '.') 162362306a36Sopenharmony_ci return 0; 162462306a36Sopenharmony_ci 162562306a36Sopenharmony_ci param++; 162662306a36Sopenharmony_ci } else { 162762306a36Sopenharmony_ci param = (char *) sysctl_find_alias(param); 162862306a36Sopenharmony_ci if (!param) 162962306a36Sopenharmony_ci return 0; 163062306a36Sopenharmony_ci } 163162306a36Sopenharmony_ci 163262306a36Sopenharmony_ci if (!val) 163362306a36Sopenharmony_ci return -EINVAL; 163462306a36Sopenharmony_ci len = strlen(val); 163562306a36Sopenharmony_ci if (len == 0) 163662306a36Sopenharmony_ci return -EINVAL; 163762306a36Sopenharmony_ci 163862306a36Sopenharmony_ci /* 163962306a36Sopenharmony_ci * To set sysctl options, we use a temporary mount of proc, look up the 164062306a36Sopenharmony_ci * respective sys/ file and write to it. To avoid mounting it when no 164162306a36Sopenharmony_ci * options were given, we mount it only when the first sysctl option is 164262306a36Sopenharmony_ci * found. Why not a persistent mount? There are problems with a 164362306a36Sopenharmony_ci * persistent mount of proc in that it forces userspace not to use any 164462306a36Sopenharmony_ci * proc mount options. 164562306a36Sopenharmony_ci */ 164662306a36Sopenharmony_ci if (!*proc_mnt) { 164762306a36Sopenharmony_ci proc_fs_type = get_fs_type("proc"); 164862306a36Sopenharmony_ci if (!proc_fs_type) { 164962306a36Sopenharmony_ci pr_err("Failed to find procfs to set sysctl from command line\n"); 165062306a36Sopenharmony_ci return 0; 165162306a36Sopenharmony_ci } 165262306a36Sopenharmony_ci *proc_mnt = kern_mount(proc_fs_type); 165362306a36Sopenharmony_ci put_filesystem(proc_fs_type); 165462306a36Sopenharmony_ci if (IS_ERR(*proc_mnt)) { 165562306a36Sopenharmony_ci pr_err("Failed to mount procfs to set sysctl from command line\n"); 165662306a36Sopenharmony_ci return 0; 165762306a36Sopenharmony_ci } 165862306a36Sopenharmony_ci } 165962306a36Sopenharmony_ci 166062306a36Sopenharmony_ci path = kasprintf(GFP_KERNEL, "sys/%s", param); 166162306a36Sopenharmony_ci if (!path) 166262306a36Sopenharmony_ci panic("%s: Failed to allocate path for %s\n", __func__, param); 166362306a36Sopenharmony_ci strreplace(path, '.', '/'); 166462306a36Sopenharmony_ci 166562306a36Sopenharmony_ci file = file_open_root_mnt(*proc_mnt, path, O_WRONLY, 0); 166662306a36Sopenharmony_ci if (IS_ERR(file)) { 166762306a36Sopenharmony_ci err = PTR_ERR(file); 166862306a36Sopenharmony_ci if (err == -ENOENT) 166962306a36Sopenharmony_ci pr_err("Failed to set sysctl parameter '%s=%s': parameter not found\n", 167062306a36Sopenharmony_ci param, val); 167162306a36Sopenharmony_ci else if (err == -EACCES) 167262306a36Sopenharmony_ci pr_err("Failed to set sysctl parameter '%s=%s': permission denied (read-only?)\n", 167362306a36Sopenharmony_ci param, val); 167462306a36Sopenharmony_ci else 167562306a36Sopenharmony_ci pr_err("Error %pe opening proc file to set sysctl parameter '%s=%s'\n", 167662306a36Sopenharmony_ci file, param, val); 167762306a36Sopenharmony_ci goto out; 167862306a36Sopenharmony_ci } 167962306a36Sopenharmony_ci wret = kernel_write(file, val, len, &pos); 168062306a36Sopenharmony_ci if (wret < 0) { 168162306a36Sopenharmony_ci err = wret; 168262306a36Sopenharmony_ci if (err == -EINVAL) 168362306a36Sopenharmony_ci pr_err("Failed to set sysctl parameter '%s=%s': invalid value\n", 168462306a36Sopenharmony_ci param, val); 168562306a36Sopenharmony_ci else 168662306a36Sopenharmony_ci pr_err("Error %pe writing to proc file to set sysctl parameter '%s=%s'\n", 168762306a36Sopenharmony_ci ERR_PTR(err), param, val); 168862306a36Sopenharmony_ci } else if (wret != len) { 168962306a36Sopenharmony_ci pr_err("Wrote only %zd bytes of %d writing to proc file %s to set sysctl parameter '%s=%s\n", 169062306a36Sopenharmony_ci wret, len, path, param, val); 169162306a36Sopenharmony_ci } 169262306a36Sopenharmony_ci 169362306a36Sopenharmony_ci err = filp_close(file, NULL); 169462306a36Sopenharmony_ci if (err) 169562306a36Sopenharmony_ci pr_err("Error %pe closing proc file to set sysctl parameter '%s=%s\n", 169662306a36Sopenharmony_ci ERR_PTR(err), param, val); 169762306a36Sopenharmony_ciout: 169862306a36Sopenharmony_ci kfree(path); 169962306a36Sopenharmony_ci return 0; 170062306a36Sopenharmony_ci} 170162306a36Sopenharmony_ci 170262306a36Sopenharmony_civoid do_sysctl_args(void) 170362306a36Sopenharmony_ci{ 170462306a36Sopenharmony_ci char *command_line; 170562306a36Sopenharmony_ci struct vfsmount *proc_mnt = NULL; 170662306a36Sopenharmony_ci 170762306a36Sopenharmony_ci command_line = kstrdup(saved_command_line, GFP_KERNEL); 170862306a36Sopenharmony_ci if (!command_line) 170962306a36Sopenharmony_ci panic("%s: Failed to allocate copy of command line\n", __func__); 171062306a36Sopenharmony_ci 171162306a36Sopenharmony_ci parse_args("Setting sysctl args", command_line, 171262306a36Sopenharmony_ci NULL, 0, -1, -1, &proc_mnt, process_sysctl_arg); 171362306a36Sopenharmony_ci 171462306a36Sopenharmony_ci if (proc_mnt) 171562306a36Sopenharmony_ci kern_unmount(proc_mnt); 171662306a36Sopenharmony_ci 171762306a36Sopenharmony_ci kfree(command_line); 171862306a36Sopenharmony_ci} 1719