ipc_sysctl.c 8.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334
  1. // SPDX-License-Identifier: GPL-2.0-only
  2. /*
  3. * Copyright (C) 2007
  4. *
  5. * Author: Eric Biederman <ebiederm@xmision.com>
  6. */
  7. #include <linux/module.h>
  8. #include <linux/ipc.h>
  9. #include <linux/nsproxy.h>
  10. #include <linux/sysctl.h>
  11. #include <linux/uaccess.h>
  12. #include <linux/capability.h>
  13. #include <linux/ipc_namespace.h>
  14. #include <linux/msg.h>
  15. #include <linux/slab.h>
  16. #include <linux/cred.h>
  17. #include "util.h"
  18. static int proc_ipc_dointvec_minmax_orphans(const struct ctl_table *table, int write,
  19. void *buffer, size_t *lenp, loff_t *ppos)
  20. {
  21. struct ipc_namespace *ns =
  22. container_of(table->data, struct ipc_namespace, shm_rmid_forced);
  23. int err;
  24. err = proc_dointvec_minmax(table, write, buffer, lenp, ppos);
  25. if (err < 0)
  26. return err;
  27. if (ns->shm_rmid_forced)
  28. shm_destroy_orphaned(ns);
  29. return err;
  30. }
  31. static int proc_ipc_auto_msgmni(const struct ctl_table *table, int write,
  32. void *buffer, size_t *lenp, loff_t *ppos)
  33. {
  34. struct ctl_table ipc_table;
  35. int dummy = 0;
  36. memcpy(&ipc_table, table, sizeof(ipc_table));
  37. ipc_table.data = &dummy;
  38. if (write)
  39. pr_info_once("writing to auto_msgmni has no effect");
  40. return proc_dointvec_minmax(&ipc_table, write, buffer, lenp, ppos);
  41. }
  42. static int proc_ipc_sem_dointvec(const struct ctl_table *table, int write,
  43. void *buffer, size_t *lenp, loff_t *ppos)
  44. {
  45. struct ipc_namespace *ns =
  46. container_of(table->data, struct ipc_namespace, sem_ctls);
  47. int ret, semmni;
  48. semmni = ns->sem_ctls[3];
  49. ret = proc_dointvec(table, write, buffer, lenp, ppos);
  50. if (!ret)
  51. ret = sem_check_semmni(ns);
  52. /*
  53. * Reset the semmni value if an error happens.
  54. */
  55. if (ret)
  56. ns->sem_ctls[3] = semmni;
  57. return ret;
  58. }
  59. int ipc_mni = IPCMNI;
  60. int ipc_mni_shift = IPCMNI_SHIFT;
  61. int ipc_min_cycle = RADIX_TREE_MAP_SIZE;
  62. static struct ctl_table ipc_sysctls[] = {
  63. {
  64. .procname = "shmmax",
  65. .data = &init_ipc_ns.shm_ctlmax,
  66. .maxlen = sizeof(init_ipc_ns.shm_ctlmax),
  67. .mode = 0644,
  68. .proc_handler = proc_doulongvec_minmax,
  69. },
  70. {
  71. .procname = "shmall",
  72. .data = &init_ipc_ns.shm_ctlall,
  73. .maxlen = sizeof(init_ipc_ns.shm_ctlall),
  74. .mode = 0644,
  75. .proc_handler = proc_doulongvec_minmax,
  76. },
  77. {
  78. .procname = "shmmni",
  79. .data = &init_ipc_ns.shm_ctlmni,
  80. .maxlen = sizeof(init_ipc_ns.shm_ctlmni),
  81. .mode = 0644,
  82. .proc_handler = proc_dointvec_minmax,
  83. .extra1 = SYSCTL_ZERO,
  84. .extra2 = &ipc_mni,
  85. },
  86. {
  87. .procname = "shm_rmid_forced",
  88. .data = &init_ipc_ns.shm_rmid_forced,
  89. .maxlen = sizeof(init_ipc_ns.shm_rmid_forced),
  90. .mode = 0644,
  91. .proc_handler = proc_ipc_dointvec_minmax_orphans,
  92. .extra1 = SYSCTL_ZERO,
  93. .extra2 = SYSCTL_ONE,
  94. },
  95. {
  96. .procname = "msgmax",
  97. .data = &init_ipc_ns.msg_ctlmax,
  98. .maxlen = sizeof(init_ipc_ns.msg_ctlmax),
  99. .mode = 0644,
  100. .proc_handler = proc_dointvec_minmax,
  101. .extra1 = SYSCTL_ZERO,
  102. .extra2 = SYSCTL_INT_MAX,
  103. },
  104. {
  105. .procname = "msgmni",
  106. .data = &init_ipc_ns.msg_ctlmni,
  107. .maxlen = sizeof(init_ipc_ns.msg_ctlmni),
  108. .mode = 0644,
  109. .proc_handler = proc_dointvec_minmax,
  110. .extra1 = SYSCTL_ZERO,
  111. .extra2 = &ipc_mni,
  112. },
  113. {
  114. .procname = "auto_msgmni",
  115. .data = NULL,
  116. .maxlen = sizeof(int),
  117. .mode = 0644,
  118. .proc_handler = proc_ipc_auto_msgmni,
  119. .extra1 = SYSCTL_ZERO,
  120. .extra2 = SYSCTL_ONE,
  121. },
  122. {
  123. .procname = "msgmnb",
  124. .data = &init_ipc_ns.msg_ctlmnb,
  125. .maxlen = sizeof(init_ipc_ns.msg_ctlmnb),
  126. .mode = 0644,
  127. .proc_handler = proc_dointvec_minmax,
  128. .extra1 = SYSCTL_ZERO,
  129. .extra2 = SYSCTL_INT_MAX,
  130. },
  131. {
  132. .procname = "sem",
  133. .data = &init_ipc_ns.sem_ctls,
  134. .maxlen = 4*sizeof(int),
  135. .mode = 0644,
  136. .proc_handler = proc_ipc_sem_dointvec,
  137. },
  138. #ifdef CONFIG_CHECKPOINT_RESTORE
  139. {
  140. .procname = "sem_next_id",
  141. .data = &init_ipc_ns.ids[IPC_SEM_IDS].next_id,
  142. .maxlen = sizeof(init_ipc_ns.ids[IPC_SEM_IDS].next_id),
  143. .mode = 0444,
  144. .proc_handler = proc_dointvec_minmax,
  145. .extra1 = SYSCTL_ZERO,
  146. .extra2 = SYSCTL_INT_MAX,
  147. },
  148. {
  149. .procname = "msg_next_id",
  150. .data = &init_ipc_ns.ids[IPC_MSG_IDS].next_id,
  151. .maxlen = sizeof(init_ipc_ns.ids[IPC_MSG_IDS].next_id),
  152. .mode = 0444,
  153. .proc_handler = proc_dointvec_minmax,
  154. .extra1 = SYSCTL_ZERO,
  155. .extra2 = SYSCTL_INT_MAX,
  156. },
  157. {
  158. .procname = "shm_next_id",
  159. .data = &init_ipc_ns.ids[IPC_SHM_IDS].next_id,
  160. .maxlen = sizeof(init_ipc_ns.ids[IPC_SHM_IDS].next_id),
  161. .mode = 0444,
  162. .proc_handler = proc_dointvec_minmax,
  163. .extra1 = SYSCTL_ZERO,
  164. .extra2 = SYSCTL_INT_MAX,
  165. },
  166. #endif
  167. };
  168. static struct ctl_table_set *set_lookup(struct ctl_table_root *root)
  169. {
  170. return &current->nsproxy->ipc_ns->ipc_set;
  171. }
  172. static int set_is_seen(struct ctl_table_set *set)
  173. {
  174. return &current->nsproxy->ipc_ns->ipc_set == set;
  175. }
  176. static void ipc_set_ownership(struct ctl_table_header *head,
  177. kuid_t *uid, kgid_t *gid)
  178. {
  179. struct ipc_namespace *ns =
  180. container_of(head->set, struct ipc_namespace, ipc_set);
  181. kuid_t ns_root_uid = make_kuid(ns->user_ns, 0);
  182. kgid_t ns_root_gid = make_kgid(ns->user_ns, 0);
  183. *uid = uid_valid(ns_root_uid) ? ns_root_uid : GLOBAL_ROOT_UID;
  184. *gid = gid_valid(ns_root_gid) ? ns_root_gid : GLOBAL_ROOT_GID;
  185. }
  186. static int ipc_permissions(struct ctl_table_header *head, const struct ctl_table *table)
  187. {
  188. int mode = table->mode;
  189. #ifdef CONFIG_CHECKPOINT_RESTORE
  190. struct ipc_namespace *ns =
  191. container_of(head->set, struct ipc_namespace, ipc_set);
  192. if (((table->data == &ns->ids[IPC_SEM_IDS].next_id) ||
  193. (table->data == &ns->ids[IPC_MSG_IDS].next_id) ||
  194. (table->data == &ns->ids[IPC_SHM_IDS].next_id)) &&
  195. checkpoint_restore_ns_capable(ns->user_ns))
  196. mode = 0666;
  197. else
  198. #endif
  199. {
  200. kuid_t ns_root_uid;
  201. kgid_t ns_root_gid;
  202. ipc_set_ownership(head, &ns_root_uid, &ns_root_gid);
  203. if (uid_eq(current_euid(), ns_root_uid))
  204. mode >>= 6;
  205. else if (in_egroup_p(ns_root_gid))
  206. mode >>= 3;
  207. }
  208. mode &= 7;
  209. return (mode << 6) | (mode << 3) | mode;
  210. }
  211. static struct ctl_table_root set_root = {
  212. .lookup = set_lookup,
  213. .permissions = ipc_permissions,
  214. .set_ownership = ipc_set_ownership,
  215. };
  216. bool setup_ipc_sysctls(struct ipc_namespace *ns)
  217. {
  218. struct ctl_table *tbl;
  219. setup_sysctl_set(&ns->ipc_set, &set_root, set_is_seen);
  220. tbl = kmemdup(ipc_sysctls, sizeof(ipc_sysctls), GFP_KERNEL);
  221. if (tbl) {
  222. int i;
  223. for (i = 0; i < ARRAY_SIZE(ipc_sysctls); i++) {
  224. if (tbl[i].data == &init_ipc_ns.shm_ctlmax)
  225. tbl[i].data = &ns->shm_ctlmax;
  226. else if (tbl[i].data == &init_ipc_ns.shm_ctlall)
  227. tbl[i].data = &ns->shm_ctlall;
  228. else if (tbl[i].data == &init_ipc_ns.shm_ctlmni)
  229. tbl[i].data = &ns->shm_ctlmni;
  230. else if (tbl[i].data == &init_ipc_ns.shm_rmid_forced)
  231. tbl[i].data = &ns->shm_rmid_forced;
  232. else if (tbl[i].data == &init_ipc_ns.msg_ctlmax)
  233. tbl[i].data = &ns->msg_ctlmax;
  234. else if (tbl[i].data == &init_ipc_ns.msg_ctlmni)
  235. tbl[i].data = &ns->msg_ctlmni;
  236. else if (tbl[i].data == &init_ipc_ns.msg_ctlmnb)
  237. tbl[i].data = &ns->msg_ctlmnb;
  238. else if (tbl[i].data == &init_ipc_ns.sem_ctls)
  239. tbl[i].data = &ns->sem_ctls;
  240. #ifdef CONFIG_CHECKPOINT_RESTORE
  241. else if (tbl[i].data == &init_ipc_ns.ids[IPC_SEM_IDS].next_id)
  242. tbl[i].data = &ns->ids[IPC_SEM_IDS].next_id;
  243. else if (tbl[i].data == &init_ipc_ns.ids[IPC_MSG_IDS].next_id)
  244. tbl[i].data = &ns->ids[IPC_MSG_IDS].next_id;
  245. else if (tbl[i].data == &init_ipc_ns.ids[IPC_SHM_IDS].next_id)
  246. tbl[i].data = &ns->ids[IPC_SHM_IDS].next_id;
  247. #endif
  248. else
  249. tbl[i].data = NULL;
  250. }
  251. ns->ipc_sysctls = __register_sysctl_table(&ns->ipc_set, "kernel", tbl,
  252. ARRAY_SIZE(ipc_sysctls));
  253. }
  254. if (!ns->ipc_sysctls) {
  255. kfree(tbl);
  256. retire_sysctl_set(&ns->ipc_set);
  257. return false;
  258. }
  259. return true;
  260. }
  261. void retire_ipc_sysctls(struct ipc_namespace *ns)
  262. {
  263. const struct ctl_table *tbl;
  264. tbl = ns->ipc_sysctls->ctl_table_arg;
  265. unregister_sysctl_table(ns->ipc_sysctls);
  266. retire_sysctl_set(&ns->ipc_set);
  267. kfree(tbl);
  268. }
  269. static int __init ipc_sysctl_init(void)
  270. {
  271. if (!setup_ipc_sysctls(&init_ipc_ns)) {
  272. pr_warn("ipc sysctl registration failed\n");
  273. return -ENOMEM;
  274. }
  275. return 0;
  276. }
  277. device_initcall(ipc_sysctl_init);
  278. static int __init ipc_mni_extend(char *str)
  279. {
  280. ipc_mni = IPCMNI_EXTEND;
  281. ipc_mni_shift = IPCMNI_EXTEND_SHIFT;
  282. ipc_min_cycle = IPCMNI_EXTEND_MIN_CYCLE;
  283. pr_info("IPCMNI extended to %d.\n", ipc_mni);
  284. return 0;
  285. }
  286. early_param("ipcmni_extend", ipc_mni_extend);