]>
Commit | Line | Data |
---|---|---|
b2441318 | 1 | // SPDX-License-Identifier: GPL-2.0 |
1da177e4 LT |
2 | /* |
3 | * linux/ipc/util.c | |
4 | * Copyright (C) 1992 Krishna Balasubramanian | |
5 | * | |
6 | * Sep 1997 - Call suser() last after "normal" permission checks so we | |
7 | * get BSD style process accounting right. | |
8 | * Occurs in several places in the IPC code. | |
9 | * Chris Evans, <[email protected]> | |
10 | * Nov 1999 - ipc helper functions, unified SMP locking | |
624dffcb | 11 | * Manfred Spraul <[email protected]> |
1da177e4 LT |
12 | * Oct 2002 - One lock per IPC id. RCU ipc_free for lock-free grow_ary(). |
13 | * Mingming Cao <[email protected]> | |
073115d6 SG |
14 | * Mar 2006 - support for audit of ipc object properties |
15 | * Dustin Kirkland <[email protected]> | |
73ea4130 KK |
16 | * Jun 2006 - namespaces support |
17 | * OpenVZ, SWsoft Inc. | |
18 | * Pavel Emelianov <[email protected]> | |
05603c44 DB |
19 | * |
20 | * General sysv ipc locking scheme: | |
18ccee26 DB |
21 | * rcu_read_lock() |
22 | * obtain the ipc object (kern_ipc_perm) by looking up the id in an idr | |
23 | * tree. | |
24 | * - perform initial checks (capabilities, auditing and permission, | |
25 | * etc). | |
87ad4b0d PM |
26 | * - perform read-only operations, such as INFO command, that |
27 | * do not demand atomicity | |
18ccee26 DB |
28 | * acquire the ipc lock (kern_ipc_perm.lock) through |
29 | * ipc_lock_object() | |
87ad4b0d PM |
30 | * - perform read-only operations that demand atomicity, |
31 | * such as STAT command. | |
18ccee26 DB |
32 | * - perform data updates, such as SET, RMID commands and |
33 | * mechanism-specific operations (semop/semtimedop, | |
34 | * msgsnd/msgrcv, shmat/shmdt). | |
35 | * drop the ipc lock, through ipc_unlock_object(). | |
36 | * rcu_read_unlock() | |
37 | * | |
38 | * The ids->rwsem must be taken when: | |
39 | * - creating, removing and iterating the existing entries in ipc | |
40 | * identifier sets. | |
41 | * - iterating through files under /proc/sysvipc/ | |
42 | * | |
43 | * Note that sems have a special fast path that avoids kern_ipc_perm.lock - | |
44 | * see sem_lock(). | |
1da177e4 LT |
45 | */ |
46 | ||
1da177e4 LT |
47 | #include <linux/mm.h> |
48 | #include <linux/shm.h> | |
49 | #include <linux/init.h> | |
50 | #include <linux/msg.h> | |
1da177e4 LT |
51 | #include <linux/vmalloc.h> |
52 | #include <linux/slab.h> | |
8f68fa2d | 53 | #include <linux/notifier.h> |
c59ede7b | 54 | #include <linux/capability.h> |
1da177e4 LT |
55 | #include <linux/highuid.h> |
56 | #include <linux/security.h> | |
57 | #include <linux/rcupdate.h> | |
58 | #include <linux/workqueue.h> | |
ae781774 MW |
59 | #include <linux/seq_file.h> |
60 | #include <linux/proc_fs.h> | |
073115d6 | 61 | #include <linux/audit.h> |
73ea4130 | 62 | #include <linux/nsproxy.h> |
3e148c79 | 63 | #include <linux/rwsem.h> |
b6b337ad | 64 | #include <linux/memory.h> |
ae5e1b22 | 65 | #include <linux/ipc_namespace.h> |
0eb71a9d | 66 | #include <linux/rhashtable.h> |
b869d5be | 67 | #include <linux/log2.h> |
1da177e4 LT |
68 | |
69 | #include <asm/unistd.h> | |
70 | ||
71 | #include "util.h" | |
72 | ||
/*
 * Description of one sysvipc proc file. An instance is allocated by
 * ipc_init_proc_interface() and attached to the proc entry as its data.
 */
struct ipc_proc_iface {
	const char *path;	/* name passed to proc_create_data() */
	const char *header;	/* banner printed at the beginning of the file */
	int ids;		/* index into ipc_namespace.ids[] */
	int (*show)(struct seq_file *, void *);	/* show routine */
};
79 | ||
1da177e4 | 80 | /** |
8001c858 | 81 | * ipc_init - initialise ipc subsystem |
1da177e4 | 82 | * |
8001c858 DB |
83 | * The various sysv ipc resources (semaphores, messages and shared |
84 | * memory) are initialised. | |
85 | * | |
86 | * A callback routine is registered into the memory hotplug notifier | |
87 | * chain: since msgmni scales to lowmem this callback routine will be | |
88 | * called upon successful memory add / remove to recompute msmgni. | |
1da177e4 | 89 | */ |
1da177e4 LT |
90 | static int __init ipc_init(void) |
91 | { | |
e74a0eff | 92 | proc_mkdir("sysvipc", NULL); |
eae04d25 DB |
93 | sem_init(); |
94 | msg_init(); | |
1da177e4 | 95 | shm_init(); |
0cfb6aee | 96 | |
eae04d25 | 97 | return 0; |
1da177e4 | 98 | } |
6d08a256 | 99 | device_initcall(ipc_init); |
1da177e4 | 100 | |
0cfb6aee GK |
101 | static const struct rhashtable_params ipc_kht_params = { |
102 | .head_offset = offsetof(struct kern_ipc_perm, khtnode), | |
103 | .key_offset = offsetof(struct kern_ipc_perm, key), | |
c593642c | 104 | .key_len = sizeof_field(struct kern_ipc_perm, key), |
0cfb6aee GK |
105 | .automatic_shrinking = true, |
106 | }; | |
107 | ||
1da177e4 | 108 | /** |
8001c858 DB |
109 | * ipc_init_ids - initialise ipc identifiers |
110 | * @ids: ipc identifier set | |
1da177e4 | 111 | * |
8001c858 | 112 | * Set up the sequence range to use for the ipc identifier range (limited |
5ac893b8 | 113 | * below ipc_mni) then initialise the keys hashtable and ids idr. |
1da177e4 | 114 | */ |
eae04d25 | 115 | void ipc_init_ids(struct ipc_ids *ids) |
1da177e4 | 116 | { |
1da177e4 | 117 | ids->in_use = 0; |
1da177e4 | 118 | ids->seq = 0; |
daf948c7 | 119 | init_rwsem(&ids->rwsem); |
eae04d25 | 120 | rhashtable_init(&ids->key_ht, &ipc_kht_params); |
7ca7e564 | 121 | idr_init(&ids->ipcs_idr); |
27c331a1 | 122 | ids->max_idx = -1; |
3278a2c2 | 123 | ids->last_idx = -1; |
b8fd9983 DB |
124 | #ifdef CONFIG_CHECKPOINT_RESTORE |
125 | ids->next_id = -1; | |
126 | #endif | |
1da177e4 LT |
127 | } |
128 | ||
ae781774 | 129 | #ifdef CONFIG_PROC_FS |
97a32539 | 130 | static const struct proc_ops sysvipc_proc_ops; |
ae781774 | 131 | /** |
8001c858 DB |
132 | * ipc_init_proc_interface - create a proc interface for sysipc types using a seq_file interface. |
133 | * @path: Path in procfs | |
134 | * @header: Banner to be printed at the beginning of the file. | |
135 | * @ids: ipc id table to iterate. | |
136 | * @show: show routine. | |
ae781774 MW |
137 | */ |
138 | void __init ipc_init_proc_interface(const char *path, const char *header, | |
73ea4130 | 139 | int ids, int (*show)(struct seq_file *, void *)) |
ae781774 MW |
140 | { |
141 | struct proc_dir_entry *pde; | |
142 | struct ipc_proc_iface *iface; | |
143 | ||
144 | iface = kmalloc(sizeof(*iface), GFP_KERNEL); | |
145 | if (!iface) | |
146 | return; | |
147 | iface->path = path; | |
148 | iface->header = header; | |
149 | iface->ids = ids; | |
150 | iface->show = show; | |
151 | ||
6a6375db DL |
152 | pde = proc_create_data(path, |
153 | S_IRUGO, /* world readable */ | |
154 | NULL, /* parent dir */ | |
97a32539 | 155 | &sysvipc_proc_ops, |
6a6375db | 156 | iface); |
3ab08fe2 | 157 | if (!pde) |
ae781774 | 158 | kfree(iface); |
ae781774 MW |
159 | } |
160 | #endif | |
161 | ||
1da177e4 | 162 | /** |
8001c858 DB |
163 | * ipc_findkey - find a key in an ipc identifier set |
164 | * @ids: ipc identifier set | |
165 | * @key: key to find | |
46c0a8ca | 166 | * |
8001c858 DB |
167 | * Returns the locked pointer to the ipc structure if found or NULL |
168 | * otherwise. If key is found ipc points to the owning ipc structure | |
169 | * | |
0cfb6aee | 170 | * Called with writer ipc_ids.rwsem held. |
1da177e4 | 171 | */ |
7748dbfa | 172 | static struct kern_ipc_perm *ipc_findkey(struct ipc_ids *ids, key_t key) |
1da177e4 | 173 | { |
dc2c8c84 | 174 | struct kern_ipc_perm *ipcp; |
7ca7e564 | 175 | |
dc2c8c84 | 176 | ipcp = rhashtable_lookup_fast(&ids->key_ht, &key, |
0cfb6aee | 177 | ipc_kht_params); |
dc2c8c84 DB |
178 | if (!ipcp) |
179 | return NULL; | |
7ca7e564 | 180 | |
dc2c8c84 DB |
181 | rcu_read_lock(); |
182 | ipc_lock_object(ipcp); | |
183 | return ipcp; | |
1da177e4 LT |
184 | } |
185 | ||
b8fd9983 | 186 | /* |
e2652ae6 MS |
187 | * Insert new IPC object into idr tree, and set sequence number and id |
188 | * in the correct order. | |
189 | * Especially: | |
190 | * - the sequence number must be set before inserting the object into the idr, | |
191 | * because the sequence number is accessed without a lock. | |
192 | * - the id can/must be set after inserting the object into the idr. | |
193 | * All accesses must be done after getting kern_ipc_perm.lock. | |
194 | * | |
195 | * The caller must own kern_ipc_perm.lock.of the new object. | |
196 | * On error, the function returns a (negative) error code. | |
3278a2c2 MS |
197 | * |
198 | * To conserve sequence number space, especially with extended ipc_mni, | |
199 | * the sequence number is incremented only when the returned ID is less than | |
200 | * the last one. | |
b8fd9983 | 201 | */ |
e2652ae6 | 202 | static inline int ipc_idr_alloc(struct ipc_ids *ids, struct kern_ipc_perm *new) |
b8fd9983 | 203 | { |
e2652ae6 MS |
204 | int idx, next_id = -1; |
205 | ||
206 | #ifdef CONFIG_CHECKPOINT_RESTORE | |
207 | next_id = ids->next_id; | |
208 | ids->next_id = -1; | |
209 | #endif | |
210 | ||
211 | /* | |
212 | * As soon as a new object is inserted into the idr, | |
213 | * ipc_obtain_object_idr() or ipc_obtain_object_check() can find it, | |
214 | * and the lockless preparations for ipc operations can start. | |
215 | * This means especially: permission checks, audit calls, allocation | |
216 | * of undo structures, ... | |
217 | * | |
218 | * Thus the object must be fully initialized, and if something fails, | |
219 | * then the full tear-down sequence must be followed. | |
220 | * (i.e.: set new->deleted, reduce refcount, call_rcu()) | |
221 | */ | |
222 | ||
223 | if (next_id < 0) { /* !CHECKPOINT_RESTORE or next_id is unset */ | |
99db46ea MS |
224 | int max_idx; |
225 | ||
226 | max_idx = max(ids->in_use*3/2, ipc_min_cycle); | |
227 | max_idx = min(max_idx, ipc_mni); | |
3278a2c2 MS |
228 | |
229 | /* allocate the idx, with a NULL struct kern_ipc_perm */ | |
99db46ea MS |
230 | idx = idr_alloc_cyclic(&ids->ipcs_idr, NULL, 0, max_idx, |
231 | GFP_NOWAIT); | |
3278a2c2 MS |
232 | |
233 | if (idx >= 0) { | |
234 | /* | |
235 | * idx got allocated successfully. | |
236 | * Now calculate the sequence number and set the | |
237 | * pointer for real. | |
238 | */ | |
239 | if (idx <= ids->last_idx) { | |
240 | ids->seq++; | |
241 | if (ids->seq >= ipcid_seq_max()) | |
242 | ids->seq = 0; | |
243 | } | |
244 | ids->last_idx = idx; | |
245 | ||
246 | new->seq = ids->seq; | |
247 | /* no need for smp_wmb(), this is done | |
248 | * inside idr_replace, as part of | |
249 | * rcu_assign_pointer | |
250 | */ | |
251 | idr_replace(&ids->ipcs_idr, new, idx); | |
252 | } | |
b8fd9983 | 253 | } else { |
e2652ae6 MS |
254 | new->seq = ipcid_to_seqx(next_id); |
255 | idx = idr_alloc(&ids->ipcs_idr, new, ipcid_to_idx(next_id), | |
256 | 0, GFP_NOWAIT); | |
b8fd9983 | 257 | } |
e2652ae6 | 258 | if (idx >= 0) |
3278a2c2 | 259 | new->id = (new->seq << ipcmni_seq_shift()) + idx; |
e2652ae6 | 260 | return idx; |
b8fd9983 DB |
261 | } |
262 | ||
1da177e4 | 263 | /** |
8001c858 DB |
264 | * ipc_addid - add an ipc identifier |
265 | * @ids: ipc identifier set | |
266 | * @new: new ipc permission set | |
ebf66799 | 267 | * @limit: limit for the number of used ids |
1da177e4 | 268 | * |
8001c858 | 269 | * Add an entry 'new' to the ipc ids idr. The permissions object is |
27c331a1 | 270 | * initialised and the first free entry is set up and the index assigned |
8001c858 | 271 | * is returned. The 'new' entry is returned in a locked state on success. |
39cfffd7 | 272 | * |
8001c858 | 273 | * On failure the entry is not locked and a negative err-code is returned. |
39cfffd7 | 274 | * The caller must use ipc_rcu_putref() to free the identifier. |
1da177e4 | 275 | * |
8001c858 | 276 | * Called with writer ipc_ids.rwsem held. |
1da177e4 | 277 | */ |
ebf66799 | 278 | int ipc_addid(struct ipc_ids *ids, struct kern_ipc_perm *new, int limit) |
1da177e4 | 279 | { |
1efdb69b EB |
280 | kuid_t euid; |
281 | kgid_t egid; | |
e2652ae6 | 282 | int idx, err; |
1da177e4 | 283 | |
39cfffd7 MS |
284 | /* 1) Initialize the refcount so that ipc_rcu_putref works */ |
285 | refcount_set(&new->refcount, 1); | |
286 | ||
5ac893b8 WL |
287 | if (limit > ipc_mni) |
288 | limit = ipc_mni; | |
7ca7e564 | 289 | |
dc2c8c84 | 290 | if (ids->in_use >= limit) |
283bb7fa | 291 | return -ENOSPC; |
7ca7e564 | 292 | |
54924ea3 TH |
293 | idr_preload(GFP_KERNEL); |
294 | ||
e00b4ff7 | 295 | spin_lock_init(&new->lock); |
e00b4ff7 ND |
296 | rcu_read_lock(); |
297 | spin_lock(&new->lock); | |
298 | ||
b9a53227 LT |
299 | current_euid_egid(&euid, &egid); |
300 | new->cuid = new->uid = euid; | |
301 | new->gid = new->cgid = egid; | |
302 | ||
39cfffd7 MS |
303 | new->deleted = false; |
304 | ||
e2652ae6 | 305 | idx = ipc_idr_alloc(ids, new); |
54924ea3 | 306 | idr_preload_end(); |
0cfb6aee | 307 | |
e2652ae6 | 308 | if (idx >= 0 && new->key != IPC_PRIVATE) { |
0cfb6aee GK |
309 | err = rhashtable_insert_fast(&ids->key_ht, &new->khtnode, |
310 | ipc_kht_params); | |
311 | if (err < 0) { | |
e2652ae6 MS |
312 | idr_remove(&ids->ipcs_idr, idx); |
313 | idx = err; | |
0cfb6aee GK |
314 | } |
315 | } | |
e2652ae6 | 316 | if (idx < 0) { |
39cfffd7 | 317 | new->deleted = true; |
e00b4ff7 ND |
318 | spin_unlock(&new->lock); |
319 | rcu_read_unlock(); | |
e2652ae6 | 320 | return idx; |
e00b4ff7 | 321 | } |
7ca7e564 | 322 | |
1da177e4 | 323 | ids->in_use++; |
27c331a1 MS |
324 | if (idx > ids->max_idx) |
325 | ids->max_idx = idx; | |
e2652ae6 | 326 | return idx; |
1da177e4 LT |
327 | } |
328 | ||
7748dbfa | 329 | /** |
8001c858 DB |
330 | * ipcget_new - create a new ipc object |
331 | * @ns: ipc namespace | |
da3dae54 | 332 | * @ids: ipc identifier set |
8001c858 DB |
333 | * @ops: the actual creation routine to call |
334 | * @params: its parameters | |
335 | * | |
336 | * This routine is called by sys_msgget, sys_semget() and sys_shmget() | |
337 | * when the key is IPC_PRIVATE. | |
7748dbfa | 338 | */ |
b2d75cdd | 339 | static int ipcget_new(struct ipc_namespace *ns, struct ipc_ids *ids, |
eb66ec44 | 340 | const struct ipc_ops *ops, struct ipc_params *params) |
7748dbfa ND |
341 | { |
342 | int err; | |
7748dbfa | 343 | |
d9a605e4 | 344 | down_write(&ids->rwsem); |
7748dbfa | 345 | err = ops->getnew(ns, params); |
d9a605e4 | 346 | up_write(&ids->rwsem); |
7748dbfa ND |
347 | return err; |
348 | } | |
349 | ||
350 | /** | |
8001c858 DB |
351 | * ipc_check_perms - check security and permissions for an ipc object |
352 | * @ns: ipc namespace | |
353 | * @ipcp: ipc permission set | |
354 | * @ops: the actual security routine to call | |
355 | * @params: its parameters | |
f4566f04 | 356 | * |
8001c858 DB |
357 | * This routine is called by sys_msgget(), sys_semget() and sys_shmget() |
358 | * when the key is not IPC_PRIVATE and that key already exists in the | |
359 | * ds IDR. | |
f4566f04 | 360 | * |
8001c858 | 361 | * On success, the ipc id is returned. |
f4566f04 | 362 | * |
8001c858 | 363 | * It is called with ipc_ids.rwsem and ipcp->lock held. |
7748dbfa | 364 | */ |
b0e77598 SH |
365 | static int ipc_check_perms(struct ipc_namespace *ns, |
366 | struct kern_ipc_perm *ipcp, | |
eb66ec44 | 367 | const struct ipc_ops *ops, |
b0e77598 | 368 | struct ipc_params *params) |
7748dbfa ND |
369 | { |
370 | int err; | |
371 | ||
b0e77598 | 372 | if (ipcperms(ns, ipcp, params->flg)) |
7748dbfa ND |
373 | err = -EACCES; |
374 | else { | |
375 | err = ops->associate(ipcp, params->flg); | |
376 | if (!err) | |
377 | err = ipcp->id; | |
378 | } | |
379 | ||
380 | return err; | |
381 | } | |
382 | ||
383 | /** | |
8001c858 DB |
384 | * ipcget_public - get an ipc object or create a new one |
385 | * @ns: ipc namespace | |
da3dae54 | 386 | * @ids: ipc identifier set |
8001c858 DB |
387 | * @ops: the actual creation routine to call |
388 | * @params: its parameters | |
389 | * | |
390 | * This routine is called by sys_msgget, sys_semget() and sys_shmget() | |
391 | * when the key is not IPC_PRIVATE. | |
392 | * It adds a new entry if the key is not found and does some permission | |
393 | * / security checkings if the key is found. | |
394 | * | |
395 | * On success, the ipc id is returned. | |
7748dbfa | 396 | */ |
b2d75cdd | 397 | static int ipcget_public(struct ipc_namespace *ns, struct ipc_ids *ids, |
eb66ec44 | 398 | const struct ipc_ops *ops, struct ipc_params *params) |
7748dbfa ND |
399 | { |
400 | struct kern_ipc_perm *ipcp; | |
401 | int flg = params->flg; | |
402 | int err; | |
7748dbfa | 403 | |
3e148c79 ND |
404 | /* |
405 | * Take the lock as a writer since we are potentially going to add | |
406 | * a new entry + read locks are not "upgradable" | |
407 | */ | |
d9a605e4 | 408 | down_write(&ids->rwsem); |
7748dbfa ND |
409 | ipcp = ipc_findkey(ids, params->key); |
410 | if (ipcp == NULL) { | |
411 | /* key not used */ | |
412 | if (!(flg & IPC_CREAT)) | |
413 | err = -ENOENT; | |
7748dbfa ND |
414 | else |
415 | err = ops->getnew(ns, params); | |
416 | } else { | |
417 | /* ipc object has been locked by ipc_findkey() */ | |
418 | ||
419 | if (flg & IPC_CREAT && flg & IPC_EXCL) | |
420 | err = -EEXIST; | |
421 | else { | |
422 | err = 0; | |
423 | if (ops->more_checks) | |
424 | err = ops->more_checks(ipcp, params); | |
425 | if (!err) | |
f4566f04 ND |
426 | /* |
427 | * ipc_check_perms returns the IPC id on | |
428 | * success | |
429 | */ | |
b0e77598 | 430 | err = ipc_check_perms(ns, ipcp, ops, params); |
7748dbfa ND |
431 | } |
432 | ipc_unlock(ipcp); | |
433 | } | |
d9a605e4 | 434 | up_write(&ids->rwsem); |
7748dbfa ND |
435 | |
436 | return err; | |
437 | } | |
438 | ||
0cfb6aee GK |
439 | /** |
440 | * ipc_kht_remove - remove an ipc from the key hashtable | |
441 | * @ids: ipc identifier set | |
442 | * @ipcp: ipc perm structure containing the key to remove | |
443 | * | |
444 | * ipc_ids.rwsem (as a writer) and the spinlock for this ID are held | |
445 | * before this function is called, and remain locked on the exit. | |
446 | */ | |
447 | static void ipc_kht_remove(struct ipc_ids *ids, struct kern_ipc_perm *ipcp) | |
448 | { | |
449 | if (ipcp->key != IPC_PRIVATE) | |
450 | rhashtable_remove_fast(&ids->key_ht, &ipcp->khtnode, | |
451 | ipc_kht_params); | |
452 | } | |
7748dbfa | 453 | |
b869d5be MS |
454 | /** |
455 | * ipc_search_maxidx - search for the highest assigned index | |
456 | * @ids: ipc identifier set | |
457 | * @limit: known upper limit for highest assigned index | |
458 | * | |
459 | * The function determines the highest assigned index in @ids. It is intended | |
460 | * to be called when ids->max_idx needs to be updated. | |
461 | * Updating ids->max_idx is necessary when the current highest index ipc | |
462 | * object is deleted. | |
463 | * If no ipc object is allocated, then -1 is returned. | |
464 | * | |
465 | * ipc_ids.rwsem needs to be held by the caller. | |
466 | */ | |
467 | static int ipc_search_maxidx(struct ipc_ids *ids, int limit) | |
468 | { | |
469 | int tmpidx; | |
470 | int i; | |
471 | int retval; | |
472 | ||
473 | i = ilog2(limit+1); | |
474 | ||
475 | retval = 0; | |
476 | for (; i >= 0; i--) { | |
477 | tmpidx = retval | (1<<i); | |
478 | /* | |
479 | * "0" is a possible index value, thus search using | |
480 | * e.g. 15,7,3,1,0 instead of 16,8,4,2,1. | |
481 | */ | |
482 | tmpidx = tmpidx-1; | |
483 | if (idr_get_next(&ids->ipcs_idr, &tmpidx)) | |
484 | retval |= (1<<i); | |
485 | } | |
486 | return retval - 1; | |
487 | } | |
488 | ||
1da177e4 | 489 | /** |
8001c858 DB |
490 | * ipc_rmid - remove an ipc identifier |
491 | * @ids: ipc identifier set | |
492 | * @ipcp: ipc perm structure containing the identifier to remove | |
1da177e4 | 493 | * |
8001c858 DB |
494 | * ipc_ids.rwsem (as a writer) and the spinlock for this ID are held |
495 | * before this function is called, and remain locked on the exit. | |
1da177e4 | 496 | */ |
7ca7e564 | 497 | void ipc_rmid(struct ipc_ids *ids, struct kern_ipc_perm *ipcp) |
1da177e4 | 498 | { |
27c331a1 | 499 | int idx = ipcid_to_idx(ipcp->id); |
7ca7e564 | 500 | |
27c331a1 | 501 | idr_remove(&ids->ipcs_idr, idx); |
0cfb6aee | 502 | ipc_kht_remove(ids, ipcp); |
1da177e4 | 503 | ids->in_use--; |
72a8ff2f | 504 | ipcp->deleted = true; |
15df03c8 | 505 | |
27c331a1 | 506 | if (unlikely(idx == ids->max_idx)) { |
b869d5be MS |
507 | idx = ids->max_idx-1; |
508 | if (idx >= 0) | |
509 | idx = ipc_search_maxidx(ids, idx); | |
27c331a1 | 510 | ids->max_idx = idx; |
15df03c8 | 511 | } |
1da177e4 LT |
512 | } |
513 | ||
0cfb6aee GK |
514 | /** |
515 | * ipc_set_key_private - switch the key of an existing ipc to IPC_PRIVATE | |
516 | * @ids: ipc identifier set | |
517 | * @ipcp: ipc perm structure containing the key to modify | |
518 | * | |
519 | * ipc_ids.rwsem (as a writer) and the spinlock for this ID are held | |
520 | * before this function is called, and remain locked on the exit. | |
521 | */ | |
522 | void ipc_set_key_private(struct ipc_ids *ids, struct kern_ipc_perm *ipcp) | |
523 | { | |
524 | ipc_kht_remove(ids, ipcp); | |
525 | ipcp->key = IPC_PRIVATE; | |
526 | } | |
527 | ||
2a9d6481 | 528 | bool ipc_rcu_getref(struct kern_ipc_perm *ptr) |
1da177e4 | 529 | { |
9405c03e | 530 | return refcount_inc_not_zero(&ptr->refcount); |
65f27f38 DH |
531 | } |
532 | ||
dba4cdd3 MS |
533 | void ipc_rcu_putref(struct kern_ipc_perm *ptr, |
534 | void (*func)(struct rcu_head *head)) | |
1da177e4 | 535 | { |
9405c03e | 536 | if (!refcount_dec_and_test(&ptr->refcount)) |
1da177e4 LT |
537 | return; |
538 | ||
dba4cdd3 | 539 | call_rcu(&ptr->rcu, func); |
53dad6d3 DB |
540 | } |
541 | ||
1da177e4 | 542 | /** |
8001c858 DB |
543 | * ipcperms - check ipc permissions |
544 | * @ns: ipc namespace | |
545 | * @ipcp: ipc permission set | |
546 | * @flag: desired permission set | |
1da177e4 | 547 | * |
8001c858 DB |
548 | * Check user, group, other permissions for access |
549 | * to ipc resources. return 0 if allowed | |
b0e77598 | 550 | * |
0e056eb5 | 551 | * @flag will most probably be 0 or ``S_...UGO`` from <linux/stat.h> |
1da177e4 | 552 | */ |
b0e77598 SH |
553 | int ipcperms(struct ipc_namespace *ns, struct kern_ipc_perm *ipcp, short flag) |
554 | { | |
1efdb69b | 555 | kuid_t euid = current_euid(); |
a33e6751 | 556 | int requested_mode, granted_mode; |
1da177e4 | 557 | |
a33e6751 | 558 | audit_ipc_obj(ipcp); |
1da177e4 LT |
559 | requested_mode = (flag >> 6) | (flag >> 3) | flag; |
560 | granted_mode = ipcp->mode; | |
1efdb69b EB |
561 | if (uid_eq(euid, ipcp->cuid) || |
562 | uid_eq(euid, ipcp->uid)) | |
1da177e4 LT |
563 | granted_mode >>= 6; |
564 | else if (in_group_p(ipcp->cgid) || in_group_p(ipcp->gid)) | |
565 | granted_mode >>= 3; | |
566 | /* is there some bit set in requested_mode but not in granted_mode? */ | |
46c0a8ca | 567 | if ((requested_mode & ~granted_mode & 0007) && |
b0e77598 | 568 | !ns_capable(ns->user_ns, CAP_IPC_OWNER)) |
1da177e4 LT |
569 | return -1; |
570 | ||
571 | return security_ipc_permission(ipcp, flag); | |
572 | } | |
573 | ||
574 | /* | |
575 | * Functions to convert between the kern_ipc_perm structure and the | |
576 | * old/new ipc_perm structures | |
577 | */ | |
578 | ||
579 | /** | |
8001c858 DB |
580 | * kernel_to_ipc64_perm - convert kernel ipc permissions to user |
581 | * @in: kernel permissions | |
582 | * @out: new style ipc permissions | |
1da177e4 | 583 | * |
8001c858 DB |
584 | * Turn the kernel object @in into a set of permissions descriptions |
585 | * for returning to userspace (@out). | |
1da177e4 | 586 | */ |
239521f3 | 587 | void kernel_to_ipc64_perm(struct kern_ipc_perm *in, struct ipc64_perm *out) |
1da177e4 LT |
588 | { |
589 | out->key = in->key; | |
1efdb69b EB |
590 | out->uid = from_kuid_munged(current_user_ns(), in->uid); |
591 | out->gid = from_kgid_munged(current_user_ns(), in->gid); | |
592 | out->cuid = from_kuid_munged(current_user_ns(), in->cuid); | |
593 | out->cgid = from_kgid_munged(current_user_ns(), in->cgid); | |
1da177e4 LT |
594 | out->mode = in->mode; |
595 | out->seq = in->seq; | |
596 | } | |
597 | ||
598 | /** | |
8001c858 DB |
599 | * ipc64_perm_to_ipc_perm - convert new ipc permissions to old |
600 | * @in: new style ipc permissions | |
601 | * @out: old style ipc permissions | |
1da177e4 | 602 | * |
8001c858 DB |
603 | * Turn the new style permissions object @in into a compatibility |
604 | * object and store it into the @out pointer. | |
1da177e4 | 605 | */ |
239521f3 | 606 | void ipc64_perm_to_ipc_perm(struct ipc64_perm *in, struct ipc_perm *out) |
1da177e4 LT |
607 | { |
608 | out->key = in->key; | |
609 | SET_UID(out->uid, in->uid); | |
610 | SET_GID(out->gid, in->gid); | |
611 | SET_UID(out->cuid, in->cuid); | |
612 | SET_GID(out->cgid, in->cgid); | |
613 | out->mode = in->mode; | |
614 | out->seq = in->seq; | |
615 | } | |
616 | ||
4d2bff5e | 617 | /** |
0cfb6aee | 618 | * ipc_obtain_object_idr |
4d2bff5e DB |
619 | * @ids: ipc identifier set |
620 | * @id: ipc id to look for | |
621 | * | |
622 | * Look for an id in the ipc ids idr and return associated ipc object. | |
623 | * | |
624 | * Call inside the RCU critical section. | |
625 | * The ipc object is *not* locked on exit. | |
626 | */ | |
55b7ae50 | 627 | struct kern_ipc_perm *ipc_obtain_object_idr(struct ipc_ids *ids, int id) |
4d2bff5e DB |
628 | { |
629 | struct kern_ipc_perm *out; | |
27c331a1 | 630 | int idx = ipcid_to_idx(id); |
4d2bff5e | 631 | |
27c331a1 | 632 | out = idr_find(&ids->ipcs_idr, idx); |
4d2bff5e DB |
633 | if (!out) |
634 | return ERR_PTR(-EINVAL); | |
635 | ||
636 | return out; | |
637 | } | |
638 | ||
4d2bff5e DB |
639 | /** |
640 | * ipc_obtain_object_check | |
641 | * @ids: ipc identifier set | |
642 | * @id: ipc id to look for | |
643 | * | |
2e5ceb45 MS |
644 | * Similar to ipc_obtain_object_idr() but also checks the ipc object |
645 | * sequence number. | |
4d2bff5e DB |
646 | * |
647 | * Call inside the RCU critical section. | |
648 | * The ipc object is *not* locked on exit. | |
649 | */ | |
650 | struct kern_ipc_perm *ipc_obtain_object_check(struct ipc_ids *ids, int id) | |
651 | { | |
55b7ae50 | 652 | struct kern_ipc_perm *out = ipc_obtain_object_idr(ids, id); |
4d2bff5e DB |
653 | |
654 | if (IS_ERR(out)) | |
655 | goto out; | |
656 | ||
657 | if (ipc_checkid(out, id)) | |
6157dbbf | 658 | return ERR_PTR(-EINVAL); |
4d2bff5e | 659 | out: |
1da177e4 LT |
660 | return out; |
661 | } | |
662 | ||
b2d75cdd PE |
663 | /** |
664 | * ipcget - Common sys_*get() code | |
da3dae54 | 665 | * @ns: namespace |
8001c858 DB |
666 | * @ids: ipc identifier set |
667 | * @ops: operations to be called on ipc object creation, permission checks | |
668 | * and further checks | |
669 | * @params: the parameters needed by the previous operations. | |
b2d75cdd PE |
670 | * |
671 | * Common routine called by sys_msgget(), sys_semget() and sys_shmget(). | |
672 | */ | |
673 | int ipcget(struct ipc_namespace *ns, struct ipc_ids *ids, | |
eb66ec44 | 674 | const struct ipc_ops *ops, struct ipc_params *params) |
b2d75cdd PE |
675 | { |
676 | if (params->key == IPC_PRIVATE) | |
677 | return ipcget_new(ns, ids, ops, params); | |
678 | else | |
679 | return ipcget_public(ns, ids, ops, params); | |
680 | } | |
681 | ||
8f4a3809 | 682 | /** |
8001c858 | 683 | * ipc_update_perm - update the permissions of an ipc object |
8f4a3809 PP |
684 | * @in: the permission given as input. |
685 | * @out: the permission of the ipc to set. | |
686 | */ | |
1efdb69b | 687 | int ipc_update_perm(struct ipc64_perm *in, struct kern_ipc_perm *out) |
8f4a3809 | 688 | { |
1efdb69b EB |
689 | kuid_t uid = make_kuid(current_user_ns(), in->uid); |
690 | kgid_t gid = make_kgid(current_user_ns(), in->gid); | |
691 | if (!uid_valid(uid) || !gid_valid(gid)) | |
692 | return -EINVAL; | |
693 | ||
694 | out->uid = uid; | |
695 | out->gid = gid; | |
8f4a3809 PP |
696 | out->mode = (out->mode & ~S_IRWXUGO) |
697 | | (in->mode & S_IRWXUGO); | |
1efdb69b EB |
698 | |
699 | return 0; | |
8f4a3809 PP |
700 | } |
701 | ||
a5f75e7f | 702 | /** |
4241c1a3 | 703 | * ipcctl_obtain_check - retrieve an ipc object and check permissions |
8001c858 | 704 | * @ns: ipc namespace |
a5f75e7f PP |
705 | * @ids: the table of ids where to look for the ipc |
706 | * @id: the id of the ipc to retrieve | |
707 | * @cmd: the cmd to check | |
708 | * @perm: the permission to set | |
709 | * @extra_perm: one extra permission parameter used by msq | |
710 | * | |
711 | * This function does some common audit and permissions check for some IPC_XXX | |
712 | * cmd and is called from semctl_down, shmctl_down and msgctl_down. | |
0e056eb5 | 713 | * |
4241c1a3 MS |
714 | * It: |
715 | * - retrieves the ipc object with the given id in the given table. | |
0e056eb5 MCC |
716 | * - performs some audit and permission check, depending on the given cmd |
717 | * - returns a pointer to the ipc object or otherwise, the corresponding | |
718 | * error. | |
7b4cc5d8 | 719 | * |
d9a605e4 | 720 | * Call holding the both the rwsem and the rcu read lock. |
a5f75e7f | 721 | */ |
4241c1a3 | 722 | struct kern_ipc_perm *ipcctl_obtain_check(struct ipc_namespace *ns, |
3b1c4ad3 DB |
723 | struct ipc_ids *ids, int id, int cmd, |
724 | struct ipc64_perm *perm, int extra_perm) | |
444d0f62 | 725 | { |
1efdb69b | 726 | kuid_t euid; |
444d0f62 DB |
727 | int err = -EPERM; |
728 | struct kern_ipc_perm *ipcp; | |
a5f75e7f | 729 | |
444d0f62 | 730 | ipcp = ipc_obtain_object_check(ids, id); |
a5f75e7f PP |
731 | if (IS_ERR(ipcp)) { |
732 | err = PTR_ERR(ipcp); | |
7b4cc5d8 | 733 | goto err; |
a5f75e7f PP |
734 | } |
735 | ||
a33e6751 | 736 | audit_ipc_obj(ipcp); |
e816f370 AV |
737 | if (cmd == IPC_SET) |
738 | audit_ipc_set_perm(extra_perm, perm->uid, | |
444d0f62 | 739 | perm->gid, perm->mode); |
414c0708 DH |
740 | |
741 | euid = current_euid(); | |
1efdb69b | 742 | if (uid_eq(euid, ipcp->cuid) || uid_eq(euid, ipcp->uid) || |
b0e77598 | 743 | ns_capable(ns->user_ns, CAP_SYS_ADMIN)) |
7b4cc5d8 DB |
744 | return ipcp; /* successful lookup */ |
745 | err: | |
a5f75e7f PP |
746 | return ERR_PTR(err); |
747 | } | |
748 | ||
c1d7e01d | 749 | #ifdef CONFIG_ARCH_WANT_IPC_PARSE_VERSION |
1da177e4 LT |
750 | |
751 | ||
752 | /** | |
8001c858 DB |
753 | * ipc_parse_version - ipc call version |
754 | * @cmd: pointer to command | |
1da177e4 | 755 | * |
8001c858 DB |
756 | * Return IPC_64 for new style IPC and IPC_OLD for old style IPC. |
757 | * The @cmd value is turned from an encoding command and version into | |
758 | * just the command code. | |
1da177e4 | 759 | */ |
239521f3 | 760 | int ipc_parse_version(int *cmd) |
1da177e4 LT |
761 | { |
762 | if (*cmd & IPC_64) { | |
763 | *cmd ^= IPC_64; | |
764 | return IPC_64; | |
765 | } else { | |
766 | return IPC_OLD; | |
767 | } | |
768 | } | |
769 | ||
c1d7e01d | 770 | #endif /* CONFIG_ARCH_WANT_IPC_PARSE_VERSION */ |
ae781774 MW |
771 | |
772 | #ifdef CONFIG_PROC_FS | |
/* Per-open state of a sysvipc proc file, found in seq_file->private. */
struct ipc_proc_iter {
	struct ipc_namespace *ns;	/* namespace whose ids[] are walked */
	struct pid_namespace *pid_ns;	/* returned by ipc_seq_pid_ns() */
	struct ipc_proc_iface *iface;	/* descriptor of the proc file */
};
778 | ||
03f1fc09 EB |
779 | struct pid_namespace *ipc_seq_pid_ns(struct seq_file *s) |
780 | { | |
781 | struct ipc_proc_iter *iter = s->private; | |
782 | return iter->pid_ns; | |
783 | } | |
784 | ||
7ca7e564 ND |
785 | /* |
786 | * This routine locks the ipc structure found at least at position pos. | |
787 | */ | |
b524b9ad AB |
788 | static struct kern_ipc_perm *sysvipc_find_ipc(struct ipc_ids *ids, loff_t pos, |
789 | loff_t *new_pos) | |
ae781774 | 790 | { |
20401d10 RA |
791 | struct kern_ipc_perm *ipc = NULL; |
792 | int max_idx = ipc_get_maxidx(ids); | |
ae781774 | 793 | |
20401d10 | 794 | if (max_idx == -1 || pos > max_idx) |
5e698222 | 795 | goto out; |
ae781774 | 796 | |
20401d10 | 797 | for (; pos <= max_idx; pos++) { |
7ca7e564 ND |
798 | ipc = idr_find(&ids->ipcs_idr, pos); |
799 | if (ipc != NULL) { | |
32a27500 DB |
800 | rcu_read_lock(); |
801 | ipc_lock_object(ipc); | |
5e698222 | 802 | break; |
ae781774 MW |
803 | } |
804 | } | |
5e698222 VA |
805 | out: |
806 | *new_pos = pos + 1; | |
807 | return ipc; | |
ae781774 MW |
808 | } |
809 | ||
7ca7e564 ND |
810 | static void *sysvipc_proc_next(struct seq_file *s, void *it, loff_t *pos) |
811 | { | |
812 | struct ipc_proc_iter *iter = s->private; | |
813 | struct ipc_proc_iface *iface = iter->iface; | |
814 | struct kern_ipc_perm *ipc = it; | |
815 | ||
816 | /* If we had an ipc id locked before, unlock it */ | |
817 | if (ipc && ipc != SEQ_START_TOKEN) | |
818 | ipc_unlock(ipc); | |
819 | ||
ed2ddbf8 | 820 | return sysvipc_find_ipc(&iter->ns->ids[iface->ids], *pos, pos); |
7ca7e564 ND |
821 | } |
822 | ||
ae781774 | 823 | /* |
f4566f04 ND |
824 | * File positions: pos 0 -> header, pos n -> ipc id = n - 1. |
825 | * SeqFile iterator: iterator value locked ipc pointer or SEQ_TOKEN_START. | |
ae781774 MW |
826 | */ |
827 | static void *sysvipc_proc_start(struct seq_file *s, loff_t *pos) | |
828 | { | |
bc1fc6d8 EB |
829 | struct ipc_proc_iter *iter = s->private; |
830 | struct ipc_proc_iface *iface = iter->iface; | |
73ea4130 KK |
831 | struct ipc_ids *ids; |
832 | ||
ed2ddbf8 | 833 | ids = &iter->ns->ids[iface->ids]; |
ae781774 MW |
834 | |
835 | /* | |
836 | * Take the lock - this will be released by the corresponding | |
837 | * call to stop(). | |
838 | */ | |
d9a605e4 | 839 | down_read(&ids->rwsem); |
ae781774 MW |
840 | |
841 | /* pos < 0 is invalid */ | |
842 | if (*pos < 0) | |
843 | return NULL; | |
844 | ||
845 | /* pos == 0 means header */ | |
846 | if (*pos == 0) | |
847 | return SEQ_START_TOKEN; | |
848 | ||
849 | /* Find the (pos-1)th ipc */ | |
7ca7e564 | 850 | return sysvipc_find_ipc(ids, *pos - 1, pos); |
ae781774 MW |
851 | } |
852 | ||
853 | static void sysvipc_proc_stop(struct seq_file *s, void *it) | |
854 | { | |
855 | struct kern_ipc_perm *ipc = it; | |
bc1fc6d8 EB |
856 | struct ipc_proc_iter *iter = s->private; |
857 | struct ipc_proc_iface *iface = iter->iface; | |
73ea4130 | 858 | struct ipc_ids *ids; |
ae781774 | 859 | |
f4566f04 | 860 | /* If we had a locked structure, release it */ |
ae781774 MW |
861 | if (ipc && ipc != SEQ_START_TOKEN) |
862 | ipc_unlock(ipc); | |
863 | ||
ed2ddbf8 | 864 | ids = &iter->ns->ids[iface->ids]; |
ae781774 | 865 | /* Release the lock we took in start() */ |
d9a605e4 | 866 | up_read(&ids->rwsem); |
ae781774 MW |
867 | } |
868 | ||
869 | static int sysvipc_proc_show(struct seq_file *s, void *it) | |
870 | { | |
bc1fc6d8 EB |
871 | struct ipc_proc_iter *iter = s->private; |
872 | struct ipc_proc_iface *iface = iter->iface; | |
ae781774 | 873 | |
7f032d6e JP |
874 | if (it == SEQ_START_TOKEN) { |
875 | seq_puts(s, iface->header); | |
876 | return 0; | |
877 | } | |
ae781774 MW |
878 | |
879 | return iface->show(s, it); | |
880 | } | |
881 | ||
88e9d34c | 882 | static const struct seq_operations sysvipc_proc_seqops = { |
ae781774 MW |
883 | .start = sysvipc_proc_start, |
884 | .stop = sysvipc_proc_stop, | |
885 | .next = sysvipc_proc_next, | |
886 | .show = sysvipc_proc_show, | |
887 | }; | |
888 | ||
bc1fc6d8 EB |
889 | static int sysvipc_proc_open(struct inode *inode, struct file *file) |
890 | { | |
bc1fc6d8 EB |
891 | struct ipc_proc_iter *iter; |
892 | ||
d66a0520 | 893 | iter = __seq_open_private(file, &sysvipc_proc_seqops, sizeof(*iter)); |
bc1fc6d8 | 894 | if (!iter) |
d66a0520 | 895 | return -ENOMEM; |
bc1fc6d8 | 896 | |
d9dda78b | 897 | iter->iface = PDE_DATA(inode); |
bc1fc6d8 | 898 | iter->ns = get_ipc_ns(current->nsproxy->ipc_ns); |
03f1fc09 | 899 | iter->pid_ns = get_pid_ns(task_active_pid_ns(current)); |
d66a0520 RJ |
900 | |
901 | return 0; | |
bc1fc6d8 EB |
902 | } |
903 | ||
904 | static int sysvipc_proc_release(struct inode *inode, struct file *file) | |
905 | { | |
906 | struct seq_file *seq = file->private_data; | |
907 | struct ipc_proc_iter *iter = seq->private; | |
908 | put_ipc_ns(iter->ns); | |
03f1fc09 | 909 | put_pid_ns(iter->pid_ns); |
bc1fc6d8 | 910 | return seq_release_private(inode, file); |
ae781774 MW |
911 | } |
912 | ||
97a32539 | 913 | static const struct proc_ops sysvipc_proc_ops = { |
d919b33d | 914 | .proc_flags = PROC_ENTRY_PERMANENT, |
97a32539 AD |
915 | .proc_open = sysvipc_proc_open, |
916 | .proc_read = seq_read, | |
917 | .proc_lseek = seq_lseek, | |
918 | .proc_release = sysvipc_proc_release, | |
ae781774 MW |
919 | }; |
920 | #endif /* CONFIG_PROC_FS */ |