sysv_sem.c revision 1.68.6.1 1 1.68.6.1 reinoud /* $NetBSD: sysv_sem.c,v 1.68.6.1 2007/12/09 16:04:02 reinoud Exp $ */
2 1.33 thorpej
3 1.33 thorpej /*-
4 1.33 thorpej * Copyright (c) 1999 The NetBSD Foundation, Inc.
5 1.33 thorpej * All rights reserved.
6 1.33 thorpej *
7 1.33 thorpej * This code is derived from software contributed to The NetBSD Foundation
8 1.33 thorpej * by Jason R. Thorpe of the Numerical Aerospace Simulation Facility,
9 1.33 thorpej * NASA Ames Research Center.
10 1.33 thorpej *
11 1.33 thorpej * Redistribution and use in source and binary forms, with or without
12 1.33 thorpej * modification, are permitted provided that the following conditions
13 1.33 thorpej * are met:
14 1.33 thorpej * 1. Redistributions of source code must retain the above copyright
15 1.33 thorpej * notice, this list of conditions and the following disclaimer.
16 1.33 thorpej * 2. Redistributions in binary form must reproduce the above copyright
17 1.33 thorpej * notice, this list of conditions and the following disclaimer in the
18 1.33 thorpej * documentation and/or other materials provided with the distribution.
19 1.33 thorpej * 3. All advertising materials mentioning features or use of this software
20 1.33 thorpej * must display the following acknowledgement:
21 1.33 thorpej * This product includes software developed by the NetBSD
22 1.33 thorpej * Foundation, Inc. and its contributors.
23 1.33 thorpej * 4. Neither the name of The NetBSD Foundation nor the names of its
24 1.33 thorpej * contributors may be used to endorse or promote products derived
25 1.33 thorpej * from this software without specific prior written permission.
26 1.33 thorpej *
27 1.33 thorpej * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
28 1.33 thorpej * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
29 1.33 thorpej * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
30 1.33 thorpej * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
31 1.33 thorpej * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
32 1.33 thorpej * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
33 1.33 thorpej * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
34 1.33 thorpej * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
35 1.33 thorpej * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
36 1.33 thorpej * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
37 1.33 thorpej * POSSIBILITY OF SUCH DAMAGE.
38 1.33 thorpej */
39 1.9 cgd
40 1.1 cgd /*
41 1.1 cgd * Implementation of SVID semaphores
42 1.1 cgd *
43 1.33 thorpej * Author: Daniel Boulet
44 1.1 cgd *
45 1.1 cgd * This software is provided ``AS IS'' without any warranties of any kind.
46 1.1 cgd */
47 1.42 lukem
48 1.42 lukem #include <sys/cdefs.h>
49 1.68.6.1 reinoud __KERNEL_RCSID(0, "$NetBSD: sysv_sem.c,v 1.68.6.1 2007/12/09 16:04:02 reinoud Exp $");
50 1.31 tron
51 1.32 tron #define SYSVSEM
52 1.1 cgd
53 1.3 mycroft #include <sys/param.h>
54 1.3 mycroft #include <sys/kernel.h>
55 1.3 mycroft #include <sys/sem.h>
56 1.38 simonb #include <sys/sysctl.h>
57 1.57 chs #include <sys/malloc.h>
58 1.38 simonb #include <sys/mount.h> /* XXX for <sys/syscallargs.h> */
59 1.10 cgd #include <sys/syscallargs.h>
60 1.61 elad #include <sys/kauth.h>
61 1.25 christos
/*
 * Subsystem state.  seminit() points sema, sem and semu at consecutive
 * regions of one kernel allocation.
 */
62 1.48 jdolecek static int semtot = 0; /* semaphores currently handed out from the sem pool */
63 1.48 jdolecek struct semid_ds *sema; /* semaphore id pool */
64 1.48 jdolecek static struct __sem *sem; /* semaphore pool */
65 1.48 jdolecek static struct sem_undo *semu_list; /* list of active undo structures */
66 1.48 jdolecek static int *semu; /* undo structure pool */
67 1.1 cgd
/*
 * Debug tracing: SEM_PRINTF((fmt, ...)) becomes a printf call when
 * SEM_DEBUG is defined and expands to nothing otherwise, so its
 * arguments must not have side effects.
 */
68 1.27 christos #ifdef SEM_DEBUG
69 1.28 christos #define SEM_PRINTF(a) printf a
70 1.27 christos #else
71 1.27 christos #define SEM_PRINTF(a)
72 1.27 christos #endif
73 1.27 christos
/* Undo-structure helpers defined later in this file. */
74 1.53 junyoung struct sem_undo *semu_alloc(struct proc *);
75 1.53 junyoung int semundo_adjust(struct proc *, struct sem_undo **, int, int, int);
76 1.53 junyoung void semundo_clear(int, int);
77 1.25 christos
78 1.37 sommerfe /*
79 1.37 sommerfe * XXXSMP Once we go MP, there needs to be a lock for the semaphore system.
80 1.37 sommerfe * Until then, we're saved by being a non-preemptive kernel.
81 1.37 sommerfe */
82 1.37 sommerfe
83 1.25 christos void
84 1.59 thorpej seminit(void)
85 1.1 cgd {
86 1.48 jdolecek int i, sz;
87 1.48 jdolecek vaddr_t v;
88 1.1 cgd
89 1.48 jdolecek /* Allocate pageable memory for our structures */
90 1.51 enami sz = seminfo.semmni * sizeof(struct semid_ds) +
91 1.51 enami seminfo.semmns * sizeof(struct __sem) +
92 1.51 enami seminfo.semmnu * seminfo.semusz;
93 1.56 yamt v = uvm_km_alloc(kernel_map, round_page(sz), 0,
94 1.56 yamt UVM_KMF_WIRED|UVM_KMF_ZERO);
95 1.56 yamt if (v == 0)
96 1.48 jdolecek panic("sysv_sem: cannot allocate memory");
97 1.48 jdolecek sema = (void *)v;
98 1.48 jdolecek sem = (void *)(sema + seminfo.semmni);
99 1.48 jdolecek semu = (void *)(sem + seminfo.semmns);
100 1.5 mycroft
101 1.5 mycroft for (i = 0; i < seminfo.semmni; i++) {
102 1.33 thorpej sema[i]._sem_base = 0;
103 1.5 mycroft sema[i].sem_perm.mode = 0;
104 1.5 mycroft }
105 1.5 mycroft for (i = 0; i < seminfo.semmnu; i++) {
106 1.35 augustss struct sem_undo *suptr = SEMU(i);
107 1.5 mycroft suptr->un_proc = NULL;
108 1.5 mycroft }
109 1.5 mycroft semu_list = NULL;
110 1.44 christos exithook_establish(semexit, NULL);
111 1.1 cgd }
112 1.1 cgd
113 1.1 cgd /*
114 1.37 sommerfe * Placebo.
115 1.1 cgd */
116 1.1 cgd
117 1.1 cgd int
118 1.66 yamt sys_semconfig(struct lwp *l, void *v, register_t *retval)
119 1.23 thorpej {
120 1.51 enami
121 1.5 mycroft *retval = 0;
122 1.37 sommerfe return 0;
123 1.1 cgd }
124 1.1 cgd
125 1.1 cgd /*
126 1.1 cgd * Allocate a new sem_undo structure for a process
127 1.1 cgd * (returns ptr to structure or NULL if no more room)
128 1.1 cgd */
129 1.1 cgd
130 1.1 cgd struct sem_undo *
131 1.59 thorpej semu_alloc(struct proc *p)
132 1.1 cgd {
133 1.35 augustss int i;
134 1.35 augustss struct sem_undo *suptr;
135 1.35 augustss struct sem_undo **supptr;
136 1.5 mycroft int attempt;
137 1.1 cgd
138 1.1 cgd /*
139 1.5 mycroft * Try twice to allocate something.
140 1.5 mycroft * (we'll purge any empty structures after the first pass so
141 1.5 mycroft * two passes are always enough)
142 1.1 cgd */
143 1.1 cgd
144 1.5 mycroft for (attempt = 0; attempt < 2; attempt++) {
145 1.5 mycroft /*
146 1.5 mycroft * Look for a free structure.
147 1.5 mycroft * Fill it in and return it if we find one.
148 1.5 mycroft */
149 1.5 mycroft
150 1.5 mycroft for (i = 0; i < seminfo.semmnu; i++) {
151 1.5 mycroft suptr = SEMU(i);
152 1.5 mycroft if (suptr->un_proc == NULL) {
153 1.5 mycroft suptr->un_next = semu_list;
154 1.5 mycroft semu_list = suptr;
155 1.5 mycroft suptr->un_cnt = 0;
156 1.5 mycroft suptr->un_proc = p;
157 1.51 enami return (suptr);
158 1.5 mycroft }
159 1.5 mycroft }
160 1.1 cgd
161 1.5 mycroft /*
162 1.5 mycroft * We didn't find a free one, if this is the first attempt
163 1.5 mycroft * then try to free some structures.
164 1.5 mycroft */
165 1.5 mycroft
166 1.5 mycroft if (attempt == 0) {
167 1.5 mycroft /* All the structures are in use - try to free some */
168 1.5 mycroft int did_something = 0;
169 1.5 mycroft
170 1.5 mycroft supptr = &semu_list;
171 1.5 mycroft while ((suptr = *supptr) != NULL) {
172 1.5 mycroft if (suptr->un_cnt == 0) {
173 1.5 mycroft suptr->un_proc = NULL;
174 1.5 mycroft *supptr = suptr->un_next;
175 1.5 mycroft did_something = 1;
176 1.5 mycroft } else
177 1.52 enami supptr = &suptr->un_next;
178 1.5 mycroft }
179 1.5 mycroft
180 1.5 mycroft /* If we didn't free anything then just give-up */
181 1.5 mycroft if (!did_something)
182 1.51 enami return (NULL);
183 1.5 mycroft } else {
184 1.5 mycroft /*
185 1.5 mycroft * The second pass failed even though we freed
186 1.5 mycroft * something after the first pass!
187 1.5 mycroft * This is IMPOSSIBLE!
188 1.5 mycroft */
189 1.5 mycroft panic("semu_alloc - second attempt failed");
190 1.5 mycroft }
191 1.1 cgd }
192 1.25 christos return NULL;
193 1.1 cgd }
194 1.1 cgd
195 1.1 cgd /*
196 1.1 cgd * Adjust a particular entry for a particular proc
197 1.1 cgd */
198 1.1 cgd
199 1.1 cgd int
200 1.59 thorpej semundo_adjust(struct proc *p, struct sem_undo **supptr, int semid, int semnum,
201 1.59 thorpej int adjval)
202 1.1 cgd {
203 1.35 augustss struct sem_undo *suptr;
204 1.35 augustss struct undo *sunptr;
205 1.5 mycroft int i;
206 1.1 cgd
207 1.51 enami /*
208 1.51 enami * Look for and remember the sem_undo if the caller doesn't
209 1.51 enami * provide it
210 1.51 enami */
211 1.1 cgd
212 1.5 mycroft suptr = *supptr;
213 1.4 mycroft if (suptr == NULL) {
214 1.52 enami for (suptr = semu_list; suptr != NULL; suptr = suptr->un_next)
215 1.52 enami if (suptr->un_proc == p)
216 1.5 mycroft break;
217 1.52 enami
218 1.5 mycroft if (suptr == NULL) {
219 1.5 mycroft suptr = semu_alloc(p);
220 1.5 mycroft if (suptr == NULL)
221 1.51 enami return (ENOSPC);
222 1.5 mycroft }
223 1.52 enami *supptr = suptr;
224 1.1 cgd }
225 1.1 cgd
226 1.6 mycroft /*
227 1.51 enami * Look for the requested entry and adjust it (delete if
228 1.51 enami * adjval becomes 0).
229 1.6 mycroft */
230 1.6 mycroft sunptr = &suptr->un_ent[0];
231 1.5 mycroft for (i = 0; i < suptr->un_cnt; i++, sunptr++) {
232 1.6 mycroft if (sunptr->un_id != semid || sunptr->un_num != semnum)
233 1.6 mycroft continue;
234 1.52 enami sunptr->un_adjval += adjval;
235 1.6 mycroft if (sunptr->un_adjval == 0) {
236 1.6 mycroft suptr->un_cnt--;
237 1.6 mycroft if (i < suptr->un_cnt)
238 1.6 mycroft suptr->un_ent[i] =
239 1.6 mycroft suptr->un_ent[suptr->un_cnt];
240 1.5 mycroft }
241 1.51 enami return (0);
242 1.1 cgd }
243 1.1 cgd
244 1.5 mycroft /* Didn't find the right entry - create it */
245 1.11 mycroft if (suptr->un_cnt == SEMUME)
246 1.51 enami return (EINVAL);
247 1.11 mycroft
248 1.11 mycroft sunptr = &suptr->un_ent[suptr->un_cnt];
249 1.11 mycroft suptr->un_cnt++;
250 1.11 mycroft sunptr->un_adjval = adjval;
251 1.11 mycroft sunptr->un_id = semid;
252 1.11 mycroft sunptr->un_num = semnum;
253 1.51 enami return (0);
254 1.1 cgd }
255 1.1 cgd
256 1.1 cgd void
257 1.59 thorpej semundo_clear(int semid, int semnum)
258 1.1 cgd {
259 1.35 augustss struct sem_undo *suptr;
260 1.52 enami struct undo *sunptr, *sunend;
261 1.1 cgd
262 1.52 enami for (suptr = semu_list; suptr != NULL; suptr = suptr->un_next)
263 1.52 enami for (sunptr = &suptr->un_ent[0],
264 1.52 enami sunend = sunptr + suptr->un_cnt; sunptr < sunend;) {
265 1.6 mycroft if (sunptr->un_id == semid) {
266 1.6 mycroft if (semnum == -1 || sunptr->un_num == semnum) {
267 1.6 mycroft suptr->un_cnt--;
268 1.52 enami sunend--;
269 1.52 enami if (sunptr != sunend)
270 1.52 enami *sunptr = *sunend;
271 1.52 enami if (semnum != -1)
272 1.52 enami break;
273 1.52 enami else
274 1.52 enami continue;
275 1.6 mycroft }
276 1.6 mycroft }
277 1.52 enami sunptr++;
278 1.6 mycroft }
279 1.1 cgd }
280 1.1 cgd
281 1.1 cgd int
282 1.59 thorpej sys_____semctl13(struct lwp *l, void *v, register_t *retval)
283 1.23 thorpej {
284 1.34 christos struct sys_____semctl13_args /* {
285 1.10 cgd syscallarg(int) semid;
286 1.10 cgd syscallarg(int) semnum;
287 1.10 cgd syscallarg(int) cmd;
288 1.34 christos syscallarg(union __semun *) arg;
289 1.23 thorpej } */ *uap = v;
290 1.33 thorpej struct semid_ds sembuf;
291 1.33 thorpej int cmd, error;
292 1.34 christos void *pass_arg;
293 1.34 christos union __semun karg;
294 1.33 thorpej
295 1.33 thorpej cmd = SCARG(uap, cmd);
296 1.33 thorpej
297 1.33 thorpej switch (cmd) {
298 1.33 thorpej case IPC_SET:
299 1.33 thorpej case IPC_STAT:
300 1.33 thorpej pass_arg = &sembuf;
301 1.33 thorpej break;
302 1.33 thorpej
303 1.33 thorpej case GETALL:
304 1.33 thorpej case SETVAL:
305 1.33 thorpej case SETALL:
306 1.34 christos pass_arg = &karg;
307 1.34 christos break;
308 1.34 christos default:
309 1.34 christos pass_arg = NULL;
310 1.33 thorpej break;
311 1.33 thorpej }
312 1.33 thorpej
313 1.34 christos if (pass_arg) {
314 1.34 christos error = copyin(SCARG(uap, arg), &karg, sizeof(karg));
315 1.33 thorpej if (error)
316 1.34 christos return error;
317 1.34 christos if (cmd == IPC_SET) {
318 1.34 christos error = copyin(karg.buf, &sembuf, sizeof(sembuf));
319 1.34 christos if (error)
320 1.34 christos return (error);
321 1.34 christos }
322 1.33 thorpej }
323 1.33 thorpej
324 1.63 ad error = semctl1(l, SCARG(uap, semid), SCARG(uap, semnum), cmd,
325 1.33 thorpej pass_arg, retval);
326 1.33 thorpej
327 1.33 thorpej if (error == 0 && cmd == IPC_STAT)
328 1.34 christos error = copyout(&sembuf, karg.buf, sizeof(sembuf));
329 1.33 thorpej
330 1.33 thorpej return (error);
331 1.33 thorpej }
332 1.33 thorpej
333 1.33 thorpej int
334 1.63 ad semctl1(struct lwp *l, int semid, int semnum, int cmd, void *v,
335 1.59 thorpej register_t *retval)
336 1.33 thorpej {
337 1.63 ad kauth_cred_t cred = l->l_cred;
338 1.33 thorpej union __semun *arg = v;
339 1.33 thorpej struct semid_ds *sembuf = v, *semaptr;
340 1.33 thorpej int i, error, ix;
341 1.1 cgd
342 1.27 christos SEM_PRINTF(("call to semctl(%d, %d, %d, %p)\n",
343 1.33 thorpej semid, semnum, cmd, v));
344 1.1 cgd
345 1.33 thorpej ix = IPCID_TO_IX(semid);
346 1.49 jdolecek if (ix < 0 || ix >= seminfo.semmni)
347 1.33 thorpej return (EINVAL);
348 1.6 mycroft
349 1.33 thorpej semaptr = &sema[ix];
350 1.6 mycroft if ((semaptr->sem_perm.mode & SEM_ALLOC) == 0 ||
351 1.33 thorpej semaptr->sem_perm._seq != IPCID_TO_SEQ(semid))
352 1.33 thorpej return (EINVAL);
353 1.1 cgd
354 1.6 mycroft switch (cmd) {
355 1.6 mycroft case IPC_RMID:
356 1.33 thorpej if ((error = ipcperm(cred, &semaptr->sem_perm, IPC_M)) != 0)
357 1.33 thorpej return (error);
358 1.61 elad semaptr->sem_perm.cuid = kauth_cred_geteuid(cred);
359 1.61 elad semaptr->sem_perm.uid = kauth_cred_geteuid(cred);
360 1.6 mycroft semtot -= semaptr->sem_nsems;
361 1.33 thorpej for (i = semaptr->_sem_base - sem; i < semtot; i++)
362 1.6 mycroft sem[i] = sem[i + semaptr->sem_nsems];
363 1.6 mycroft for (i = 0; i < seminfo.semmni; i++) {
364 1.6 mycroft if ((sema[i].sem_perm.mode & SEM_ALLOC) &&
365 1.33 thorpej sema[i]._sem_base > semaptr->_sem_base)
366 1.33 thorpej sema[i]._sem_base -= semaptr->sem_nsems;
367 1.6 mycroft }
368 1.6 mycroft semaptr->sem_perm.mode = 0;
369 1.33 thorpej semundo_clear(ix, -1);
370 1.33 thorpej wakeup(semaptr);
371 1.6 mycroft break;
372 1.1 cgd
373 1.6 mycroft case IPC_SET:
374 1.33 thorpej if ((error = ipcperm(cred, &semaptr->sem_perm, IPC_M)))
375 1.33 thorpej return (error);
376 1.64 christos KASSERT(sembuf != NULL);
377 1.33 thorpej semaptr->sem_perm.uid = sembuf->sem_perm.uid;
378 1.33 thorpej semaptr->sem_perm.gid = sembuf->sem_perm.gid;
379 1.6 mycroft semaptr->sem_perm.mode = (semaptr->sem_perm.mode & ~0777) |
380 1.33 thorpej (sembuf->sem_perm.mode & 0777);
381 1.62 kardel semaptr->sem_ctime = time_second;
382 1.6 mycroft break;
383 1.1 cgd
384 1.6 mycroft case IPC_STAT:
385 1.33 thorpej if ((error = ipcperm(cred, &semaptr->sem_perm, IPC_R)))
386 1.33 thorpej return (error);
387 1.64 christos KASSERT(sembuf != NULL);
388 1.33 thorpej memcpy(sembuf, semaptr, sizeof(struct semid_ds));
389 1.6 mycroft break;
390 1.1 cgd
391 1.6 mycroft case GETNCNT:
392 1.33 thorpej if ((error = ipcperm(cred, &semaptr->sem_perm, IPC_R)))
393 1.33 thorpej return (error);
394 1.6 mycroft if (semnum < 0 || semnum >= semaptr->sem_nsems)
395 1.33 thorpej return (EINVAL);
396 1.33 thorpej *retval = semaptr->_sem_base[semnum].semncnt;
397 1.6 mycroft break;
398 1.1 cgd
399 1.6 mycroft case GETPID:
400 1.33 thorpej if ((error = ipcperm(cred, &semaptr->sem_perm, IPC_R)))
401 1.33 thorpej return (error);
402 1.6 mycroft if (semnum < 0 || semnum >= semaptr->sem_nsems)
403 1.33 thorpej return (EINVAL);
404 1.33 thorpej *retval = semaptr->_sem_base[semnum].sempid;
405 1.6 mycroft break;
406 1.1 cgd
407 1.6 mycroft case GETVAL:
408 1.33 thorpej if ((error = ipcperm(cred, &semaptr->sem_perm, IPC_R)))
409 1.33 thorpej return (error);
410 1.6 mycroft if (semnum < 0 || semnum >= semaptr->sem_nsems)
411 1.33 thorpej return (EINVAL);
412 1.33 thorpej *retval = semaptr->_sem_base[semnum].semval;
413 1.6 mycroft break;
414 1.1 cgd
415 1.6 mycroft case GETALL:
416 1.33 thorpej if ((error = ipcperm(cred, &semaptr->sem_perm, IPC_R)))
417 1.33 thorpej return (error);
418 1.60 christos KASSERT(arg != NULL);
419 1.6 mycroft for (i = 0; i < semaptr->sem_nsems; i++) {
420 1.33 thorpej error = copyout(&semaptr->_sem_base[i].semval,
421 1.33 thorpej &arg->array[i], sizeof(arg->array[i]));
422 1.33 thorpej if (error != 0)
423 1.6 mycroft break;
424 1.6 mycroft }
425 1.6 mycroft break;
426 1.1 cgd
427 1.6 mycroft case GETZCNT:
428 1.33 thorpej if ((error = ipcperm(cred, &semaptr->sem_perm, IPC_R)))
429 1.33 thorpej return (error);
430 1.6 mycroft if (semnum < 0 || semnum >= semaptr->sem_nsems)
431 1.33 thorpej return (EINVAL);
432 1.33 thorpej *retval = semaptr->_sem_base[semnum].semzcnt;
433 1.6 mycroft break;
434 1.1 cgd
435 1.6 mycroft case SETVAL:
436 1.33 thorpej if ((error = ipcperm(cred, &semaptr->sem_perm, IPC_W)))
437 1.33 thorpej return (error);
438 1.6 mycroft if (semnum < 0 || semnum >= semaptr->sem_nsems)
439 1.33 thorpej return (EINVAL);
440 1.60 christos KASSERT(arg != NULL);
441 1.33 thorpej semaptr->_sem_base[semnum].semval = arg->val;
442 1.33 thorpej semundo_clear(ix, semnum);
443 1.33 thorpej wakeup(semaptr);
444 1.6 mycroft break;
445 1.1 cgd
446 1.6 mycroft case SETALL:
447 1.33 thorpej if ((error = ipcperm(cred, &semaptr->sem_perm, IPC_W)))
448 1.33 thorpej return (error);
449 1.60 christos KASSERT(arg != NULL);
450 1.6 mycroft for (i = 0; i < semaptr->sem_nsems; i++) {
451 1.33 thorpej error = copyin(&arg->array[i],
452 1.33 thorpej &semaptr->_sem_base[i].semval,
453 1.33 thorpej sizeof(arg->array[i]));
454 1.33 thorpej if (error != 0)
455 1.6 mycroft break;
456 1.6 mycroft }
457 1.33 thorpej semundo_clear(ix, -1);
458 1.33 thorpej wakeup(semaptr);
459 1.6 mycroft break;
460 1.1 cgd
461 1.6 mycroft default:
462 1.33 thorpej return (EINVAL);
463 1.6 mycroft }
464 1.4 mycroft
465 1.33 thorpej return (error);
466 1.1 cgd }
467 1.1 cgd
468 1.1 cgd int
469 1.59 thorpej sys_semget(struct lwp *l, void *v, register_t *retval)
470 1.23 thorpej {
471 1.35 augustss struct sys_semget_args /* {
472 1.10 cgd syscallarg(key_t) key;
473 1.10 cgd syscallarg(int) nsems;
474 1.10 cgd syscallarg(int) semflg;
475 1.23 thorpej } */ *uap = v;
476 1.6 mycroft int semid, eval;
477 1.10 cgd int key = SCARG(uap, key);
478 1.10 cgd int nsems = SCARG(uap, nsems);
479 1.10 cgd int semflg = SCARG(uap, semflg);
480 1.63 ad kauth_cred_t cred = l->l_cred;
481 1.1 cgd
482 1.27 christos SEM_PRINTF(("semget(0x%x, %d, 0%o)\n", key, nsems, semflg));
483 1.1 cgd
484 1.6 mycroft if (key != IPC_PRIVATE) {
485 1.6 mycroft for (semid = 0; semid < seminfo.semmni; semid++) {
486 1.6 mycroft if ((sema[semid].sem_perm.mode & SEM_ALLOC) &&
487 1.33 thorpej sema[semid].sem_perm._key == key)
488 1.6 mycroft break;
489 1.6 mycroft }
490 1.6 mycroft if (semid < seminfo.semmni) {
491 1.27 christos SEM_PRINTF(("found public key\n"));
492 1.7 hpeyerl if ((eval = ipcperm(cred, &sema[semid].sem_perm,
493 1.7 hpeyerl semflg & 0700)))
494 1.51 enami return (eval);
495 1.6 mycroft if (nsems > 0 && sema[semid].sem_nsems < nsems) {
496 1.27 christos SEM_PRINTF(("too small\n"));
497 1.51 enami return (EINVAL);
498 1.6 mycroft }
499 1.6 mycroft if ((semflg & IPC_CREAT) && (semflg & IPC_EXCL)) {
500 1.27 christos SEM_PRINTF(("not exclusive\n"));
501 1.51 enami return (EEXIST);
502 1.6 mycroft }
503 1.6 mycroft goto found;
504 1.6 mycroft }
505 1.6 mycroft }
506 1.6 mycroft
507 1.27 christos SEM_PRINTF(("need to allocate the semid_ds\n"));
508 1.6 mycroft if (key == IPC_PRIVATE || (semflg & IPC_CREAT)) {
509 1.6 mycroft if (nsems <= 0 || nsems > seminfo.semmsl) {
510 1.27 christos SEM_PRINTF(("nsems out of range (0<%d<=%d)\n", nsems,
511 1.27 christos seminfo.semmsl));
512 1.51 enami return (EINVAL);
513 1.6 mycroft }
514 1.6 mycroft if (nsems > seminfo.semmns - semtot) {
515 1.51 enami SEM_PRINTF(("not enough semaphores left "
516 1.51 enami "(need %d, got %d)\n",
517 1.27 christos nsems, seminfo.semmns - semtot));
518 1.51 enami return (ENOSPC);
519 1.6 mycroft }
520 1.6 mycroft for (semid = 0; semid < seminfo.semmni; semid++) {
521 1.6 mycroft if ((sema[semid].sem_perm.mode & SEM_ALLOC) == 0)
522 1.6 mycroft break;
523 1.6 mycroft }
524 1.6 mycroft if (semid == seminfo.semmni) {
525 1.27 christos SEM_PRINTF(("no more semid_ds's available\n"));
526 1.51 enami return (ENOSPC);
527 1.6 mycroft }
528 1.27 christos SEM_PRINTF(("semid %d is available\n", semid));
529 1.33 thorpej sema[semid].sem_perm._key = key;
530 1.61 elad sema[semid].sem_perm.cuid = kauth_cred_geteuid(cred);
531 1.61 elad sema[semid].sem_perm.uid = kauth_cred_geteuid(cred);
532 1.61 elad sema[semid].sem_perm.cgid = kauth_cred_getegid(cred);
533 1.61 elad sema[semid].sem_perm.gid = kauth_cred_getegid(cred);
534 1.6 mycroft sema[semid].sem_perm.mode = (semflg & 0777) | SEM_ALLOC;
535 1.33 thorpej sema[semid].sem_perm._seq =
536 1.33 thorpej (sema[semid].sem_perm._seq + 1) & 0x7fff;
537 1.6 mycroft sema[semid].sem_nsems = nsems;
538 1.6 mycroft sema[semid].sem_otime = 0;
539 1.62 kardel sema[semid].sem_ctime = time_second;
540 1.33 thorpej sema[semid]._sem_base = &sem[semtot];
541 1.6 mycroft semtot += nsems;
542 1.33 thorpej memset(sema[semid]._sem_base, 0,
543 1.51 enami sizeof(sema[semid]._sem_base[0]) * nsems);
544 1.33 thorpej SEM_PRINTF(("sembase = %p, next = %p\n", sema[semid]._sem_base,
545 1.27 christos &sem[semtot]));
546 1.1 cgd } else {
547 1.27 christos SEM_PRINTF(("didn't find it and wasn't asked to create it\n"));
548 1.51 enami return (ENOENT);
549 1.1 cgd }
550 1.1 cgd
551 1.6 mycroft found:
552 1.6 mycroft *retval = IXSEQ_TO_IPCID(semid, sema[semid].sem_perm);
553 1.51 enami return (0);
554 1.1 cgd }
555 1.1 cgd
556 1.57 chs #define SMALL_SOPS 8
557 1.57 chs
558 1.1 cgd int
559 1.59 thorpej sys_semop(struct lwp *l, void *v, register_t *retval)
560 1.23 thorpej {
561 1.35 augustss struct sys_semop_args /* {
562 1.10 cgd syscallarg(int) semid;
563 1.10 cgd syscallarg(struct sembuf *) sops;
564 1.29 kleink syscallarg(size_t) nsops;
565 1.23 thorpej } */ *uap = v;
566 1.45 thorpej struct proc *p = l->l_proc;
567 1.52 enami int semid = SCARG(uap, semid), seq;
568 1.41 jdolecek size_t nsops = SCARG(uap, nsops);
569 1.57 chs struct sembuf small_sops[SMALL_SOPS];
570 1.57 chs struct sembuf *sops;
571 1.35 augustss struct semid_ds *semaptr;
572 1.35 augustss struct sembuf *sopptr = NULL;
573 1.35 augustss struct __sem *semptr = NULL;
574 1.6 mycroft struct sem_undo *suptr = NULL;
575 1.63 ad kauth_cred_t cred = l->l_cred;
576 1.54 enami int i, eval;
577 1.25 christos int do_wakeup, do_undos;
578 1.1 cgd
579 1.58 christos SEM_PRINTF(("call to semop(%d, %p, %zd)\n", semid, SCARG(uap,sops), nsops));
580 1.68.6.1 reinoud restart:
581 1.68.6.1 reinoud if (nsops <= SMALL_SOPS) {
582 1.68.6.1 reinoud sops = small_sops;
583 1.68.6.1 reinoud } else if (nsops <= seminfo.semopm) {
584 1.68.6.1 reinoud KERNEL_LOCK(1, l); /* XXXSMP */
585 1.68.6.1 reinoud sops = kmem_alloc(nsops * sizeof(*sops), KM_SLEEP);
586 1.68.6.1 reinoud KERNEL_UNLOCK_ONE(l); /* XXXSMP */
587 1.68.6.1 reinoud } else {
588 1.68.6.1 reinoud SEM_PRINTF(("too many sops (max=%d, nsops=%zd)\n",
589 1.68.6.1 reinoud seminfo.semopm, nsops));
590 1.68.6.1 reinoud return (E2BIG);
591 1.68.6.1 reinoud }
592 1.68.6.1 reinoud
593 1.68.6.1 reinoud error = copyin(SCARG(uap, sops), sops, nsops * sizeof(sops[0]));
594 1.68.6.1 reinoud if (error) {
595 1.68.6.1 reinoud SEM_PRINTF(("error = %d from copyin(%p, %p, %zd)\n", error,
596 1.68.6.1 reinoud SCARG(uap, sops), &sops, nsops * sizeof(sops[0])));
597 1.68.6.1 reinoud if (sops != small_sops) {
598 1.68.6.1 reinoud KERNEL_LOCK(1, l); /* XXXSMP */
599 1.68.6.1 reinoud kmem_free(sops, nsops * sizeof(*sops));
600 1.68.6.1 reinoud KERNEL_UNLOCK_ONE(l); /* XXXSMP */
601 1.68.6.1 reinoud }
602 1.68.6.1 reinoud return error;
603 1.68.6.1 reinoud }
604 1.68.6.1 reinoud
605 1.68.6.1 reinoud mutex_enter(&semlock);
606 1.68.6.1 reinoud /* In case of reallocation, we will wait for completion */
607 1.68.6.1 reinoud while (__predict_false(sem_realloc_state))
608 1.68.6.1 reinoud cv_wait(&sem_realloc_cv, &semlock);
609 1.1 cgd
610 1.6 mycroft semid = IPCID_TO_IX(semid); /* Convert back to zero origin */
611 1.49 jdolecek if (semid < 0 || semid >= seminfo.semmni)
612 1.51 enami return (EINVAL);
613 1.6 mycroft
614 1.6 mycroft semaptr = &sema[semid];
615 1.52 enami seq = IPCID_TO_SEQ(SCARG(uap, semid));
616 1.11 mycroft if ((semaptr->sem_perm.mode & SEM_ALLOC) == 0 ||
617 1.52 enami semaptr->sem_perm._seq != seq)
618 1.51 enami return (EINVAL);
619 1.6 mycroft
620 1.7 hpeyerl if ((eval = ipcperm(cred, &semaptr->sem_perm, IPC_W))) {
621 1.27 christos SEM_PRINTF(("eval = %d from ipaccess\n", eval));
622 1.51 enami return (eval);
623 1.6 mycroft }
624 1.1 cgd
625 1.57 chs if (nsops <= SMALL_SOPS) {
626 1.57 chs sops = small_sops;
627 1.57 chs } else if (nsops <= seminfo.semopm) {
628 1.57 chs sops = malloc(nsops * sizeof(*sops), M_TEMP, M_WAITOK);
629 1.57 chs } else {
630 1.57 chs SEM_PRINTF(("too many sops (max=%d, nsops=%zd)\n",
631 1.57 chs seminfo.semopm, nsops));
632 1.51 enami return (E2BIG);
633 1.6 mycroft }
634 1.1 cgd
635 1.52 enami for (i = 0; i < nsops; i++)
636 1.57 chs if (sops[i].sem_num >= semaptr->sem_nsems) {
637 1.57 chs eval = EFBIG;
638 1.57 chs goto out;
639 1.57 chs }
640 1.52 enami
641 1.51 enami /*
642 1.6 mycroft * Loop trying to satisfy the vector of requests.
643 1.6 mycroft * If we reach a point where we must wait, any requests already
644 1.6 mycroft * performed are rolled back and we go to sleep until some other
645 1.6 mycroft * process wakes us up. At this point, we start all over again.
646 1.6 mycroft *
647 1.6 mycroft * This ensures that from the perspective of other tasks, a set
648 1.6 mycroft * of requests is atomic (never partially satisfied).
649 1.6 mycroft */
650 1.6 mycroft do_undos = 0;
651 1.1 cgd
652 1.6 mycroft for (;;) {
653 1.6 mycroft do_wakeup = 0;
654 1.1 cgd
655 1.6 mycroft for (i = 0; i < nsops; i++) {
656 1.6 mycroft sopptr = &sops[i];
657 1.33 thorpej semptr = &semaptr->_sem_base[sopptr->sem_num];
658 1.1 cgd
659 1.51 enami SEM_PRINTF(("semop: semaptr=%p, sem_base=%p, "
660 1.51 enami "semptr=%p, sem[%d]=%d : op=%d, flag=%s\n",
661 1.33 thorpej semaptr, semaptr->_sem_base, semptr,
662 1.6 mycroft sopptr->sem_num, semptr->semval, sopptr->sem_op,
663 1.51 enami (sopptr->sem_flg & IPC_NOWAIT) ?
664 1.51 enami "nowait" : "wait"));
665 1.1 cgd
666 1.6 mycroft if (sopptr->sem_op < 0) {
667 1.25 christos if ((int)(semptr->semval +
668 1.51 enami sopptr->sem_op) < 0) {
669 1.51 enami SEM_PRINTF(("semop: "
670 1.51 enami "can't do it now\n"));
671 1.6 mycroft break;
672 1.6 mycroft } else {
673 1.6 mycroft semptr->semval += sopptr->sem_op;
674 1.6 mycroft if (semptr->semval == 0 &&
675 1.6 mycroft semptr->semzcnt > 0)
676 1.6 mycroft do_wakeup = 1;
677 1.6 mycroft }
678 1.6 mycroft if (sopptr->sem_flg & SEM_UNDO)
679 1.6 mycroft do_undos = 1;
680 1.6 mycroft } else if (sopptr->sem_op == 0) {
681 1.6 mycroft if (semptr->semval > 0) {
682 1.27 christos SEM_PRINTF(("semop: not zero now\n"));
683 1.6 mycroft break;
684 1.6 mycroft }
685 1.6 mycroft } else {
686 1.6 mycroft if (semptr->semncnt > 0)
687 1.6 mycroft do_wakeup = 1;
688 1.6 mycroft semptr->semval += sopptr->sem_op;
689 1.6 mycroft if (sopptr->sem_flg & SEM_UNDO)
690 1.6 mycroft do_undos = 1;
691 1.6 mycroft }
692 1.6 mycroft }
693 1.1 cgd
694 1.6 mycroft /*
695 1.6 mycroft * Did we get through the entire vector?
696 1.6 mycroft */
697 1.6 mycroft if (i >= nsops)
698 1.6 mycroft goto done;
699 1.1 cgd
700 1.6 mycroft /*
701 1.6 mycroft * No ... rollback anything that we've already done
702 1.6 mycroft */
703 1.51 enami SEM_PRINTF(("semop: rollback 0 through %d\n", i - 1));
704 1.52 enami while (i-- > 0)
705 1.52 enami semaptr->_sem_base[sops[i].sem_num].semval -=
706 1.52 enami sops[i].sem_op;
707 1.1 cgd
708 1.6 mycroft /*
709 1.6 mycroft * If the request that we couldn't satisfy has the
710 1.6 mycroft * NOWAIT flag set then return with EAGAIN.
711 1.6 mycroft */
712 1.57 chs if (sopptr->sem_flg & IPC_NOWAIT) {
713 1.57 chs eval = EAGAIN;
714 1.57 chs goto out;
715 1.57 chs }
716 1.1 cgd
717 1.6 mycroft if (sopptr->sem_op == 0)
718 1.6 mycroft semptr->semzcnt++;
719 1.6 mycroft else
720 1.6 mycroft semptr->semncnt++;
721 1.1 cgd
722 1.27 christos SEM_PRINTF(("semop: good night!\n"));
723 1.68 christos eval = tsleep((void *)semaptr, (PZERO - 4) | PCATCH,
724 1.6 mycroft "semwait", 0);
725 1.27 christos SEM_PRINTF(("semop: good morning (eval=%d)!\n", eval));
726 1.1 cgd
727 1.6 mycroft /*
728 1.6 mycroft * Make sure that the semaphore still exists
729 1.6 mycroft */
730 1.6 mycroft if ((semaptr->sem_perm.mode & SEM_ALLOC) == 0 ||
731 1.52 enami semaptr->sem_perm._seq != seq) {
732 1.57 chs eval = EIDRM;
733 1.57 chs goto out;
734 1.6 mycroft }
735 1.1 cgd
736 1.6 mycroft /*
737 1.6 mycroft * The semaphore is still alive. Readjust the count of
738 1.6 mycroft * waiting processes.
739 1.6 mycroft */
740 1.51 enami semptr = &semaptr->_sem_base[sopptr->sem_num];
741 1.6 mycroft if (sopptr->sem_op == 0)
742 1.6 mycroft semptr->semzcnt--;
743 1.6 mycroft else
744 1.6 mycroft semptr->semncnt--;
745 1.50 christos /*
746 1.50 christos * Is it really morning, or was our sleep interrupted?
747 1.50 christos * (Delayed check of tsleep() return code because we
748 1.50 christos * need to decrement sem[nz]cnt either way.)
749 1.50 christos */
750 1.57 chs if (eval != 0) {
751 1.57 chs eval = EINTR;
752 1.57 chs goto out;
753 1.57 chs }
754 1.50 christos SEM_PRINTF(("semop: good morning!\n"));
755 1.6 mycroft }
756 1.1 cgd
757 1.6 mycroft done:
758 1.6 mycroft /*
759 1.6 mycroft * Process any SEM_UNDO requests.
760 1.6 mycroft */
761 1.6 mycroft if (do_undos) {
762 1.5 mycroft for (i = 0; i < nsops; i++) {
763 1.6 mycroft /*
764 1.6 mycroft * We only need to deal with SEM_UNDO's for non-zero
765 1.6 mycroft * op's.
766 1.6 mycroft */
767 1.6 mycroft int adjval;
768 1.1 cgd
769 1.6 mycroft if ((sops[i].sem_flg & SEM_UNDO) == 0)
770 1.6 mycroft continue;
771 1.6 mycroft adjval = sops[i].sem_op;
772 1.6 mycroft if (adjval == 0)
773 1.6 mycroft continue;
774 1.6 mycroft eval = semundo_adjust(p, &suptr, semid,
775 1.6 mycroft sops[i].sem_num, -adjval);
776 1.6 mycroft if (eval == 0)
777 1.6 mycroft continue;
778 1.1 cgd
779 1.6 mycroft /*
780 1.6 mycroft * Oh-Oh! We ran out of either sem_undo's or undo's.
781 1.6 mycroft * Rollback the adjustments to this point and then
782 1.6 mycroft * rollback the semaphore ups and down so we can return
783 1.6 mycroft * with an error with all structures restored. We
784 1.6 mycroft * rollback the undo's in the exact reverse order that
785 1.6 mycroft * we applied them. This guarantees that we won't run
786 1.6 mycroft * out of space as we roll things back out.
787 1.6 mycroft */
788 1.52 enami while (i-- > 0) {
789 1.52 enami if ((sops[i].sem_flg & SEM_UNDO) == 0)
790 1.6 mycroft continue;
791 1.52 enami adjval = sops[i].sem_op;
792 1.6 mycroft if (adjval == 0)
793 1.6 mycroft continue;
794 1.6 mycroft if (semundo_adjust(p, &suptr, semid,
795 1.52 enami sops[i].sem_num, adjval) != 0)
796 1.1 cgd panic("semop - can't undo undos");
797 1.6 mycroft }
798 1.1 cgd
799 1.54 enami for (i = 0; i < nsops; i++)
800 1.54 enami semaptr->_sem_base[sops[i].sem_num].semval -=
801 1.54 enami sops[i].sem_op;
802 1.1 cgd
803 1.27 christos SEM_PRINTF(("eval = %d from semundo_adjust\n", eval));
804 1.57 chs goto out;
805 1.1 cgd } /* loop through the sops */
806 1.6 mycroft } /* if (do_undos) */
807 1.1 cgd
808 1.6 mycroft /* We're definitely done - set the sempid's */
809 1.6 mycroft for (i = 0; i < nsops; i++) {
810 1.1 cgd sopptr = &sops[i];
811 1.33 thorpej semptr = &semaptr->_sem_base[sopptr->sem_num];
812 1.1 cgd semptr->sempid = p->p_pid;
813 1.6 mycroft }
814 1.1 cgd
815 1.55 briggs /* Update sem_otime */
816 1.62 kardel semaptr->sem_otime = time_second;
817 1.55 briggs
818 1.6 mycroft /* Do a wakeup if any semaphore was up'd. */
819 1.6 mycroft if (do_wakeup) {
820 1.27 christos SEM_PRINTF(("semop: doing wakeup\n"));
821 1.1 cgd #ifdef SEM_WAKEUP
822 1.68 christos sem_wakeup((void *)semaptr);
823 1.1 cgd #else
824 1.68 christos wakeup((void *)semaptr);
825 1.1 cgd #endif
826 1.27 christos SEM_PRINTF(("semop: back from wakeup\n"));
827 1.6 mycroft }
828 1.27 christos SEM_PRINTF(("semop: done\n"));
829 1.6 mycroft *retval = 0;
830 1.57 chs
831 1.57 chs out:
832 1.57 chs if (sops != small_sops) {
833 1.57 chs free(sops, M_TEMP);
834 1.57 chs }
835 1.57 chs return eval;
836 1.1 cgd }
837 1.1 cgd
838 1.1 cgd /*
839 1.51 enami * Go through the undo structures for this process and apply the
840 1.51 enami * adjustments to semaphores.
841 1.1 cgd */
842 1.44 christos /*ARGSUSED*/
843 1.25 christos void
844 1.66 yamt semexit(struct proc *p, void *v)
845 1.1 cgd {
846 1.35 augustss struct sem_undo *suptr;
847 1.35 augustss struct sem_undo **supptr;
848 1.1 cgd
849 1.6 mycroft /*
850 1.51 enami * Go through the chain of undo vectors looking for one
851 1.51 enami * associated with this process.
852 1.17 mycroft */
853 1.17 mycroft
854 1.17 mycroft for (supptr = &semu_list; (suptr = *supptr) != NULL;
855 1.17 mycroft supptr = &suptr->un_next) {
856 1.17 mycroft if (suptr->un_proc == p)
857 1.17 mycroft break;
858 1.17 mycroft }
859 1.17 mycroft
860 1.17 mycroft /*
861 1.37 sommerfe * If there is no undo vector, skip to the end.
862 1.14 mycroft */
863 1.14 mycroft
864 1.37 sommerfe if (suptr == NULL)
865 1.37 sommerfe return;
866 1.51 enami
867 1.14 mycroft /*
868 1.37 sommerfe * We now have an undo vector for this process.
869 1.15 mycroft */
870 1.1 cgd
871 1.27 christos SEM_PRINTF(("proc @%p has undo structure with %d entries\n", p,
872 1.27 christos suptr->un_cnt));
873 1.1 cgd
874 1.5 mycroft /*
875 1.5 mycroft * If there are any active undo elements then process them.
876 1.5 mycroft */
877 1.5 mycroft if (suptr->un_cnt > 0) {
878 1.6 mycroft int ix;
879 1.1 cgd
880 1.6 mycroft for (ix = 0; ix < suptr->un_cnt; ix++) {
881 1.6 mycroft int semid = suptr->un_ent[ix].un_id;
882 1.6 mycroft int semnum = suptr->un_ent[ix].un_num;
883 1.6 mycroft int adjval = suptr->un_ent[ix].un_adjval;
884 1.6 mycroft struct semid_ds *semaptr;
885 1.6 mycroft
886 1.6 mycroft semaptr = &sema[semid];
887 1.6 mycroft if ((semaptr->sem_perm.mode & SEM_ALLOC) == 0)
888 1.6 mycroft panic("semexit - semid not allocated");
889 1.6 mycroft if (semnum >= semaptr->sem_nsems)
890 1.6 mycroft panic("semexit - semnum out of range");
891 1.6 mycroft
892 1.51 enami SEM_PRINTF(("semexit: %p id=%d num=%d(adj=%d) ; "
893 1.51 enami "sem=%d\n",
894 1.6 mycroft suptr->un_proc, suptr->un_ent[ix].un_id,
895 1.6 mycroft suptr->un_ent[ix].un_num,
896 1.6 mycroft suptr->un_ent[ix].un_adjval,
897 1.33 thorpej semaptr->_sem_base[semnum].semval));
898 1.6 mycroft
899 1.14 mycroft if (adjval < 0 &&
900 1.33 thorpej semaptr->_sem_base[semnum].semval < -adjval)
901 1.33 thorpej semaptr->_sem_base[semnum].semval = 0;
902 1.14 mycroft else
903 1.33 thorpej semaptr->_sem_base[semnum].semval += adjval;
904 1.1 cgd
905 1.1 cgd #ifdef SEM_WAKEUP
906 1.68 christos sem_wakeup((void *)semaptr);
907 1.1 cgd #else
908 1.68 christos wakeup((void *)semaptr);
909 1.1 cgd #endif
910 1.27 christos SEM_PRINTF(("semexit: back from wakeup\n"));
911 1.6 mycroft }
912 1.5 mycroft }
913 1.1 cgd
914 1.5 mycroft /*
915 1.5 mycroft * Deallocate the undo vector.
916 1.5 mycroft */
917 1.27 christos SEM_PRINTF(("removing vector\n"));
918 1.5 mycroft suptr->un_proc = NULL;
919 1.5 mycroft *supptr = suptr->un_next;
920 1.1 cgd }
921