Home | History | Annotate | Line # | Download | only in kern
uipc_sem.c revision 1.13
      1  1.13      cube /*	$NetBSD: uipc_sem.c,v 1.13 2006/03/05 00:49:19 cube Exp $	*/
      2   1.3   thorpej 
      3   1.3   thorpej /*-
      4   1.3   thorpej  * Copyright (c) 2003 The NetBSD Foundation, Inc.
      5   1.3   thorpej  * All rights reserved.
      6   1.3   thorpej  *
      7   1.3   thorpej  * This code is derived from software contributed to The NetBSD Foundation
      8   1.3   thorpej  * by Jason R. Thorpe of Wasabi Systems, Inc.
      9   1.3   thorpej  *
     10   1.3   thorpej  * Redistribution and use in source and binary forms, with or without
     11   1.3   thorpej  * modification, are permitted provided that the following conditions
     12   1.3   thorpej  * are met:
     13   1.3   thorpej  * 1. Redistributions of source code must retain the above copyright
     14   1.3   thorpej  *    notice, this list of conditions and the following disclaimer.
     15   1.3   thorpej  * 2. Redistributions in binary form must reproduce the above copyright
     16   1.3   thorpej  *    notice, this list of conditions and the following disclaimer in the
     17   1.3   thorpej  *    documentation and/or other materials provided with the distribution.
     18   1.3   thorpej  * 3. All advertising materials mentioning features or use of this software
     19   1.3   thorpej  *    must display the following acknowledgement:
     20   1.3   thorpej  *        This product includes software developed by the NetBSD
     21   1.3   thorpej  *        Foundation, Inc. and its contributors.
     22   1.3   thorpej  * 4. Neither the name of The NetBSD Foundation nor the names of its
     23   1.3   thorpej  *    contributors may be used to endorse or promote products derived
     24   1.3   thorpej  *    from this software without specific prior written permission.
     25   1.3   thorpej  *
     26   1.3   thorpej  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     27   1.3   thorpej  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     28   1.3   thorpej  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     29   1.3   thorpej  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     30   1.3   thorpej  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     31   1.3   thorpej  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     32   1.3   thorpej  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     33   1.3   thorpej  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     34   1.3   thorpej  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     35   1.3   thorpej  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     36   1.3   thorpej  * POSSIBILITY OF SUCH DAMAGE.
     37   1.3   thorpej  */
     38   1.1  christos 
     39   1.1  christos /*
     40   1.1  christos  * Copyright (c) 2002 Alfred Perlstein <alfred (at) FreeBSD.org>
     41   1.1  christos  * All rights reserved.
     42   1.1  christos  *
     43   1.1  christos  * Redistribution and use in source and binary forms, with or without
     44   1.1  christos  * modification, are permitted provided that the following conditions
     45   1.1  christos  * are met:
     46   1.1  christos  * 1. Redistributions of source code must retain the above copyright
     47   1.1  christos  *    notice, this list of conditions and the following disclaimer.
     48   1.1  christos  * 2. Redistributions in binary form must reproduce the above copyright
     49   1.1  christos  *    notice, this list of conditions and the following disclaimer in the
     50   1.1  christos  *    documentation and/or other materials provided with the distribution.
     51   1.1  christos  *
     52   1.1  christos  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
     53   1.1  christos  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     54   1.1  christos  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     55   1.1  christos  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
     56   1.1  christos  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     57   1.1  christos  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     58   1.1  christos  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     59   1.1  christos  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     60   1.1  christos  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     61   1.1  christos  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     62   1.1  christos  * SUCH DAMAGE.
     63   1.1  christos  */
     64   1.9     lukem 
     65   1.9     lukem #include <sys/cdefs.h>
     66  1.13      cube __KERNEL_RCSID(0, "$NetBSD: uipc_sem.c,v 1.13 2006/03/05 00:49:19 cube Exp $");
     67   1.1  christos 
     68   1.1  christos #include "opt_posix.h"
     69   1.1  christos 
     70   1.1  christos #include <sys/param.h>
     71   1.1  christos #include <sys/systm.h>
     72   1.1  christos #include <sys/kernel.h>
     73   1.1  christos #include <sys/proc.h>
     74   1.1  christos #include <sys/lock.h>
     75   1.1  christos #include <sys/ksem.h>
     76   1.5      matt #include <sys/sa.h>
     77   1.1  christos #include <sys/syscall.h>
     78   1.1  christos #include <sys/stat.h>
     79   1.1  christos #include <sys/malloc.h>
     80   1.1  christos #include <sys/fcntl.h>
     81   1.1  christos 
     82   1.1  christos #include <sys/mount.h>
     83   1.1  christos 
     84   1.1  christos #include <sys/syscallargs.h>
     85   1.1  christos 
/* Ceiling on the number of semaphores counted by nsems; overridable. */
#ifndef SEM_MAX
#define SEM_MAX	30
#endif

/* Longest accepted name, measured with strlen() (NUL not included). */
#define SEM_MAX_NAMELEN	14
/* Largest counter value; posting at this value reports EOVERFLOW. */
#define SEM_VALUE_MAX (~0U)
/* Number of buckets in the ksem_hash table. */
#define SEM_HASHTBL_SIZE 13

/* Identifier reported to the caller for a given ksem. */
#define SEM_TO_ID(x)	((x)->ks_id)
/* Bucket index in ksem_hash for a semaphore identifier. */
#define SEM_HASH(id)	((id) % SEM_HASHTBL_SIZE)
     96   1.4   thorpej 
     97   1.4   thorpej MALLOC_DEFINE(M_SEM, "p1003_1b_sem", "p1003_1b semaphores");
     98   1.1  christos 
     99   1.3   thorpej /*
    100   1.3   thorpej  * Note: to read the ks_name member, you need either the ks_interlock
    101   1.3   thorpej  * or the ksem_slock.  To write the ks_name member, you need both.  Make
    102   1.3   thorpej  * sure the order is ksem_slock -> ks_interlock.
    103   1.3   thorpej  */
    104   1.1  christos struct ksem {
    105   1.1  christos 	LIST_ENTRY(ksem) ks_entry;	/* global list entry */
    106  1.13      cube 	LIST_ENTRY(ksem) ks_hash;	/* hash list entry */
    107   1.3   thorpej 	struct simplelock ks_interlock;	/* lock on this ksem */
    108   1.1  christos 	char *ks_name;			/* if named, this is the name */
    109   1.3   thorpej 	unsigned int ks_ref;		/* number of references */
    110   1.1  christos 	mode_t ks_mode;			/* protection bits */
    111   1.1  christos 	uid_t ks_uid;			/* creator uid */
    112   1.1  christos 	gid_t ks_gid;			/* creator gid */
    113   1.1  christos 	unsigned int ks_value;		/* current value */
    114   1.3   thorpej 	unsigned int ks_waiters;	/* number of waiters */
    115  1.13      cube 	semid_t ks_id;			/* unique identifier */
    116   1.3   thorpej };
    117   1.3   thorpej 
    118   1.3   thorpej struct ksem_ref {
    119   1.3   thorpej 	LIST_ENTRY(ksem_ref) ksr_list;
    120   1.3   thorpej 	struct ksem *ksr_ksem;
    121   1.3   thorpej };
    122   1.3   thorpej 
    123   1.3   thorpej struct ksem_proc {
    124   1.3   thorpej 	struct lock kp_lock;
    125   1.3   thorpej 	LIST_HEAD(, ksem_ref) kp_ksems;
    126   1.1  christos };
    127   1.1  christos 
    128  1.13      cube LIST_HEAD(ksem_list, ksem);
    129  1.13      cube 
    130   1.1  christos /*
    131   1.3   thorpej  * ksem_slock protects ksem_head and nsems.  Only named semaphores go
    132   1.3   thorpej  * onto ksem_head.
    133   1.1  christos  */
    134   1.1  christos static struct simplelock ksem_slock;
    135  1.13      cube static struct ksem_list ksem_head = LIST_HEAD_INITIALIZER(&ksem_head);
    136  1.13      cube static struct ksem_list ksem_hash[SEM_HASHTBL_SIZE];
    137   1.3   thorpej static int nsems = 0;
    138   1.1  christos 
    139  1.13      cube /*
    140  1.13      cube  * ksem_counter is the last assigned semid_t.  It needs to be COMPAT_NETBSD32
    141  1.13      cube  * friendly, even though semid_t itself is defined as uintptr_t.
    142  1.13      cube  */
    143  1.13      cube static uint32_t ksem_counter = 1;
    144  1.13      cube 
    145  1.13      cube 
    146   1.3   thorpej static void
    147   1.3   thorpej ksem_free(struct ksem *ks)
    148   1.3   thorpej {
    149   1.1  christos 
    150   1.3   thorpej 	LOCK_ASSERT(simple_lock_held(&ks->ks_interlock));
    151   1.3   thorpej 	/*
    152   1.3   thorpej 	 * If the ksem is anonymous (or has been unlinked), then
    153   1.3   thorpej 	 * this is the end if its life.
    154   1.3   thorpej 	 */
    155   1.3   thorpej 	if (ks->ks_name == NULL) {
    156   1.3   thorpej 		simple_unlock(&ks->ks_interlock);
    157   1.1  christos 
    158   1.3   thorpej 		simple_lock(&ksem_slock);
    159   1.3   thorpej 		nsems--;
    160  1.13      cube 		LIST_REMOVE(ks, ks_hash);
    161   1.3   thorpej 		simple_unlock(&ksem_slock);
    162  1.13      cube 
    163  1.13      cube 		free(ks, M_SEM);
    164   1.3   thorpej 		return;
    165   1.3   thorpej 	}
    166   1.3   thorpej 	simple_unlock(&ks->ks_interlock);
    167   1.3   thorpej }
    168   1.1  christos 
    169  1.12     perry static inline void
    170   1.3   thorpej ksem_addref(struct ksem *ks)
    171   1.1  christos {
    172   1.1  christos 
    173   1.3   thorpej 	LOCK_ASSERT(simple_lock_held(&ks->ks_interlock));
    174   1.1  christos 	ks->ks_ref++;
    175   1.3   thorpej 	KASSERT(ks->ks_ref != 0);	/* XXX KDASSERT */
    176   1.1  christos }
    177   1.1  christos 
    178  1.12     perry static inline void
    179   1.3   thorpej ksem_delref(struct ksem *ks)
    180   1.1  christos {
    181   1.1  christos 
    182   1.3   thorpej 	LOCK_ASSERT(simple_lock_held(&ks->ks_interlock));
    183   1.3   thorpej 	KASSERT(ks->ks_ref != 0);	/* XXX KDASSERT */
    184   1.3   thorpej 	if (--ks->ks_ref == 0) {
    185   1.1  christos 		ksem_free(ks);
    186   1.3   thorpej 		return;
    187   1.3   thorpej 	}
    188   1.3   thorpej 	simple_unlock(&ks->ks_interlock);
    189   1.3   thorpej }
    190   1.3   thorpej 
    191   1.3   thorpej static struct ksem_proc *
    192   1.3   thorpej ksem_proc_alloc(void)
    193   1.3   thorpej {
    194   1.3   thorpej 	struct ksem_proc *kp;
    195   1.3   thorpej 
    196   1.3   thorpej 	kp = malloc(sizeof(*kp), M_SEM, M_WAITOK);
    197   1.3   thorpej 	lockinit(&kp->kp_lock, PWAIT, "ksproc", 0, 0);
    198   1.3   thorpej 	LIST_INIT(&kp->kp_ksems);
    199   1.3   thorpej 
    200   1.3   thorpej 	return (kp);
    201   1.1  christos }
    202   1.1  christos 
    203   1.3   thorpej static void
    204   1.3   thorpej ksem_add_proc(struct proc *p, struct ksem *ks)
    205   1.3   thorpej {
    206   1.3   thorpej 	struct ksem_proc *kp;
    207   1.3   thorpej 	struct ksem_ref *ksr;
    208   1.3   thorpej 
    209   1.3   thorpej 	if (p->p_ksems == NULL) {
    210   1.3   thorpej 		kp = ksem_proc_alloc();
    211   1.3   thorpej 		p->p_ksems = kp;
    212   1.3   thorpej 	} else
    213   1.3   thorpej 		kp = p->p_ksems;
    214   1.3   thorpej 
    215   1.3   thorpej 	ksr = malloc(sizeof(*ksr), M_SEM, M_WAITOK);
    216   1.3   thorpej 	ksr->ksr_ksem = ks;
    217   1.3   thorpej 
    218   1.3   thorpej 	lockmgr(&kp->kp_lock, LK_EXCLUSIVE, NULL);
    219   1.3   thorpej 	LIST_INSERT_HEAD(&kp->kp_ksems, ksr, ksr_list);
    220   1.3   thorpej 	lockmgr(&kp->kp_lock, LK_RELEASE, NULL);
    221   1.3   thorpej }
    222   1.3   thorpej 
    223   1.3   thorpej /* We MUST have a write lock on the ksem_proc list! */
    224   1.3   thorpej static struct ksem_ref *
    225   1.3   thorpej ksem_drop_proc(struct ksem_proc *kp, struct ksem *ks)
    226   1.1  christos {
    227   1.3   thorpej 	struct ksem_ref *ksr;
    228   1.1  christos 
    229   1.3   thorpej 	LOCK_ASSERT(simple_lock_held(&ks->ks_interlock));
    230   1.3   thorpej 	LIST_FOREACH(ksr, &kp->kp_ksems, ksr_list) {
    231   1.3   thorpej 		if (ksr->ksr_ksem == ks) {
    232   1.3   thorpej 			ksem_delref(ks);
    233   1.3   thorpej 			LIST_REMOVE(ksr, ksr_list);
    234   1.3   thorpej 			return (ksr);
    235   1.3   thorpej 		}
    236   1.1  christos 	}
    237   1.3   thorpej #ifdef DIAGNOSTIC
    238   1.3   thorpej 	panic("ksem_drop_proc: ksem_proc %p ksem %p", kp, ks);
    239   1.3   thorpej #endif
    240   1.1  christos 	return (NULL);
    241   1.1  christos }
    242   1.1  christos 
    243   1.3   thorpej static int
    244   1.3   thorpej ksem_perm(struct proc *p, struct ksem *ks)
    245   1.3   thorpej {
    246   1.3   thorpej 	struct ucred *uc;
    247   1.3   thorpej 
    248   1.3   thorpej 	LOCK_ASSERT(simple_lock_held(&ks->ks_interlock));
    249   1.3   thorpej 	uc = p->p_ucred;
    250   1.3   thorpej 	if ((uc->cr_uid == ks->ks_uid && (ks->ks_mode & S_IWUSR) != 0) ||
    251   1.3   thorpej 	    (uc->cr_gid == ks->ks_gid && (ks->ks_mode & S_IWGRP) != 0) ||
    252   1.3   thorpej 	    (ks->ks_mode & S_IWOTH) != 0 || suser(uc, &p->p_acflag) == 0)
    253   1.3   thorpej 		return (0);
    254   1.3   thorpej 	return (EPERM);
    255   1.3   thorpej }
    256   1.3   thorpej 
    257   1.1  christos static struct ksem *
    258  1.13      cube ksem_lookup_byid(semid_t id)
    259  1.13      cube {
    260  1.13      cube 	struct ksem *ks;
    261  1.13      cube 
    262  1.13      cube 	LOCK_ASSERT(simple_lock_held(&ksem_slock));
    263  1.13      cube 	LIST_FOREACH(ks, &ksem_hash[SEM_HASH(id)], ks_hash) {
    264  1.13      cube 		if (ks->ks_id == id)
    265  1.13      cube 			return ks;
    266  1.13      cube 	}
    267  1.13      cube 	return NULL;
    268  1.13      cube }
    269  1.13      cube 
    270  1.13      cube static struct ksem *
    271   1.3   thorpej ksem_lookup_byname(const char *name)
    272   1.1  christos {
    273   1.1  christos 	struct ksem *ks;
    274   1.1  christos 
    275   1.3   thorpej 	LOCK_ASSERT(simple_lock_held(&ksem_slock));
    276   1.3   thorpej 	LIST_FOREACH(ks, &ksem_head, ks_entry) {
    277   1.3   thorpej 		if (strcmp(ks->ks_name, name) == 0) {
    278   1.3   thorpej 			simple_lock(&ks->ks_interlock);
    279   1.1  christos 			return (ks);
    280   1.3   thorpej 		}
    281   1.3   thorpej 	}
    282   1.1  christos 	return (NULL);
    283   1.1  christos }
    284   1.1  christos 
    285   1.1  christos static int
    286   1.3   thorpej ksem_create(struct proc *p, const char *name, struct ksem **ksret,
    287   1.3   thorpej     mode_t mode, unsigned int value)
    288   1.1  christos {
    289   1.1  christos 	struct ksem *ret;
    290   1.1  christos 	struct ucred *uc;
    291   1.1  christos 	size_t len;
    292   1.1  christos 
    293   1.1  christos 	uc = p->p_ucred;
    294   1.1  christos 	if (value > SEM_VALUE_MAX)
    295   1.1  christos 		return (EINVAL);
    296   1.1  christos 	ret = malloc(sizeof(*ret), M_SEM, M_WAITOK | M_ZERO);
    297   1.1  christos 	if (name != NULL) {
    298   1.1  christos 		len = strlen(name);
    299   1.1  christos 		if (len > SEM_MAX_NAMELEN) {
    300   1.1  christos 			free(ret, M_SEM);
    301   1.1  christos 			return (ENAMETOOLONG);
    302   1.1  christos 		}
    303   1.1  christos 		/* name must start with a '/' but not contain one. */
    304   1.1  christos 		if (*name != '/' || len < 2 || strchr(name + 1, '/') != NULL) {
    305   1.1  christos 			free(ret, M_SEM);
    306   1.1  christos 			return (EINVAL);
    307   1.1  christos 		}
    308   1.1  christos 		ret->ks_name = malloc(len + 1, M_SEM, M_WAITOK);
    309   1.6    itojun 		strlcpy(ret->ks_name, name, len + 1);
    310   1.3   thorpej 	} else
    311   1.1  christos 		ret->ks_name = NULL;
    312   1.1  christos 	ret->ks_mode = mode;
    313   1.1  christos 	ret->ks_value = value;
    314   1.1  christos 	ret->ks_ref = 1;
    315   1.1  christos 	ret->ks_waiters = 0;
    316   1.1  christos 	ret->ks_uid = uc->cr_uid;
    317   1.1  christos 	ret->ks_gid = uc->cr_gid;
    318   1.3   thorpej 	simple_lock_init(&ret->ks_interlock);
    319   1.3   thorpej 
    320   1.1  christos 	simple_lock(&ksem_slock);
    321   1.1  christos 	if (nsems >= SEM_MAX) {
    322   1.3   thorpej 		simple_unlock(&ksem_slock);
    323   1.3   thorpej 		if (ret->ks_name != NULL)
    324   1.3   thorpej 			free(ret->ks_name, M_SEM);
    325   1.3   thorpej 		free(ret, M_SEM);
    326   1.3   thorpej 		return (ENFILE);
    327   1.1  christos 	}
    328   1.3   thorpej 	nsems++;
    329  1.13      cube 	while (ksem_lookup_byid(ksem_counter) != NULL) {
    330  1.13      cube 		ksem_counter++;
    331  1.13      cube 		/* 0 is a special value for libpthread */
    332  1.13      cube 		if (ksem_counter == 0)
    333  1.13      cube 			ksem_counter++;
    334  1.13      cube 	}
    335  1.13      cube 	ret->ks_id = ksem_counter;
    336  1.13      cube 	LIST_INSERT_HEAD(&ksem_hash[SEM_HASH(ret->ks_id)], ret, ks_hash);
    337   1.1  christos 	simple_unlock(&ksem_slock);
    338   1.3   thorpej 
    339   1.3   thorpej 	*ksret = ret;
    340   1.3   thorpej 	return (0);
    341   1.1  christos }
    342   1.1  christos 
    343   1.1  christos int
    344   1.2  christos sys__ksem_init(struct lwp *l, void *v, register_t *retval)
    345   1.1  christos {
    346   1.2  christos 	struct sys__ksem_init_args /* {
    347   1.1  christos 		unsigned int value;
    348   1.1  christos 		semid_t *idp;
    349   1.1  christos 	} */ *uap = v;
    350  1.13      cube 
    351  1.13      cube 	return do_ksem_init(l, SCARG(uap, value), SCARG(uap, idp), copyout);
    352  1.13      cube }
    353  1.13      cube 
    354  1.13      cube int
    355  1.13      cube do_ksem_init(struct lwp *l, unsigned int value, semid_t *idp,
    356  1.13      cube     copyout_t docopyout)
    357  1.13      cube {
    358   1.1  christos 	struct ksem *ks;
    359   1.1  christos 	semid_t id;
    360   1.1  christos 	int error;
    361   1.1  christos 
    362   1.3   thorpej 	/* Note the mode does not matter for anonymous semaphores. */
    363  1.13      cube 	error = ksem_create(l->l_proc, NULL, &ks, 0, value);
    364   1.1  christos 	if (error)
    365   1.1  christos 		return (error);
    366   1.1  christos 	id = SEM_TO_ID(ks);
    367  1.13      cube 	error = (*docopyout)(&id, idp, sizeof(id));
    368   1.1  christos 	if (error) {
    369   1.3   thorpej 		simple_lock(&ks->ks_interlock);
    370   1.3   thorpej 		ksem_delref(ks);
    371   1.1  christos 		return (error);
    372   1.1  christos 	}
    373   1.3   thorpej 
    374   1.3   thorpej 	ksem_add_proc(l->l_proc, ks);
    375   1.3   thorpej 
    376   1.3   thorpej 	return (0);
    377   1.1  christos }
    378   1.1  christos 
    379   1.1  christos int
    380   1.2  christos sys__ksem_open(struct lwp *l, void *v, register_t *retval)
    381   1.1  christos {
    382   1.2  christos 	struct sys__ksem_open_args /* {
    383   1.1  christos 		const char *name;
    384   1.1  christos 		int oflag;
    385   1.1  christos 		mode_t mode;
    386   1.1  christos 		unsigned int value;
    387  1.10     perry 		semid_t *idp;
    388   1.1  christos 	} */ *uap = v;
    389  1.13      cube 
    390  1.13      cube 	return do_ksem_open(l, SCARG(uap, name), SCARG(uap, oflag),
    391  1.13      cube 	    SCARG(uap, mode), SCARG(uap, value), SCARG(uap, idp), copyout);
    392  1.13      cube }
    393  1.13      cube 
    394  1.13      cube int
    395  1.13      cube do_ksem_open(struct lwp *l, const char *semname, int oflag, mode_t mode,
    396  1.13      cube      unsigned int value, semid_t *idp, copyout_t docopyout)
    397  1.13      cube {
    398   1.1  christos 	char name[SEM_MAX_NAMELEN + 1];
    399   1.1  christos 	size_t done;
    400   1.1  christos 	int error;
    401   1.1  christos 	struct ksem *ksnew, *ks;
    402   1.1  christos 	semid_t id;
    403   1.1  christos 
    404  1.13      cube 	error = copyinstr(semname, name, sizeof(name), &done);
    405   1.1  christos 	if (error)
    406   1.1  christos 		return (error);
    407   1.1  christos 
    408   1.1  christos 	ksnew = NULL;
    409   1.1  christos 	simple_lock(&ksem_slock);
    410   1.1  christos 	ks = ksem_lookup_byname(name);
    411   1.3   thorpej 
    412   1.3   thorpej 	/* Found one? */
    413   1.3   thorpej 	if (ks != NULL) {
    414   1.3   thorpej 		/* Check for exclusive create. */
    415  1.13      cube 		if (oflag & O_EXCL) {
    416   1.3   thorpej 			simple_unlock(&ks->ks_interlock);
    417   1.1  christos 			simple_unlock(&ksem_slock);
    418   1.3   thorpej 			return (EEXIST);
    419   1.1  christos 		}
    420   1.3   thorpej  found_one:
    421   1.1  christos 		/*
    422   1.3   thorpej 		 * Verify permissions.  If we can access it, add
    423   1.3   thorpej 		 * this process's reference.
    424   1.1  christos 		 */
    425   1.3   thorpej 		LOCK_ASSERT(simple_lock_held(&ks->ks_interlock));
    426   1.1  christos 		error = ksem_perm(l->l_proc, ks);
    427   1.3   thorpej 		if (error == 0)
    428   1.3   thorpej 			ksem_addref(ks);
    429   1.3   thorpej 		simple_unlock(&ks->ks_interlock);
    430   1.1  christos 		simple_unlock(&ksem_slock);
    431   1.1  christos 		if (error)
    432   1.1  christos 			return (error);
    433   1.3   thorpej 
    434   1.1  christos 		id = SEM_TO_ID(ks);
    435  1.13      cube 		error = (*docopyout)(&id, idp, sizeof(id));
    436   1.1  christos 		if (error) {
    437   1.3   thorpej 			simple_lock(&ks->ks_interlock);
    438   1.3   thorpej 			ksem_delref(ks);
    439   1.1  christos 			return (error);
    440   1.1  christos 		}
    441   1.3   thorpej 
    442   1.3   thorpej 		ksem_add_proc(l->l_proc, ks);
    443   1.3   thorpej 
    444   1.3   thorpej 		return (0);
    445   1.3   thorpej 	}
    446   1.3   thorpej 
    447   1.3   thorpej 	/*
    448   1.3   thorpej 	 * didn't ask for creation? error.
    449   1.3   thorpej 	 */
    450  1.13      cube 	if ((oflag & O_CREAT) == 0) {
    451   1.1  christos 		simple_unlock(&ksem_slock);
    452   1.3   thorpej 		return (ENOENT);
    453   1.1  christos 	}
    454   1.1  christos 
    455   1.3   thorpej 	/*
    456   1.3   thorpej 	 * We may block during creation, so drop the lock.
    457   1.3   thorpej 	 */
    458   1.3   thorpej 	simple_unlock(&ksem_slock);
    459  1.13      cube 	error = ksem_create(l->l_proc, name, &ksnew, mode, value);
    460   1.3   thorpej 	if (error != 0)
    461   1.3   thorpej 		return (error);
    462   1.3   thorpej 
    463   1.3   thorpej 	id = SEM_TO_ID(ksnew);
    464  1.13      cube 	error = (*docopyout)(&id, idp, sizeof(id));
    465   1.3   thorpej 	if (error) {
    466   1.3   thorpej 		free(ksnew->ks_name, M_SEM);
    467   1.3   thorpej 		ksnew->ks_name = NULL;
    468   1.1  christos 
    469   1.3   thorpej 		simple_lock(&ksnew->ks_interlock);
    470   1.3   thorpej 		ksem_delref(ksnew);
    471   1.3   thorpej 		return (error);
    472   1.3   thorpej 	}
    473   1.1  christos 
    474   1.3   thorpej 	/*
    475   1.3   thorpej 	 * We need to make sure we haven't lost a race while
    476   1.3   thorpej 	 * allocating during creation.
    477   1.3   thorpej 	 */
    478   1.3   thorpej 	simple_lock(&ksem_slock);
    479   1.3   thorpej 	if ((ks = ksem_lookup_byname(name)) != NULL) {
    480  1.13      cube 		if (oflag & O_EXCL) {
    481   1.3   thorpej 			simple_unlock(&ks->ks_interlock);
    482   1.3   thorpej 			simple_unlock(&ksem_slock);
    483   1.1  christos 
    484   1.3   thorpej 			free(ksnew->ks_name, M_SEM);
    485   1.3   thorpej 			ksnew->ks_name = NULL;
    486   1.1  christos 
    487   1.3   thorpej 			simple_lock(&ksnew->ks_interlock);
    488   1.3   thorpej 			ksem_delref(ksnew);
    489   1.3   thorpej 			return (EEXIST);
    490   1.3   thorpej 		}
    491   1.3   thorpej 		goto found_one;
    492   1.3   thorpej 	} else {
    493   1.3   thorpej 		/* ksnew already has its initial reference. */
    494  1.10     perry 		LIST_INSERT_HEAD(&ksem_head, ksnew, ks_entry);
    495   1.3   thorpej 		simple_unlock(&ksem_slock);
    496   1.1  christos 
    497   1.3   thorpej 		ksem_add_proc(l->l_proc, ksnew);
    498   1.1  christos 	}
    499   1.3   thorpej 	return (error);
    500   1.1  christos }
    501   1.1  christos 
    502   1.3   thorpej /* We must have a read lock on the ksem_proc list! */
    503   1.3   thorpej static struct ksem *
    504   1.3   thorpej ksem_lookup_proc(struct ksem_proc *kp, semid_t id)
    505   1.1  christos {
    506   1.3   thorpej 	struct ksem_ref *ksr;
    507   1.1  christos 
    508   1.3   thorpej 	LIST_FOREACH(ksr, &kp->kp_ksems, ksr_list) {
    509  1.13      cube 		if (id == SEM_TO_ID(ksr->ksr_ksem)) {
    510   1.3   thorpej 			simple_lock(&ksr->ksr_ksem->ks_interlock);
    511   1.3   thorpej 			return (ksr->ksr_ksem);
    512   1.3   thorpej 		}
    513   1.1  christos 	}
    514   1.3   thorpej 
    515   1.3   thorpej 	return (NULL);
    516   1.1  christos }
    517   1.1  christos 
    518   1.1  christos int
    519   1.2  christos sys__ksem_unlink(struct lwp *l, void *v, register_t *retval)
    520   1.1  christos {
    521   1.2  christos 	struct sys__ksem_unlink_args /* {
    522   1.1  christos 		const char *name;
    523   1.1  christos 	} */ *uap = v;
    524   1.3   thorpej 	char name[SEM_MAX_NAMELEN + 1], *cp;
    525   1.1  christos 	size_t done;
    526   1.1  christos 	struct ksem *ks;
    527   1.1  christos 	int error;
    528   1.1  christos 
    529   1.1  christos 	error = copyinstr(SCARG(uap, name), name, sizeof(name), &done);
    530   1.1  christos 	if (error)
    531   1.1  christos 		return error;
    532   1.1  christos 
    533   1.1  christos 	simple_lock(&ksem_slock);
    534   1.1  christos 	ks = ksem_lookup_byname(name);
    535   1.3   thorpej 	if (ks == NULL) {
    536   1.3   thorpej 		simple_unlock(&ksem_slock);
    537   1.3   thorpej 		return (ENOENT);
    538   1.1  christos 	}
    539   1.3   thorpej 
    540   1.3   thorpej 	LOCK_ASSERT(simple_lock_held(&ks->ks_interlock));
    541   1.3   thorpej 
    542   1.3   thorpej 	LIST_REMOVE(ks, ks_entry);
    543   1.3   thorpej 	cp = ks->ks_name;
    544   1.3   thorpej 	ks->ks_name = NULL;
    545   1.3   thorpej 
    546   1.1  christos 	simple_unlock(&ksem_slock);
    547   1.3   thorpej 
    548   1.3   thorpej 	if (ks->ks_ref == 0)
    549   1.3   thorpej 		ksem_free(ks);
    550   1.3   thorpej 	else
    551   1.3   thorpej 		simple_unlock(&ks->ks_interlock);
    552   1.3   thorpej 
    553   1.3   thorpej 	free(cp, M_SEM);
    554   1.3   thorpej 
    555   1.3   thorpej 	return (0);
    556   1.1  christos }
    557   1.1  christos 
    558   1.1  christos int
    559   1.2  christos sys__ksem_close(struct lwp *l, void *v, register_t *retval)
    560   1.1  christos {
    561   1.2  christos 	struct sys__ksem_close_args /* {
    562   1.1  christos 		semid_t id;
    563   1.1  christos 	} */ *uap = v;
    564   1.3   thorpej 	struct ksem_proc *kp;
    565   1.3   thorpej 	struct ksem_ref *ksr;
    566   1.1  christos 	struct ksem *ks;
    567   1.1  christos 
    568   1.3   thorpej 	if ((kp = l->l_proc->p_ksems) == NULL)
    569   1.3   thorpej 		return (EINVAL);
    570   1.3   thorpej 
    571   1.3   thorpej 	lockmgr(&kp->kp_lock, LK_EXCLUSIVE, NULL);
    572   1.3   thorpej 
    573   1.3   thorpej 	ks = ksem_lookup_proc(kp, SCARG(uap, id));
    574   1.3   thorpej 	if (ks == NULL) {
    575   1.3   thorpej 		lockmgr(&kp->kp_lock, LK_RELEASE, NULL);
    576   1.3   thorpej 		return (EINVAL);
    577   1.3   thorpej 	}
    578   1.3   thorpej 
    579   1.3   thorpej 	LOCK_ASSERT(simple_lock_held(&ks->ks_interlock));
    580   1.3   thorpej 	if (ks->ks_name == NULL) {
    581   1.3   thorpej 		simple_unlock(&ks->ks_interlock);
    582   1.3   thorpej 		lockmgr(&kp->kp_lock, LK_RELEASE, NULL);
    583   1.3   thorpej 		return (EINVAL);
    584   1.3   thorpej 	}
    585   1.3   thorpej 
    586   1.3   thorpej 	ksr = ksem_drop_proc(kp, ks);
    587   1.3   thorpej 	lockmgr(&kp->kp_lock, LK_RELEASE, NULL);
    588   1.3   thorpej 	free(ksr, M_SEM);
    589   1.3   thorpej 
    590   1.3   thorpej 	return (0);
    591   1.1  christos }
    592   1.1  christos 
    593   1.1  christos int
    594   1.2  christos sys__ksem_post(struct lwp *l, void *v, register_t *retval)
    595   1.1  christos {
    596   1.2  christos 	struct sys__ksem_post_args /* {
    597   1.1  christos 		semid_t id;
    598   1.1  christos 	} */ *uap = v;
    599   1.3   thorpej 	struct ksem_proc *kp;
    600   1.1  christos 	struct ksem *ks;
    601   1.1  christos 	int error;
    602   1.1  christos 
    603   1.3   thorpej 	if ((kp = l->l_proc->p_ksems) == NULL)
    604   1.3   thorpej 		return (EINVAL);
    605   1.3   thorpej 
    606   1.3   thorpej 	lockmgr(&kp->kp_lock, LK_SHARED, NULL);
    607   1.3   thorpej 	ks = ksem_lookup_proc(kp, SCARG(uap, id));
    608   1.3   thorpej 	lockmgr(&kp->kp_lock, LK_RELEASE, NULL);
    609   1.3   thorpej 	if (ks == NULL)
    610   1.3   thorpej 		return (EINVAL);
    611   1.3   thorpej 
    612   1.3   thorpej 	LOCK_ASSERT(simple_lock_held(&ks->ks_interlock));
    613   1.1  christos 	if (ks->ks_value == SEM_VALUE_MAX) {
    614   1.1  christos 		error = EOVERFLOW;
    615   1.3   thorpej 		goto out;
    616   1.1  christos 	}
    617   1.1  christos 	++ks->ks_value;
    618   1.3   thorpej 	if (ks->ks_waiters)
    619   1.1  christos 		wakeup(ks);
    620   1.1  christos 	error = 0;
    621   1.3   thorpej  out:
    622   1.3   thorpej 	simple_unlock(&ks->ks_interlock);
    623   1.3   thorpej 	return (error);
    624   1.3   thorpej }
    625   1.3   thorpej 
    626   1.3   thorpej static int
    627   1.3   thorpej ksem_wait(struct lwp *l, semid_t id, int tryflag)
    628   1.3   thorpej {
    629   1.3   thorpej 	struct ksem_proc *kp;
    630   1.3   thorpej 	struct ksem *ks;
    631   1.3   thorpej 	int error;
    632   1.3   thorpej 
    633   1.3   thorpej 	if ((kp = l->l_proc->p_ksems) == NULL)
    634   1.3   thorpej 		return (EINVAL);
    635   1.3   thorpej 
    636   1.3   thorpej 	lockmgr(&kp->kp_lock, LK_SHARED, NULL);
    637   1.3   thorpej 	ks = ksem_lookup_proc(kp, id);
    638   1.3   thorpej 	lockmgr(&kp->kp_lock, LK_RELEASE, NULL);
    639   1.3   thorpej 	if (ks == NULL)
    640   1.3   thorpej 		return (EINVAL);
    641   1.3   thorpej 
    642   1.3   thorpej 	LOCK_ASSERT(simple_lock_held(&ks->ks_interlock));
    643   1.3   thorpej 	ksem_addref(ks);
    644   1.3   thorpej 	while (ks->ks_value == 0) {
    645   1.3   thorpej 		ks->ks_waiters++;
    646  1.10     perry 		error = tryflag ? EAGAIN : ltsleep(ks, PCATCH, "psem", 0,
    647   1.3   thorpej 		    &ks->ks_interlock);
    648   1.3   thorpej 		ks->ks_waiters--;
    649   1.3   thorpej 		if (error)
    650   1.3   thorpej 			goto out;
    651   1.3   thorpej 	}
    652   1.3   thorpej 	ks->ks_value--;
    653   1.3   thorpej 	error = 0;
    654   1.3   thorpej  out:
    655   1.3   thorpej 	ksem_delref(ks);
    656   1.1  christos 	return (error);
    657   1.1  christos }
    658   1.1  christos 
                        /*
                         * sys__ksem_wait:
                         *
                         *	System call entry point for a blocking semaphore wait.
                         *	Forwards the `id' argument to ksem_wait() with tryflag 0 and
                         *	returns its result.  `retval' is not used.
                         */
    659   1.1  christos int
    660   1.2  christos sys__ksem_wait(struct lwp *l, void *v, register_t *retval)
    661   1.1  christos {
    662   1.2  christos 	struct sys__ksem_wait_args /* {
    663   1.1  christos 		semid_t id;
    664   1.1  christos 	} */ *uap = v;
    665   1.1  christos 
    666   1.1  christos 	return ksem_wait(l, SCARG(uap, id), 0);
    667   1.1  christos }
    668   1.1  christos 
                        /*
                         * sys__ksem_trywait:
                         *
                         *	System call entry point for a non-blocking semaphore wait.
                         *	Forwards the `id' argument to ksem_wait() with tryflag 1, so a
                         *	zero-valued semaphore yields EAGAIN instead of sleeping.
                         *	`retval' is not used.
                         */
    669   1.1  christos int
    670   1.2  christos sys__ksem_trywait(struct lwp *l, void *v, register_t *retval)
    671   1.1  christos {
    672   1.2  christos 	struct sys__ksem_trywait_args /* {
    673   1.1  christos 		semid_t id;
    674   1.1  christos 	} */ *uap = v;
    675   1.1  christos 
    676   1.1  christos 	return ksem_wait(l, SCARG(uap, id), 1);
    677   1.1  christos }
    678   1.1  christos 
                        /*
                         * sys__ksem_getvalue:
                         *
                         *	System call entry point that reports a semaphore's current
                         *	value.  Looks up `id' in the calling process's p_ksems, reads
                         *	ks_value, and copies it out to the user address `value'.
                         *
                         *	Returns EINVAL if the process has no p_ksems or the id is not
                         *	found; otherwise the result of copyout().  `retval' is not
                         *	used.
                         */
    679   1.1  christos int
    680   1.2  christos sys__ksem_getvalue(struct lwp *l, void *v, register_t *retval)
    681   1.1  christos {
    682   1.2  christos 	struct sys__ksem_getvalue_args /* {
    683   1.1  christos 		semid_t id;
    684   1.1  christos 		unsigned int *value;
    685   1.1  christos 	} */ *uap = v;
    686   1.3   thorpej 	struct ksem_proc *kp;
    687   1.1  christos 	struct ksem *ks;
    688   1.1  christos 	unsigned int val;
    689   1.1  christos 
    690   1.3   thorpej 	if ((kp = l->l_proc->p_ksems) == NULL)
    691   1.3   thorpej 		return (EINVAL);
    692   1.3   thorpej 
    693   1.3   thorpej 	lockmgr(&kp->kp_lock, LK_SHARED, NULL);
    694   1.3   thorpej 	ks = ksem_lookup_proc(kp, SCARG(uap, id));
    695   1.3   thorpej 	lockmgr(&kp->kp_lock, LK_RELEASE, NULL);
    696   1.3   thorpej 	if (ks == NULL)
    697   1.1  christos 		return (EINVAL);
    698   1.3   thorpej 
                        	/* A successful lookup is expected to hand back ks with its interlock held. */
    699   1.3   thorpej 	LOCK_ASSERT(simple_lock_held(&ks->ks_interlock));
                        	/*
                        	 * Snapshot the value into a local and drop the interlock before
                        	 * copyout(), so the user-space copy is not done with the simple
                        	 * lock held.
                        	 */
    700   1.1  christos 	val = ks->ks_value;
    701   1.3   thorpej 	simple_unlock(&ks->ks_interlock);
    702   1.3   thorpej 
    703   1.3   thorpej 	return (copyout(&val, SCARG(uap, value), sizeof(val)));
    704   1.1  christos }
    705   1.1  christos 
                        /*
                         * sys__ksem_destroy:
                         *
                         *	System call entry point that removes semaphore `id' from the
                         *	calling process's table via ksem_drop_proc() and frees the
                         *	returned ksem_ref.
                         *
                         *	Returns EINVAL if the process has no p_ksems, the id is not
                         *	found, or the semaphore has a name (ks_name != NULL); EBUSY
                         *	if ks_waiters is non-zero; 0 otherwise.  `retval' is not
                         *	used.
                         */
    706   1.1  christos int
    707   1.2  christos sys__ksem_destroy(struct lwp *l, void *v, register_t *retval)
    708   1.1  christos {
    709   1.2  christos 	struct sys__ksem_destroy_args /*{
    710   1.1  christos 		semid_t id;
    711   1.1  christos 	} */ *uap = v;
    712   1.3   thorpej 	struct ksem_proc *kp;
    713   1.3   thorpej 	struct ksem_ref *ksr;
    714   1.1  christos 	struct ksem *ks;
    715   1.1  christos 
    716   1.3   thorpej 	if ((kp = l->l_proc->p_ksems) == NULL)
    717   1.3   thorpej 		return (EINVAL);
    718   1.3   thorpej 
                        	/*
                        	 * Exclusive, unlike the read-only lookups elsewhere in this file:
                        	 * the table is handed to ksem_drop_proc() below.
                        	 */
    719   1.3   thorpej 	lockmgr(&kp->kp_lock, LK_EXCLUSIVE, NULL);
    720   1.3   thorpej 
    721   1.3   thorpej 	ks = ksem_lookup_proc(kp, SCARG(uap, id));
    722   1.3   thorpej 	if (ks == NULL) {
    723   1.3   thorpej 		lockmgr(&kp->kp_lock, LK_RELEASE, NULL);
    724   1.3   thorpej 		return (EINVAL);
    725   1.3   thorpej 	}
    726   1.3   thorpej 
                        	/* A successful lookup is expected to hand back ks with its interlock held. */
    727   1.3   thorpej 	LOCK_ASSERT(simple_lock_held(&ks->ks_interlock));
    728   1.3   thorpej 
    729   1.3   thorpej 	/*
    730   1.3   thorpej 	 * XXX This misses named semaphores which have been unlink'd,
    731   1.3   thorpej 	 * XXX but since behavior of destroying a named semaphore is
    732   1.3   thorpej 	 * XXX undefined, this is technically allowed.
    733   1.3   thorpej 	 */
    734   1.3   thorpej 	if (ks->ks_name != NULL) {
    735   1.3   thorpej 		simple_unlock(&ks->ks_interlock);
    736   1.3   thorpej 		lockmgr(&kp->kp_lock, LK_RELEASE, NULL);
    737   1.3   thorpej 		return (EINVAL);
    738   1.3   thorpej 	}
    739   1.3   thorpej 
                        	/* Refuse to destroy a semaphore that still has recorded waiters. */
    740   1.3   thorpej 	if (ks->ks_waiters) {
    741   1.3   thorpej 		simple_unlock(&ks->ks_interlock);
    742   1.3   thorpej 		lockmgr(&kp->kp_lock, LK_RELEASE, NULL);
    743   1.3   thorpej 		return (EBUSY);
    744   1.3   thorpej 	}
    745   1.3   thorpej 
                        	/*
                        	 * NOTE(review): the success path has no explicit simple_unlock();
                        	 * ksem_drop_proc() presumably consumes ks_interlock (and drops the
                        	 * process's reference) -- confirm.  The ksem_ref it returns is
                        	 * freed only after kp_lock has been released.
                        	 */
    746   1.3   thorpej 	ksr = ksem_drop_proc(kp, ks);
    747   1.3   thorpej 	lockmgr(&kp->kp_lock, LK_RELEASE, NULL);
    748   1.3   thorpej 	free(ksr, M_SEM);
    749   1.3   thorpej 
    750   1.3   thorpej 	return (0);
    751   1.3   thorpej }
    752   1.3   thorpej 
                        /*
                         * ksem_forkhook:
                         *
                         *	Fork hook (registered through forkhook_establish() in
                         *	ksem_init()).  Sets up p2->p_ksems from p1->p_ksems: NULL if
                         *	p1 has none, otherwise a fresh ksem_proc holding one new
                         *	ksem_ref per entry in p1's list, each pointing at the same
                         *	ksem and each accounted for with ksem_addref().
                         */
    753   1.3   thorpej static void
    754   1.3   thorpej ksem_forkhook(struct proc *p2, struct proc *p1)
    755   1.3   thorpej {
    756   1.3   thorpej 	struct ksem_proc *kp1, *kp2;
    757   1.3   thorpej 	struct ksem_ref *ksr, *ksr1;
    758   1.3   thorpej 
    759   1.3   thorpej 	if ((kp1 = p1->p_ksems) == NULL) {
    760   1.3   thorpej 		p2->p_ksems = NULL;
    761   1.3   thorpej 		return;
    762   1.3   thorpej 	}
    763   1.3   thorpej 
    764   1.3   thorpej 	p2->p_ksems = kp2 = ksem_proc_alloc();
    765   1.3   thorpej 
                        	/* p1's list is only read; kp2's own lock is not taken in this function. */
    766   1.3   thorpej 	lockmgr(&kp1->kp_lock, LK_SHARED, NULL);
    767   1.3   thorpej 
                        	/*
                        	 * NOTE(review): per queue(3), LIST_FOREACH over an empty list runs
                        	 * zero times, so this emptiness test looks redundant.
                        	 */
    768   1.3   thorpej 	if (!LIST_EMPTY(&kp1->kp_ksems)) {
    769   1.3   thorpej 		LIST_FOREACH(ksr, &kp1->kp_ksems, ksr_list) {
                        			/*
                        			 * The result is used without a NULL check; this
                        			 * relies on M_WAITOK semantics (see malloc(9)).
                        			 */
    770   1.3   thorpej 			ksr1 = malloc(sizeof(*ksr), M_SEM, M_WAITOK);
    771   1.3   thorpej 			ksr1->ksr_ksem = ksr->ksr_ksem;
                        			/* ksem_addref() is called with the semaphore's interlock held. */
    772   1.3   thorpej 			simple_lock(&ksr->ksr_ksem->ks_interlock);
    773   1.3   thorpej 			ksem_addref(ksr->ksr_ksem);
    774   1.3   thorpej 			simple_unlock(&ksr->ksr_ksem->ks_interlock);
                        			/* Head insertion: p2's list ends up in the reverse order of p1's. */
    775   1.3   thorpej 			LIST_INSERT_HEAD(&kp2->kp_ksems, ksr1, ksr_list);
    776   1.3   thorpej 		}
    777   1.1  christos 	}
    778   1.3   thorpej 
    779   1.3   thorpej 	lockmgr(&kp1->kp_lock, LK_RELEASE, NULL);
    780   1.1  christos }
    781   1.1  christos 
                        /*
                         * ksem_exithook:
                         *
                         *	Hook registered in ksem_init() for both process exit and exec.
                         *	Empties p->p_ksems: every ksem_ref is unlinked from the list,
                         *	its semaphore is passed to ksem_delref() with the interlock
                         *	held, and the ksem_ref is freed.  Does nothing if the process
                         *	has no p_ksems.  `arg' is not used.
                         *
                         *	NOTE(review): the ksem_proc itself is neither freed nor is
                         *	p->p_ksems cleared here.  Check whether it is released
                         *	elsewhere; if not, it is leaked when the process exits.
                         */
    782   1.1  christos static void
    783   1.8      fvdl ksem_exithook(struct proc *p, void *arg)
    784   1.1  christos {
    785   1.3   thorpej 	struct ksem_proc *kp;
    786   1.3   thorpej 	struct ksem_ref *ksr;
    787   1.3   thorpej 
    788   1.8      fvdl 	if ((kp = p->p_ksems) == NULL)
    789   1.3   thorpej 		return;
    790   1.1  christos 
                        	/*
                        	 * NOTE(review): kp_lock is not taken below.  The rationale given
                        	 * is that the process is dying, but this function is also the
                        	 * exec hook -- confirm that nothing else can touch the list then.
                        	 */
    791   1.3   thorpej 	/* Don't bother locking; process is dying. */
    792   1.3   thorpej 
                        	/* Pop entries from the head until the list is empty. */
    793   1.3   thorpej 	while ((ksr = LIST_FIRST(&kp->kp_ksems)) != NULL) {
    794   1.3   thorpej 		LIST_REMOVE(ksr, ksr_list);
                        		/*
                        		 * No simple_unlock() follows the delref; ksem_delref()
                        		 * presumably releases ks_interlock itself -- confirm.
                        		 */
    795   1.3   thorpej 		simple_lock(&ksr->ksr_ksem->ks_interlock);
    796   1.3   thorpej 		ksem_delref(ksr->ksr_ksem);
    797   1.3   thorpej 		free(ksr, M_SEM);
    798   1.1  christos 	}
    799   1.1  christos }
    800   1.1  christos 
                        /*
                         * ksem_init:
                         *
                         *	Set up the semaphore code's global state: initialize
                         *	ksem_slock, register ksem_exithook() for both process exit
                         *	and exec, register ksem_forkhook() for fork, and initialize
                         *	each of the SEM_HASHTBL_SIZE list heads in ksem_hash.
                         */
    801   1.1  christos void
    802   1.1  christos ksem_init(void)
    803   1.1  christos {
    804  1.13      cube 	int i;
    805   1.3   thorpej 
    806   1.1  christos 	simple_lock_init(&ksem_slock);
                        	/* The same cleanup routine serves as both the exit and the exec hook. */
    807   1.1  christos 	exithook_establish(ksem_exithook, NULL);
    808   1.1  christos 	exechook_establish(ksem_exithook, NULL);
    809   1.3   thorpej 	forkhook_establish(ksem_forkhook);
    810  1.13      cube 
    811  1.13      cube 	for (i = 0; i < SEM_HASHTBL_SIZE; i++)
    812  1.13      cube 		LIST_INIT(&ksem_hash[i]);
    813   1.1  christos }
    814