sysproxy.c revision 1.5 1 /* $NetBSD: sysproxy.c,v 1.5 2019/04/18 08:31:44 ozaki-r Exp $ */
2
3 /*
4 * Copyright (c) 2010, 2011 Antti Kantee. All Rights Reserved.
5 *
6 * Redistribution and use in source and binary forms, with or without
7 * modification, are permitted provided that the following conditions
8 * are met:
9 * 1. Redistributions of source code must retain the above copyright
10 * notice, this list of conditions and the following disclaimer.
11 * 2. Redistributions in binary form must reproduce the above copyright
12 * notice, this list of conditions and the following disclaimer in the
13 * documentation and/or other materials provided with the distribution.
14 *
15 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS
16 * OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
17 * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
18 * DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
19 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
20 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
21 * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
22 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
23 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
24 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
25 * SUCH DAMAGE.
26 */
27
28 #include <sys/cdefs.h>
29 __KERNEL_RCSID(0, "$NetBSD: sysproxy.c,v 1.5 2019/04/18 08:31:44 ozaki-r Exp $");
30
31 #include <sys/param.h>
32 #include <sys/filedesc.h>
33 #include <sys/kmem.h>
34 #include <sys/syscall.h>
35 #include <sys/syscallvar.h>
36 #include <sys/systm.h>
37 #include <sys/xcall.h>
38 #include <sys/lockdebug.h>
39
40 #define _RUMP_SYSPROXY
41 #include <rump/rumpuser.h>
42
43 #include <rump-sys/kern.h>
44
45 int
46 rump_init_server(const char *url)
47 {
48
49 return rumpuser_sp_init(url, ostype, osrelease, MACHINE);
50 }
51
52 static pid_t
53 hyp_getpid(void)
54 {
55
56 return curproc->p_pid;
57 }
58
59 static int
60 hyp_syscall(int num, void *arg, long *retval)
61 {
62 register_t regrv[2] = {0, 0};
63 struct lwp *l;
64 struct sysent *callp;
65 int rv;
66
67 if (__predict_false(num >= SYS_NSYSENT))
68 return ENOSYS;
69
70 /* XXX: always uses native syscall vector */
71 callp = rump_sysent + num;
72 l = curlwp;
73 rv = sy_invoke(callp, l, (void *)arg, regrv, num);
74 retval[0] = regrv[0];
75 retval[1] = regrv[1];
76
77 /* Sanity checks (from mi_userret) */
78 LOCKDEBUG_BARRIER(NULL, 0);
79 KASSERT(l->l_nopreempt == 0);
80
81 return rv;
82 }
83
84 static struct pmap remotepmap;
85
86 static int
87 hyp_rfork(void *priv, int flags, const char *comm)
88 {
89 struct rump_spctl *spctl;
90 struct vmspace *vm;
91 struct proc *p;
92 struct lwp *l;
93 int error;
94 bool initfds;
95
96 /*
97 * If we are forking off of pid 1, initialize file descriptors.
98 */
99 l = curlwp;
100 if (l->l_proc->p_pid == 1) {
101 KASSERT(flags == RUMP_RFFD_CLEAR);
102 initfds = true;
103 } else {
104 initfds = false;
105 }
106
107 /*
108 * Since it's a proxy proc, we create a vmspace for it.
109 */
110 spctl = kmem_zalloc(sizeof(*spctl), KM_SLEEP);
111 vm = &spctl->spctl_vm;
112 uvmspace_init(vm, &remotepmap, 0, 0, false);
113 spctl->spctl = priv;
114
115 if ((error = rump_lwproc_rfork_vmspace(vm, flags)) != 0) {
116 kmem_free(vm, sizeof(*vm));
117 return error;
118 }
119
120 /*
121 * We forked in this routine, so cannot use curlwp (const)
122 */
123 l = rump_lwproc_curlwp();
124 p = l->l_proc;
125
126 if (comm)
127 strlcpy(p->p_comm, comm, sizeof(p->p_comm));
128 if (initfds)
129 rump_consdev_init();
130
131 return 0;
132 }
133
134 /*
135 * Order all lwps in a process to exit. does *not* wait for them to drain.
136 */
137 static void
138 hyp_lwpexit(void)
139 {
140 struct proc *p = curproc;
141 uint64_t where;
142 struct lwp *l;
143
144 mutex_enter(p->p_lock);
145 /*
146 * First pass: mark all lwps in the process with LW_RUMP_QEXIT
147 * so that they know they should exit.
148 */
149 LIST_FOREACH(l, &p->p_lwps, l_sibling) {
150 if (l == curlwp)
151 continue;
152 l->l_flag |= LW_RUMP_QEXIT;
153 }
154 mutex_exit(p->p_lock);
155
156 /*
157 * Next, make sure everyone on all CPUs sees our status
158 * update. This keeps threads inside cv_wait() and makes
159 * sure we don't access a stale cv pointer later when
160 * we wake up the threads.
161 */
162
163 where = xc_broadcast(0, (xcfunc_t)nullop, NULL, NULL);
164 xc_wait(where);
165
166 /*
167 * Ok, all lwps are either:
168 * 1) not in the cv code
169 * 2) sleeping on l->l_private
170 * 3) sleeping on p->p_waitcv
171 *
172 * Either way, l_private is stable until we set PS_RUMP_LWPEXIT
173 * in p->p_sflag.
174 */
175
176 mutex_enter(p->p_lock);
177 LIST_FOREACH(l, &p->p_lwps, l_sibling) {
178 if (l->l_private)
179 cv_broadcast(l->l_private);
180 }
181 p->p_sflag |= PS_RUMP_LWPEXIT;
182 cv_broadcast(&p->p_waitcv);
183 mutex_exit(p->p_lock);
184 }
185
186 /*
187 * Notify process that all threads have been drained and exec is complete.
188 */
189 static void
190 hyp_execnotify(const char *comm)
191 {
192 struct proc *p = curproc;
193
194 fd_closeexec();
195 mutex_enter(p->p_lock);
196 KASSERT(p->p_nlwps == 1 && p->p_sflag & PS_RUMP_LWPEXIT);
197 p->p_sflag &= ~PS_RUMP_LWPEXIT;
198 mutex_exit(p->p_lock);
199 strlcpy(p->p_comm, comm, sizeof(p->p_comm));
200 }
201
202 /*
203 * Initialize interface pointers since component is present.
204 */
205 RUMP_COMPONENT(RUMP_COMPONENT_KERN)
206 {
207
208 rump_sysproxy_ops.rspo_copyin = rumpuser_sp_copyin;
209 rump_sysproxy_ops.rspo_copyinstr = rumpuser_sp_copyinstr;
210 rump_sysproxy_ops.rspo_copyout = rumpuser_sp_copyout;
211 rump_sysproxy_ops.rspo_copyoutstr = rumpuser_sp_copyoutstr;
212 rump_sysproxy_ops.rspo_anonmmap = rumpuser_sp_anonmmap;
213 rump_sysproxy_ops.rspo_raise = rumpuser_sp_raise;
214 rump_sysproxy_ops.rspo_fini = rumpuser_sp_fini;
215
216 rump_sysproxy_ops.rspo_hyp_getpid = hyp_getpid;
217 rump_sysproxy_ops.rspo_hyp_syscall = hyp_syscall;
218 rump_sysproxy_ops.rspo_hyp_rfork = hyp_rfork;
219 rump_sysproxy_ops.rspo_hyp_lwpexit = hyp_lwpexit;
220 rump_sysproxy_ops.rspo_hyp_execnotify = hyp_execnotify;
221 }
222