1 /*        $NetBSD: emul.c,v 1.202 2024/07/28 13:01:55 bad Exp $       */
2 
3 /*
4  * Copyright (c) 2007-2011 Antti Kantee.  All Rights Reserved.
5  *
6  * Redistribution and use in source and binary forms, with or without
7  * modification, are permitted provided that the following conditions
8  * are met:
9  * 1. Redistributions of source code must retain the above copyright
10  *    notice, this list of conditions and the following disclaimer.
11  * 2. Redistributions in binary form must reproduce the above copyright
12  *    notice, this list of conditions and the following disclaimer in the
13  *    documentation and/or other materials provided with the distribution.
14  *
15  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS
16  * OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
17  * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
18  * DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
19  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
20  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
21  * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
22  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
23  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
24  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
25  * SUCH DAMAGE.
26  */
27 
28 #include <sys/cdefs.h>
29 __KERNEL_RCSID(0, "$NetBSD: emul.c,v 1.202 2024/07/28 13:01:55 bad Exp $");
30 
31 #include <sys/param.h>
32 #include <sys/cprng.h>
33 #include <sys/filedesc.h>
34 #include <sys/fstrans.h>
35 #include <sys/kauth.h>
36 #include <sys/module.h>
37 #include <sys/reboot.h>
38 #include <sys/syscall.h>
39 #include <sys/pserialize.h>
40 #ifdef LOCKDEBUG
41 #include <sys/sleepq.h>
42 #endif
43 #include <sys/syncobj.h>
44 
45 #include <dev/cons.h>
46 
47 #include <rump-sys/kern.h>
48 
49 #include <rump/rumpuser.h>
50 
51 void (*rump_vfs_fini)(void) = (void *)nullop;
52 
53 /*
54  * physmem is largely unused (except for nmbcluster calculations),
55  * so pick a default value which suits ZFS.  if an application wants
56  * a very small memory footprint, it can still adjust this before
57  * calling rump_init()
58  */
59 #define PHYSMEM 512*256
60 psize_t physmem = PHYSMEM;
61 size_t nkmempages = PHYSMEM/2; /* from le chapeau */
62 #undef PHYSMEM
63 
64 struct vnode *rootvp;
65 dev_t rootdev = NODEV;
66 
67 const int schedppq = 1;
68 int cold = 1;
69 int shutting_down;
70 int boothowto = AB_SILENT;
71 struct tty *constty;
72 
/*
 * Block device switch: a fixed table of 255 slots.  The advertised
 * counts are derived from the table itself so they cannot drift apart.
 */
const struct bdevsw *bdevsw0[255];
const struct bdevsw **bdevsw = bdevsw0;
const int sys_bdevsws = sizeof(bdevsw0) / sizeof(bdevsw0[0]);
int max_bdevsws = sizeof(bdevsw0) / sizeof(bdevsw0[0]);

/* Character device switch, laid out the same way. */
const struct cdevsw *cdevsw0[255];
const struct cdevsw **cdevsw = cdevsw0;
const int sys_cdevsws = sizeof(cdevsw0) / sizeof(cdevsw0[0]);
int max_cdevsws = sizeof(cdevsw0) / sizeof(cdevsw0[0]);
82 
83 int mem_no = 2;
84 
85 device_t booted_device;
86 device_t booted_wedge;
87 daddr_t booted_startblk;
88 uint64_t booted_nblks;
89 int booted_partition;
90 const char *booted_method;
91 
92 /* XXX: unused */
93 kmutex_t tty_lock;
94 krwlock_t exec_lock;
95 
/*
 * sparc doesn't sport a constant page size, so pretend we have 4k
 * pages: shift of 12, size 1 << 12, offset mask one less than that.
 */
#ifdef __sparc__
int pgshift = 12;
int nbpg = 1 << 12;
int pgofset = (1 << 12) - 1;
#endif
102 
/*
 * On sun3 VM_MAX_ADDRESS is a const variable, so provide kernbase.
 * XXX: should this be moved into rump.c and initialized for both
 * sun3 and sun3x?
 */
#ifdef sun3
const vaddr_t kernbase = KERNBASE3;
#endif
108 
109 struct loadavg averunnable = {
110           { 0 * FSCALE,
111             1 * FSCALE,
112             11 * FSCALE, },
113           FSCALE,
114 };
115 
116 /*
117  * Include the autogenerated list of auto-loadable syscalls
118  */
119 #include <kern/syscalls_autoload.c>
120 
121 struct emul emul_netbsd = {
122           .e_name = "netbsd-rump",
123           .e_sysent = rump_sysent,
124           .e_nomodbits = rump_sysent_nomodbits,
125 #ifndef __HAVE_MINIMAL_EMUL
126           .e_nsysent = SYS_NSYSENT,
127 #endif
128           .e_vm_default_addr = uvm_default_mapaddr,
129 #ifdef __HAVE_SYSCALL_INTERN
130           .e_syscall_intern = syscall_intern,
131 #endif
132           .e_sc_autoload = netbsd_syscalls_autoload,
133 };
134 
135 /* not used, but need the symbols for pointer comparisons */
136 syncobj_t mutex_syncobj, rw_syncobj;
137 
138 int
kpause(const char * wmesg,bool intr,int timeo,kmutex_t * mtx)139 kpause(const char *wmesg, bool intr, int timeo, kmutex_t *mtx)
140 {
141           extern int hz;
142           int rv __diagused;
143           uint64_t sec, nsec;
144 
145           if (mtx)
146                     mutex_exit(mtx);
147 
148           sec = timeo / hz;
149           nsec = (timeo % hz) * (1000000000 / hz);
150           rv = rumpuser_clock_sleep(RUMPUSER_CLOCK_RELWALL, sec, nsec);
151           KASSERT(rv == 0);
152 
153           if (mtx)
154                     mutex_enter(mtx);
155 
156           return 0;
157 }
158 
159 vaddr_t
calc_cache_size(vsize_t vasz,int pct,int va_pct)160 calc_cache_size(vsize_t vasz, int pct, int va_pct)
161 {
162           paddr_t t;
163 
164           t = (paddr_t)physmem * pct / 100 * PAGE_SIZE;
165           if ((vaddr_t)t != t) {
166                     panic("%s: needs tweak", __func__);
167           }
168           return t;
169 }
170 
/*
 * Return address of the current function, as an integer.  The whole
 * expansion is parenthesized so that it remains a single operand in
 * any context (for instance as the operand of sizeof).
 */
#define	RETURN_ADDRESS	((uintptr_t)__builtin_return_address(0))
172 
173 void
assert_sleepable(void)174 assert_sleepable(void)
175 {
176           const char *reason = NULL;
177 
178           /* always sleepable, although we should improve this */
179 
180           if (!pserialize_not_in_read_section()) {
181                     reason = "pserialize";
182           }
183 
184           if (reason) {
185                     panic("%s: %s caller=%p", __func__, reason,
186                         (void *)RETURN_ADDRESS);
187           }
188 }
189 
/*
 * Machine-dependent module initialization.
 *
 * Nothing to do for now.  However, we should load the librump
 * symbol table here.
 */
void
module_init_md(void)
{
}
199 
200 /*
201  * Try to emulate all the MD definitions of DELAY() / delay().
202  * Would be nice to fix the #defines in MD headers, but this quicker.
203  *
204  * XXX: we'd need a rumpuser_clock_sleep_nowrap() here.  Since we
205  * don't have it in the current hypercall revision, busyloop.
206  * Note that rather than calibrate a loop delay and work with that,
207  * get call gettime (which does not block) in a loop to make sure
208  * we didn't get virtual ghosttime.  That might be slightly inaccurate
209  * for very small delays ...
210  *
211  * The other option would be to run a thread in the hypervisor which
212  * sleeps for us and we can wait for it using rumpuser_cv_wait_nowrap()
213  * Probably too fussy.  Better just wait for hypercall rev 18 ;)
214  */
215 static void
rump_delay(unsigned int us)216 rump_delay(unsigned int us)
217 {
218           struct timespec target, tmp;
219           uint64_t sec, sec_ini, sec_now;
220           long nsec, nsec_ini, nsec_now;
221           int loops;
222 
223           rumpuser_clock_gettime(RUMPUSER_CLOCK_ABSMONO, &sec_ini, &nsec_ini);
224 
225 #ifdef __mac68k__
226           sec = us / 1000;
227           nsec = (us % 1000) * 1000000;
228 #else
229           sec = us / 1000000;
230           nsec = (us % 1000000) * 1000;
231 #endif
232 
233           target.tv_sec = sec_ini;
234           tmp.tv_sec = sec;
235           target.tv_nsec = nsec_ini;
236           tmp.tv_nsec = nsec;
237           timespecadd(&target, &tmp, &target);
238 
239           if (__predict_false(sec != 0))
240                     printf("WARNING: over 1s delay\n");
241 
242           for (loops = 0; loops < 1000*1000*100; loops++) {
243                     struct timespec cur;
244 
245                     rumpuser_clock_gettime(RUMPUSER_CLOCK_ABSMONO,
246                         &sec_now, &nsec_now);
247                     cur.tv_sec = sec_now;
248                     cur.tv_nsec = nsec_now;
249                     if (timespeccmp(&cur, &target, >=)) {
250                               return;
251                     }
252           }
253           printf("WARNING: DELAY ESCAPED\n");
254 }
255 void (*delay_func)(unsigned int) = rump_delay;
256 __strong_alias(delay,rump_delay);
257 __strong_alias(_delay,rump_delay);
258 
259 /* Weak alias for getcwd_common to be used unless librumpvfs is present. */
260 
261 int rump_getcwd_common(struct vnode *, struct vnode *, char **, char *,
262     int, int, struct lwp *);
263 int
rump_getcwd_common(struct vnode * lvp,struct vnode * rvp,char ** bpp,char * bufp,int limit,int flags,struct lwp * l)264 rump_getcwd_common(struct vnode *lvp, struct vnode *rvp, char **bpp, char *bufp,
265     int limit, int flags, struct lwp *l)
266 {
267 
268           return ENOENT;
269 }
270 __weak_alias(getcwd_common,rump_getcwd_common);
271 
272 /* Weak alias for vnode_to_path to be used unless librumpvfs is present. */
273 
274 int rump_vnode_to_path(char *, size_t, struct vnode *, struct lwp *,
275     struct proc *);
276 int
rump_vnode_to_path(char * path,size_t len,struct vnode * vp,struct lwp * curl,struct proc * p)277 rump_vnode_to_path(char *path, size_t len, struct vnode *vp, struct lwp *curl,
278     struct proc *p)
279 {
280 
281           return ENOENT; /* pretend getcwd_common() failed. */
282 }
283 __weak_alias(vnode_to_path,rump_vnode_to_path);
284 
285 
286 /* Weak aliases for fstrans to be used unless librumpvfs is present. */
287 
288 void rump_fstrans_start(struct mount *);
289 void
rump_fstrans_start(struct mount * mp)290 rump_fstrans_start(struct mount *mp)
291 {
292 
293 }
294 __weak_alias(fstrans_start,rump_fstrans_start);
295 
296 int rump_fstrans_start_nowait(struct mount *);
297 int
rump_fstrans_start_nowait(struct mount * mp)298 rump_fstrans_start_nowait(struct mount *mp)
299 {
300 
301           return 0;
302 }
303 __weak_alias(fstrans_start_nowait,rump_fstrans_start_nowait);
304 
305 void rump_fstrans_start_lazy(struct mount *);
306 void
rump_fstrans_start_lazy(struct mount * mp)307 rump_fstrans_start_lazy(struct mount *mp)
308 {
309 
310 }
311 __weak_alias(fstrans_start_lazy,rump_fstrans_start_lazy);
312 
313 
314 void rump_fstrans_done(struct mount *);
315 void
rump_fstrans_done(struct mount * mp)316 rump_fstrans_done(struct mount *mp)
317 {
318 
319 }
320 __weak_alias(fstrans_done,rump_fstrans_done);
321 
322 
323 void rump_fstrans_lwp_dtor(struct lwp *);
324 void
rump_fstrans_lwp_dtor(struct lwp * l)325 rump_fstrans_lwp_dtor(struct lwp *l)
326 {
327 
328 }
329 __weak_alias(fstrans_lwp_dtor,rump_fstrans_lwp_dtor);
330 
331 static int
rump_filt_fsattach(struct knote * kn)332 rump_filt_fsattach(struct knote *kn)
333 {
334 
335           return EOPNOTSUPP;
336 }
337 
338 struct filterops rump_fs_filtops = {
339           .f_attach = rump_filt_fsattach,
340 };
341 __weak_alias(fs_filtops,rump_fs_filtops);
342 
/*
 * Fallback definition of the pnbuf_cache pointer, exported under a
 * weak alias; nothing in this file assigns it.
 */
struct pool_cache *rump_pnbuf_cache;
__weak_alias(pnbuf_cache,rump_pnbuf_cache);
345 
346 /*
347  * Provide weak aliases for tty routines used by printf.
348  * They will be used unless the rumpkern_tty component is present.
349  */
350 
351 int rump_ttycheckoutq(struct tty *, int);
352 int
rump_ttycheckoutq(struct tty * tp,int wait)353 rump_ttycheckoutq(struct tty *tp, int wait)
354 {
355 
356           return 1;
357 }
358 __weak_alias(ttycheckoutq,rump_ttycheckoutq);
359 
360 int rump_tputchar(int, int, struct tty *);
361 int
rump_tputchar(int c,int flags,struct tty * tp)362 rump_tputchar(int c, int flags, struct tty *tp)
363 {
364 
365           cnputc(c);
366           return 0;
367 }
368 __weak_alias(tputchar,rump_tputchar);
369 
/* Console output: pass the character on to the rumpuser_putchar() hypercall. */
void
cnputc(int c)
{
	rumpuser_putchar(c);
}
376 
/* Console flush: there is nothing to do here, so we are done at once. */
void
cnflush(void)
{
}
383 
/*
 * Deliberately empty: setting clocks is not in the jurisdiction of
 * rump kernels.
 */
void
resettodr(void)
{
}
390 
#ifdef __HAVE_SYSCALL_INTERN
/*
 * syscall_intern hook referenced by emul_netbsd: it only clears the
 * process's emulation-private data pointer.
 */
void
syscall_intern(struct proc *p)
{
	p->p_emuldata = NULL;
}
#endif
399 
#ifdef LOCKDEBUG
/*
 * Only built with LOCKDEBUG.  Both arguments are ignored and nothing
 * is printed.
 */
void
turnstile_print(volatile void *obj, void (*pr)(const char *, ...))
{
}
#endif
408 
409 void
cpu_reboot(int howto,char * bootstr)410 cpu_reboot(int howto, char *bootstr)
411 {
412           int ruhow = 0;
413           void *finiarg;
414 
415           printf("rump kernel halting...\n");
416 
417           if (!RUMP_LOCALPROC_P(curproc))
418                     finiarg = RUMP_SPVM2CTL(curproc->p_vmspace);
419           else
420                     finiarg = NULL;
421 
422           /* dump means we really take the dive here */
423           if ((howto & RB_DUMP) || panicstr) {
424                     ruhow = RUMPUSER_PANIC;
425                     goto out;
426           }
427 
428           /* try to sync */
429           if (!((howto & RB_NOSYNC) || panicstr)) {
430                     rump_vfs_fini();
431           }
432 
433           doshutdownhooks();
434 
435           /* your wish is my command */
436           if (howto & RB_HALT) {
437                     printf("rump kernel halted (with RB_HALT, not exiting)\n");
438                     rump_sysproxy_fini(finiarg);
439                     for (;;) {
440                               rumpuser_clock_sleep(RUMPUSER_CLOCK_RELWALL, 10, 0);
441                     }
442           }
443 
444           /* this function is __dead, we must exit */
445  out:
446           rump_sysproxy_fini(finiarg);
447           rumpuser_exit(ruhow);
448 }
449