1 /*-
2 * Copyright (c) 1982, 1986, 1989, 1991, 1993
3 * The Regents of the University of California. All rights reserved.
4 *
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions
7 * are met:
8 * 1. Redistributions of source code must retain the above copyright
9 * notice, this list of conditions and the following disclaimer.
10 * 2. Redistributions in binary form must reproduce the above copyright
11 * notice, this list of conditions and the following disclaimer in the
12 * documentation and/or other materials provided with the distribution.
13 * 4. Neither the name of the University nor the names of its contributors
14 * may be used to endorse or promote products derived from this software
15 * without specific prior written permission.
16 *
17 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
18 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
21 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
22 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
23 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
24 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
25 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
26 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
27 * SUCH DAMAGE.
28 *
29 * @(#)kern_proc.c 8.7 (Berkeley) 2/14/95
30 */
31
32 #include <sys/cdefs.h>
33 __FBSDID("$FreeBSD$");
34
35 #include "opt_compat.h"
36 #include "opt_ddb.h"
37 #include "opt_kdtrace.h"
38 #include "opt_ktrace.h"
39 #include "opt_kstack_pages.h"
40 #include "opt_stack.h"
41
42 #include <sys/param.h>
43 #include <sys/systm.h>
44 #include <sys/elf.h>
45 #include <sys/exec.h>
46 #include <sys/kernel.h>
47 #include <sys/limits.h>
48 #include <sys/lock.h>
49 #include <sys/loginclass.h>
50 #include <sys/malloc.h>
51 #include <sys/mman.h>
52 #include <sys/mount.h>
53 #include <sys/mutex.h>
54 #include <sys/proc.h>
55 #include <sys/ptrace.h>
56 #include <sys/refcount.h>
57 #include <sys/resourcevar.h>
58 #include <sys/rwlock.h>
59 #include <sys/sbuf.h>
60 #include <sys/sysent.h>
61 #include <sys/sched.h>
62 #include <sys/smp.h>
63 #include <sys/stack.h>
64 #include <sys/stat.h>
65 #include <sys/sysctl.h>
66 #include <sys/filedesc.h>
67 #include <sys/tty.h>
68 #include <sys/signalvar.h>
69 #include <sys/sdt.h>
70 #include <sys/sx.h>
71 #include <sys/user.h>
72 #include <sys/jail.h>
73 #include <sys/vnode.h>
74 #include <sys/eventhandler.h>
75
76 #ifdef DDB
77 #include <ddb/ddb.h>
78 #endif
79
80 #include <vm/vm.h>
81 #include <vm/vm_param.h>
82 #include <vm/vm_extern.h>
83 #include <vm/pmap.h>
84 #include <vm/vm_map.h>
85 #include <vm/vm_object.h>
86 #include <vm/vm_page.h>
87 #include <vm/uma.h>
88
89 #ifdef COMPAT_FREEBSD32
90 #include <compat/freebsd32/freebsd32.h>
91 #include <compat/freebsd32/freebsd32_util.h>
92 #endif
93
94 SDT_PROVIDER_DEFINE(proc);
95 SDT_PROBE_DEFINE4(proc, kernel, ctor, entry, "struct proc *", "int",
96 "void *", "int");
97 SDT_PROBE_DEFINE4(proc, kernel, ctor, return, "struct proc *", "int",
98 "void *", "int");
99 SDT_PROBE_DEFINE4(proc, kernel, dtor, entry, "struct proc *", "int",
100 "void *", "struct thread *");
101 SDT_PROBE_DEFINE3(proc, kernel, dtor, return, "struct proc *", "int",
102 "void *");
103 SDT_PROBE_DEFINE3(proc, kernel, init, entry, "struct proc *", "int",
104 "int");
105 SDT_PROBE_DEFINE3(proc, kernel, init, return, "struct proc *", "int",
106 "int");
107
108 MALLOC_DEFINE(M_PGRP, "pgrp", "process group header");
109 MALLOC_DEFINE(M_SESSION, "session", "session header");
110 static MALLOC_DEFINE(M_PROC, "proc", "Proc structures");
111 MALLOC_DEFINE(M_SUBPROC, "subproc", "Proc sub-structures");
112
113 static void doenterpgrp(struct proc *, struct pgrp *);
114 static void orphanpg(struct pgrp *pg);
115 static void fill_kinfo_aggregate(struct proc *p, struct kinfo_proc *kp);
116 static void fill_kinfo_proc_only(struct proc *p, struct kinfo_proc *kp);
117 static void fill_kinfo_thread(struct thread *td, struct kinfo_proc *kp,
118 int preferthread);
119 static void pgadjustjobc(struct pgrp *pgrp, int entering);
120 static void pgdelete(struct pgrp *);
121 static int proc_ctor(void *mem, int size, void *arg, int flags);
122 static void proc_dtor(void *mem, int size, void *arg);
123 static int proc_init(void *mem, int size, int flags);
124 static void proc_fini(void *mem, int size);
125 static void pargs_free(struct pargs *pa);
126 static struct proc *zpfind_locked(pid_t pid);
127
128 /*
129 * Other process lists
130 */
131 struct pidhashhead *pidhashtbl;
132 u_long pidhash;
133 struct pgrphashhead *pgrphashtbl;
134 u_long pgrphash;
135 struct proclist allproc;
136 struct proclist zombproc;
137 struct sx allproc_lock;
138 struct sx proctree_lock;
139 struct mtx ppeers_lock;
140 uma_zone_t proc_zone;
141
142 int kstack_pages = KSTACK_PAGES;
143 SYSCTL_INT(_kern, OID_AUTO, kstack_pages, CTLFLAG_RD, &kstack_pages, 0,
144 "Kernel stack size in pages");
145 static int vmmap_skip_res_cnt = 0;
146 SYSCTL_INT(_kern, OID_AUTO, proc_vmmap_skip_resident_count, CTLFLAG_RW,
147 &vmmap_skip_res_cnt, 0,
148 "Skip calculation of the pages resident count in kern.proc.vmmap");
149
150 CTASSERT(sizeof(struct kinfo_proc) == KINFO_PROC_SIZE);
151 #ifdef COMPAT_FREEBSD32
152 CTASSERT(sizeof(struct kinfo_proc32) == KINFO_PROC32_SIZE);
153 #endif
154
155 /*
156 * Initialize global process hashing structures.
157 */
158 void
procinit()159 procinit()
160 {
161
162 sx_init(&allproc_lock, "allproc");
163 sx_init(&proctree_lock, "proctree");
164 mtx_init(&ppeers_lock, "p_peers", NULL, MTX_DEF);
165 LIST_INIT(&allproc);
166 LIST_INIT(&zombproc);
167 pidhashtbl = hashinit(maxproc / 4, M_PROC, &pidhash);
168 pgrphashtbl = hashinit(maxproc / 4, M_PROC, &pgrphash);
169 proc_zone = uma_zcreate("PROC", sched_sizeof_proc(),
170 proc_ctor, proc_dtor, proc_init, proc_fini,
171 UMA_ALIGN_PTR, UMA_ZONE_NOFREE);
172 uihashinit();
173 }
174
175 /*
176 * Prepare a proc for use.
177 */
178 static int
proc_ctor(void * mem,int size,void * arg,int flags)179 proc_ctor(void *mem, int size, void *arg, int flags)
180 {
181 struct proc *p;
182
183 p = (struct proc *)mem;
184 SDT_PROBE(proc, kernel, ctor , entry, p, size, arg, flags, 0);
185 EVENTHANDLER_INVOKE(process_ctor, p);
186 SDT_PROBE(proc, kernel, ctor , return, p, size, arg, flags, 0);
187 return (0);
188 }
189
190 /*
191 * Reclaim a proc after use.
192 */
193 static void
proc_dtor(void * mem,int size,void * arg)194 proc_dtor(void *mem, int size, void *arg)
195 {
196 struct proc *p;
197 struct thread *td;
198
199 /* INVARIANTS checks go here */
200 p = (struct proc *)mem;
201 td = FIRST_THREAD_IN_PROC(p);
202 SDT_PROBE(proc, kernel, dtor, entry, p, size, arg, td, 0);
203 if (td != NULL) {
204 #ifdef INVARIANTS
205 KASSERT((p->p_numthreads == 1),
206 ("bad number of threads in exiting process"));
207 KASSERT(STAILQ_EMPTY(&p->p_ktr), ("proc_dtor: non-empty p_ktr"));
208 #endif
209 /* Free all OSD associated to this thread. */
210 osd_thread_exit(td);
211 }
212 EVENTHANDLER_INVOKE(process_dtor, p);
213 if (p->p_ksi != NULL)
214 KASSERT(! KSI_ONQ(p->p_ksi), ("SIGCHLD queue"));
215 SDT_PROBE(proc, kernel, dtor, return, p, size, arg, 0, 0);
216 }
217
218 /*
219 * Initialize type-stable parts of a proc (when newly created).
220 */
221 static int
proc_init(void * mem,int size,int flags)222 proc_init(void *mem, int size, int flags)
223 {
224 struct proc *p;
225
226 p = (struct proc *)mem;
227 SDT_PROBE(proc, kernel, init, entry, p, size, flags, 0, 0);
228 p->p_sched = (struct p_sched *)&p[1];
229 bzero(&p->p_mtx, sizeof(struct mtx));
230 mtx_init(&p->p_mtx, "process lock", NULL, MTX_DEF | MTX_DUPOK);
231 mtx_init(&p->p_slock, "process slock", NULL, MTX_SPIN | MTX_RECURSE);
232 cv_init(&p->p_pwait, "ppwait");
233 cv_init(&p->p_dbgwait, "dbgwait");
234 TAILQ_INIT(&p->p_threads); /* all threads in proc */
235 EVENTHANDLER_INVOKE(process_init, p);
236 p->p_stats = pstats_alloc();
237 SDT_PROBE(proc, kernel, init, return, p, size, flags, 0, 0);
238 return (0);
239 }
240
241 /*
242 * UMA should ensure that this function is never called.
243 * Freeing a proc structure would violate type stability.
244 */
245 static void
proc_fini(void * mem,int size)246 proc_fini(void *mem, int size)
247 {
248 #ifdef notnow
249 struct proc *p;
250
251 p = (struct proc *)mem;
252 EVENTHANDLER_INVOKE(process_fini, p);
253 pstats_free(p->p_stats);
254 thread_free(FIRST_THREAD_IN_PROC(p));
255 mtx_destroy(&p->p_mtx);
256 if (p->p_ksi != NULL)
257 ksiginfo_free(p->p_ksi);
258 #else
259 panic("proc reclaimed");
260 #endif
261 }
262
263 /*
264 * Is p an inferior of the current process?
265 */
266 int
inferior(struct proc * p)267 inferior(struct proc *p)
268 {
269
270 sx_assert(&proctree_lock, SX_LOCKED);
271 PROC_LOCK_ASSERT(p, MA_OWNED);
272 for (; p != curproc; p = proc_realparent(p)) {
273 if (p->p_pid == 0)
274 return (0);
275 }
276 return (1);
277 }
278
279 struct proc *
pfind_locked(pid_t pid)280 pfind_locked(pid_t pid)
281 {
282 struct proc *p;
283
284 sx_assert(&allproc_lock, SX_LOCKED);
285 LIST_FOREACH(p, PIDHASH(pid), p_hash) {
286 if (p->p_pid == pid) {
287 PROC_LOCK(p);
288 if (p->p_state == PRS_NEW) {
289 PROC_UNLOCK(p);
290 p = NULL;
291 }
292 break;
293 }
294 }
295 return (p);
296 }
297
298 /*
299 * Locate a process by number; return only "live" processes -- i.e., neither
300 * zombies nor newly born but incompletely initialized processes. By not
301 * returning processes in the PRS_NEW state, we allow callers to avoid
302 * testing for that condition to avoid dereferencing p_ucred, et al.
303 */
304 struct proc *
pfind(pid_t pid)305 pfind(pid_t pid)
306 {
307 struct proc *p;
308
309 sx_slock(&allproc_lock);
310 p = pfind_locked(pid);
311 sx_sunlock(&allproc_lock);
312 return (p);
313 }
314
315 static struct proc *
pfind_tid_locked(pid_t tid)316 pfind_tid_locked(pid_t tid)
317 {
318 struct proc *p;
319 struct thread *td;
320
321 sx_assert(&allproc_lock, SX_LOCKED);
322 FOREACH_PROC_IN_SYSTEM(p) {
323 PROC_LOCK(p);
324 if (p->p_state == PRS_NEW) {
325 PROC_UNLOCK(p);
326 continue;
327 }
328 FOREACH_THREAD_IN_PROC(p, td) {
329 if (td->td_tid == tid)
330 goto found;
331 }
332 PROC_UNLOCK(p);
333 }
334 found:
335 return (p);
336 }
337
338 /*
339 * Locate a process group by number.
340 * The caller must hold proctree_lock.
341 */
342 struct pgrp *
pgfind(pgid)343 pgfind(pgid)
344 register pid_t pgid;
345 {
346 register struct pgrp *pgrp;
347
348 sx_assert(&proctree_lock, SX_LOCKED);
349
350 LIST_FOREACH(pgrp, PGRPHASH(pgid), pg_hash) {
351 if (pgrp->pg_id == pgid) {
352 PGRP_LOCK(pgrp);
353 return (pgrp);
354 }
355 }
356 return (NULL);
357 }
358
359 /*
360 * Locate process and do additional manipulations, depending on flags.
361 */
362 int
pget(pid_t pid,int flags,struct proc ** pp)363 pget(pid_t pid, int flags, struct proc **pp)
364 {
365 struct proc *p;
366 int error;
367
368 sx_slock(&allproc_lock);
369 if (pid <= PID_MAX) {
370 p = pfind_locked(pid);
371 if (p == NULL && (flags & PGET_NOTWEXIT) == 0)
372 p = zpfind_locked(pid);
373 } else if ((flags & PGET_NOTID) == 0) {
374 p = pfind_tid_locked(pid);
375 } else {
376 p = NULL;
377 }
378 sx_sunlock(&allproc_lock);
379 if (p == NULL)
380 return (ESRCH);
381 if ((flags & PGET_CANSEE) != 0) {
382 error = p_cansee(curthread, p);
383 if (error != 0)
384 goto errout;
385 }
386 if ((flags & PGET_CANDEBUG) != 0) {
387 error = p_candebug(curthread, p);
388 if (error != 0)
389 goto errout;
390 }
391 if ((flags & PGET_ISCURRENT) != 0 && curproc != p) {
392 error = EPERM;
393 goto errout;
394 }
395 if ((flags & PGET_NOTWEXIT) != 0 && (p->p_flag & P_WEXIT) != 0) {
396 error = ESRCH;
397 goto errout;
398 }
399 if ((flags & PGET_NOTINEXEC) != 0 && (p->p_flag & P_INEXEC) != 0) {
400 /*
401 * XXXRW: Not clear ESRCH is the right error during proc
402 * execve().
403 */
404 error = ESRCH;
405 goto errout;
406 }
407 if ((flags & PGET_HOLD) != 0) {
408 _PHOLD(p);
409 PROC_UNLOCK(p);
410 }
411 *pp = p;
412 return (0);
413 errout:
414 PROC_UNLOCK(p);
415 return (error);
416 }
417
418 /*
419 * Create a new process group.
420 * pgid must be equal to the pid of p.
421 * Begin a new session if required.
422 */
423 int
enterpgrp(p,pgid,pgrp,sess)424 enterpgrp(p, pgid, pgrp, sess)
425 register struct proc *p;
426 pid_t pgid;
427 struct pgrp *pgrp;
428 struct session *sess;
429 {
430
431 sx_assert(&proctree_lock, SX_XLOCKED);
432
433 KASSERT(pgrp != NULL, ("enterpgrp: pgrp == NULL"));
434 KASSERT(p->p_pid == pgid,
435 ("enterpgrp: new pgrp and pid != pgid"));
436 KASSERT(pgfind(pgid) == NULL,
437 ("enterpgrp: pgrp with pgid exists"));
438 KASSERT(!SESS_LEADER(p),
439 ("enterpgrp: session leader attempted setpgrp"));
440
441 mtx_init(&pgrp->pg_mtx, "process group", NULL, MTX_DEF | MTX_DUPOK);
442
443 if (sess != NULL) {
444 /*
445 * new session
446 */
447 mtx_init(&sess->s_mtx, "session", NULL, MTX_DEF);
448 PROC_LOCK(p);
449 p->p_flag &= ~P_CONTROLT;
450 PROC_UNLOCK(p);
451 PGRP_LOCK(pgrp);
452 sess->s_leader = p;
453 sess->s_sid = p->p_pid;
454 refcount_init(&sess->s_count, 1);
455 sess->s_ttyvp = NULL;
456 sess->s_ttydp = NULL;
457 sess->s_ttyp = NULL;
458 bcopy(p->p_session->s_login, sess->s_login,
459 sizeof(sess->s_login));
460 pgrp->pg_session = sess;
461 KASSERT(p == curproc,
462 ("enterpgrp: mksession and p != curproc"));
463 } else {
464 pgrp->pg_session = p->p_session;
465 sess_hold(pgrp->pg_session);
466 PGRP_LOCK(pgrp);
467 }
468 pgrp->pg_id = pgid;
469 LIST_INIT(&pgrp->pg_members);
470
471 /*
472 * As we have an exclusive lock of proctree_lock,
473 * this should not deadlock.
474 */
475 LIST_INSERT_HEAD(PGRPHASH(pgid), pgrp, pg_hash);
476 pgrp->pg_jobc = 0;
477 SLIST_INIT(&pgrp->pg_sigiolst);
478 PGRP_UNLOCK(pgrp);
479
480 doenterpgrp(p, pgrp);
481 return (0);
482 }
483
484 /*
485 * Move p to an existing process group
486 */
487 int
enterthispgrp(p,pgrp)488 enterthispgrp(p, pgrp)
489 register struct proc *p;
490 struct pgrp *pgrp;
491 {
492
493 sx_assert(&proctree_lock, SX_XLOCKED);
494 PROC_LOCK_ASSERT(p, MA_NOTOWNED);
495 PGRP_LOCK_ASSERT(pgrp, MA_NOTOWNED);
496 PGRP_LOCK_ASSERT(p->p_pgrp, MA_NOTOWNED);
497 SESS_LOCK_ASSERT(p->p_session, MA_NOTOWNED);
498 KASSERT(pgrp->pg_session == p->p_session,
499 ("%s: pgrp's session %p, p->p_session %p.\n",
500 __func__,
501 pgrp->pg_session,
502 p->p_session));
503 KASSERT(pgrp != p->p_pgrp,
504 ("%s: p belongs to pgrp.", __func__));
505
506 doenterpgrp(p, pgrp);
507
508 return (0);
509 }
510
511 /*
512 * Move p to a process group
513 */
514 static void
doenterpgrp(p,pgrp)515 doenterpgrp(p, pgrp)
516 struct proc *p;
517 struct pgrp *pgrp;
518 {
519 struct pgrp *savepgrp;
520
521 sx_assert(&proctree_lock, SX_XLOCKED);
522 PROC_LOCK_ASSERT(p, MA_NOTOWNED);
523 PGRP_LOCK_ASSERT(pgrp, MA_NOTOWNED);
524 PGRP_LOCK_ASSERT(p->p_pgrp, MA_NOTOWNED);
525 SESS_LOCK_ASSERT(p->p_session, MA_NOTOWNED);
526
527 savepgrp = p->p_pgrp;
528
529 /*
530 * Adjust eligibility of affected pgrps to participate in job control.
531 * Increment eligibility counts before decrementing, otherwise we
532 * could reach 0 spuriously during the first call.
533 */
534 fixjobc(p, pgrp, 1);
535 fixjobc(p, p->p_pgrp, 0);
536
537 PGRP_LOCK(pgrp);
538 PGRP_LOCK(savepgrp);
539 PROC_LOCK(p);
540 LIST_REMOVE(p, p_pglist);
541 p->p_pgrp = pgrp;
542 PROC_UNLOCK(p);
543 LIST_INSERT_HEAD(&pgrp->pg_members, p, p_pglist);
544 PGRP_UNLOCK(savepgrp);
545 PGRP_UNLOCK(pgrp);
546 if (LIST_EMPTY(&savepgrp->pg_members))
547 pgdelete(savepgrp);
548 }
549
550 /*
551 * remove process from process group
552 */
553 int
leavepgrp(p)554 leavepgrp(p)
555 register struct proc *p;
556 {
557 struct pgrp *savepgrp;
558
559 sx_assert(&proctree_lock, SX_XLOCKED);
560 savepgrp = p->p_pgrp;
561 PGRP_LOCK(savepgrp);
562 PROC_LOCK(p);
563 LIST_REMOVE(p, p_pglist);
564 p->p_pgrp = NULL;
565 PROC_UNLOCK(p);
566 PGRP_UNLOCK(savepgrp);
567 if (LIST_EMPTY(&savepgrp->pg_members))
568 pgdelete(savepgrp);
569 return (0);
570 }
571
572 /*
573 * delete a process group
574 */
575 static void
pgdelete(pgrp)576 pgdelete(pgrp)
577 register struct pgrp *pgrp;
578 {
579 struct session *savesess;
580 struct tty *tp;
581
582 sx_assert(&proctree_lock, SX_XLOCKED);
583 PGRP_LOCK_ASSERT(pgrp, MA_NOTOWNED);
584 SESS_LOCK_ASSERT(pgrp->pg_session, MA_NOTOWNED);
585
586 /*
587 * Reset any sigio structures pointing to us as a result of
588 * F_SETOWN with our pgid.
589 */
590 funsetownlst(&pgrp->pg_sigiolst);
591
592 PGRP_LOCK(pgrp);
593 tp = pgrp->pg_session->s_ttyp;
594 LIST_REMOVE(pgrp, pg_hash);
595 savesess = pgrp->pg_session;
596 PGRP_UNLOCK(pgrp);
597
598 /* Remove the reference to the pgrp before deallocating it. */
599 if (tp != NULL) {
600 tty_lock(tp);
601 tty_rel_pgrp(tp, pgrp);
602 }
603
604 mtx_destroy(&pgrp->pg_mtx);
605 free(pgrp, M_PGRP);
606 sess_release(savesess);
607 }
608
609 static void
pgadjustjobc(pgrp,entering)610 pgadjustjobc(pgrp, entering)
611 struct pgrp *pgrp;
612 int entering;
613 {
614
615 PGRP_LOCK(pgrp);
616 if (entering)
617 pgrp->pg_jobc++;
618 else {
619 --pgrp->pg_jobc;
620 if (pgrp->pg_jobc == 0)
621 orphanpg(pgrp);
622 }
623 PGRP_UNLOCK(pgrp);
624 }
625
626 /*
627 * Adjust pgrp jobc counters when specified process changes process group.
628 * We count the number of processes in each process group that "qualify"
629 * the group for terminal job control (those with a parent in a different
630 * process group of the same session). If that count reaches zero, the
631 * process group becomes orphaned. Check both the specified process'
632 * process group and that of its children.
633 * entering == 0 => p is leaving specified group.
634 * entering == 1 => p is entering specified group.
635 */
636 void
fixjobc(p,pgrp,entering)637 fixjobc(p, pgrp, entering)
638 register struct proc *p;
639 register struct pgrp *pgrp;
640 int entering;
641 {
642 register struct pgrp *hispgrp;
643 register struct session *mysession;
644
645 sx_assert(&proctree_lock, SX_LOCKED);
646 PROC_LOCK_ASSERT(p, MA_NOTOWNED);
647 PGRP_LOCK_ASSERT(pgrp, MA_NOTOWNED);
648 SESS_LOCK_ASSERT(pgrp->pg_session, MA_NOTOWNED);
649
650 /*
651 * Check p's parent to see whether p qualifies its own process
652 * group; if so, adjust count for p's process group.
653 */
654 mysession = pgrp->pg_session;
655 if ((hispgrp = p->p_pptr->p_pgrp) != pgrp &&
656 hispgrp->pg_session == mysession)
657 pgadjustjobc(pgrp, entering);
658
659 /*
660 * Check this process' children to see whether they qualify
661 * their process groups; if so, adjust counts for children's
662 * process groups.
663 */
664 LIST_FOREACH(p, &p->p_children, p_sibling) {
665 hispgrp = p->p_pgrp;
666 if (hispgrp == pgrp ||
667 hispgrp->pg_session != mysession)
668 continue;
669 PROC_LOCK(p);
670 if (p->p_state == PRS_ZOMBIE) {
671 PROC_UNLOCK(p);
672 continue;
673 }
674 PROC_UNLOCK(p);
675 pgadjustjobc(hispgrp, entering);
676 }
677 }
678
679 /*
680 * A process group has become orphaned;
681 * if there are any stopped processes in the group,
682 * hang-up all process in that group.
683 */
684 static void
orphanpg(pg)685 orphanpg(pg)
686 struct pgrp *pg;
687 {
688 register struct proc *p;
689
690 PGRP_LOCK_ASSERT(pg, MA_OWNED);
691
692 LIST_FOREACH(p, &pg->pg_members, p_pglist) {
693 PROC_LOCK(p);
694 if (P_SHOULDSTOP(p)) {
695 PROC_UNLOCK(p);
696 LIST_FOREACH(p, &pg->pg_members, p_pglist) {
697 PROC_LOCK(p);
698 kern_psignal(p, SIGHUP);
699 kern_psignal(p, SIGCONT);
700 PROC_UNLOCK(p);
701 }
702 return;
703 }
704 PROC_UNLOCK(p);
705 }
706 }
707
708 void
sess_hold(struct session * s)709 sess_hold(struct session *s)
710 {
711
712 refcount_acquire(&s->s_count);
713 }
714
715 void
sess_release(struct session * s)716 sess_release(struct session *s)
717 {
718
719 if (refcount_release(&s->s_count)) {
720 if (s->s_ttyp != NULL) {
721 tty_lock(s->s_ttyp);
722 tty_rel_sess(s->s_ttyp, s);
723 }
724 mtx_destroy(&s->s_mtx);
725 free(s, M_SESSION);
726 }
727 }
728
729 #ifdef DDB
730
DB_SHOW_COMMAND(pgrpdump,pgrpdump)731 DB_SHOW_COMMAND(pgrpdump, pgrpdump)
732 {
733 register struct pgrp *pgrp;
734 register struct proc *p;
735 register int i;
736
737 for (i = 0; i <= pgrphash; i++) {
738 if (!LIST_EMPTY(&pgrphashtbl[i])) {
739 printf("\tindx %d\n", i);
740 LIST_FOREACH(pgrp, &pgrphashtbl[i], pg_hash) {
741 printf(
742 "\tpgrp %p, pgid %ld, sess %p, sesscnt %d, mem %p\n",
743 (void *)pgrp, (long)pgrp->pg_id,
744 (void *)pgrp->pg_session,
745 pgrp->pg_session->s_count,
746 (void *)LIST_FIRST(&pgrp->pg_members));
747 LIST_FOREACH(p, &pgrp->pg_members, p_pglist) {
748 printf("\t\tpid %ld addr %p pgrp %p\n",
749 (long)p->p_pid, (void *)p,
750 (void *)p->p_pgrp);
751 }
752 }
753 }
754 }
755 }
756 #endif /* DDB */
757
758 /*
759 * Calculate the kinfo_proc members which contain process-wide
760 * informations.
761 * Must be called with the target process locked.
762 */
763 static void
fill_kinfo_aggregate(struct proc * p,struct kinfo_proc * kp)764 fill_kinfo_aggregate(struct proc *p, struct kinfo_proc *kp)
765 {
766 struct thread *td;
767
768 PROC_LOCK_ASSERT(p, MA_OWNED);
769
770 kp->ki_estcpu = 0;
771 kp->ki_pctcpu = 0;
772 FOREACH_THREAD_IN_PROC(p, td) {
773 thread_lock(td);
774 kp->ki_pctcpu += sched_pctcpu(td);
775 kp->ki_estcpu += td->td_estcpu;
776 thread_unlock(td);
777 }
778 }
779
780 /*
781 * Clear kinfo_proc and fill in any information that is common
782 * to all threads in the process.
783 * Must be called with the target process locked.
784 */
785 static void
fill_kinfo_proc_only(struct proc * p,struct kinfo_proc * kp)786 fill_kinfo_proc_only(struct proc *p, struct kinfo_proc *kp)
787 {
788 struct thread *td0;
789 struct tty *tp;
790 struct session *sp;
791 struct ucred *cred;
792 struct sigacts *ps;
793
794 PROC_LOCK_ASSERT(p, MA_OWNED);
795 bzero(kp, sizeof(*kp));
796
797 kp->ki_structsize = sizeof(*kp);
798 kp->ki_paddr = p;
799 kp->ki_addr =/* p->p_addr; */0; /* XXX */
800 kp->ki_args = p->p_args;
801 kp->ki_textvp = p->p_textvp;
802 #ifdef KTRACE
803 kp->ki_tracep = p->p_tracevp;
804 kp->ki_traceflag = p->p_traceflag;
805 #endif
806 kp->ki_fd = p->p_fd;
807 kp->ki_vmspace = p->p_vmspace;
808 kp->ki_flag = p->p_flag;
809 kp->ki_flag2 = p->p_flag2;
810 cred = p->p_ucred;
811 if (cred) {
812 kp->ki_uid = cred->cr_uid;
813 kp->ki_ruid = cred->cr_ruid;
814 kp->ki_svuid = cred->cr_svuid;
815 kp->ki_cr_flags = 0;
816 if (cred->cr_flags & CRED_FLAG_CAPMODE)
817 kp->ki_cr_flags |= KI_CRF_CAPABILITY_MODE;
818 /* XXX bde doesn't like KI_NGROUPS */
819 if (cred->cr_ngroups > KI_NGROUPS) {
820 kp->ki_ngroups = KI_NGROUPS;
821 kp->ki_cr_flags |= KI_CRF_GRP_OVERFLOW;
822 } else
823 kp->ki_ngroups = cred->cr_ngroups;
824 bcopy(cred->cr_groups, kp->ki_groups,
825 kp->ki_ngroups * sizeof(gid_t));
826 kp->ki_rgid = cred->cr_rgid;
827 kp->ki_svgid = cred->cr_svgid;
828 /* If jailed(cred), emulate the old P_JAILED flag. */
829 if (jailed(cred)) {
830 kp->ki_flag |= P_JAILED;
831 /* If inside the jail, use 0 as a jail ID. */
832 if (cred->cr_prison != curthread->td_ucred->cr_prison)
833 kp->ki_jid = cred->cr_prison->pr_id;
834 }
835 strlcpy(kp->ki_loginclass, cred->cr_loginclass->lc_name,
836 sizeof(kp->ki_loginclass));
837 }
838 ps = p->p_sigacts;
839 if (ps) {
840 mtx_lock(&ps->ps_mtx);
841 kp->ki_sigignore = ps->ps_sigignore;
842 kp->ki_sigcatch = ps->ps_sigcatch;
843 mtx_unlock(&ps->ps_mtx);
844 }
845 if (p->p_state != PRS_NEW &&
846 p->p_state != PRS_ZOMBIE &&
847 p->p_vmspace != NULL) {
848 struct vmspace *vm = p->p_vmspace;
849
850 kp->ki_size = vm->vm_map.size;
851 kp->ki_rssize = vmspace_resident_count(vm); /*XXX*/
852 FOREACH_THREAD_IN_PROC(p, td0) {
853 if (!TD_IS_SWAPPED(td0))
854 kp->ki_rssize += td0->td_kstack_pages;
855 }
856 kp->ki_swrss = vm->vm_swrss;
857 kp->ki_tsize = vm->vm_tsize;
858 kp->ki_dsize = vm->vm_dsize;
859 kp->ki_ssize = vm->vm_ssize;
860 } else if (p->p_state == PRS_ZOMBIE)
861 kp->ki_stat = SZOMB;
862 if (kp->ki_flag & P_INMEM)
863 kp->ki_sflag = PS_INMEM;
864 else
865 kp->ki_sflag = 0;
866 /* Calculate legacy swtime as seconds since 'swtick'. */
867 kp->ki_swtime = (ticks - p->p_swtick) / hz;
868 kp->ki_pid = p->p_pid;
869 kp->ki_nice = p->p_nice;
870 kp->ki_fibnum = p->p_fibnum;
871 kp->ki_start = p->p_stats->p_start;
872 timevaladd(&kp->ki_start, &boottime);
873 PROC_SLOCK(p);
874 rufetch(p, &kp->ki_rusage);
875 kp->ki_runtime = cputick2usec(p->p_rux.rux_runtime);
876 calcru(p, &kp->ki_rusage.ru_utime, &kp->ki_rusage.ru_stime);
877 PROC_SUNLOCK(p);
878 calccru(p, &kp->ki_childutime, &kp->ki_childstime);
879 /* Some callers want child times in a single value. */
880 kp->ki_childtime = kp->ki_childstime;
881 timevaladd(&kp->ki_childtime, &kp->ki_childutime);
882
883 FOREACH_THREAD_IN_PROC(p, td0)
884 kp->ki_cow += td0->td_cow;
885
886 tp = NULL;
887 if (p->p_pgrp) {
888 kp->ki_pgid = p->p_pgrp->pg_id;
889 kp->ki_jobc = p->p_pgrp->pg_jobc;
890 sp = p->p_pgrp->pg_session;
891
892 if (sp != NULL) {
893 kp->ki_sid = sp->s_sid;
894 SESS_LOCK(sp);
895 strlcpy(kp->ki_login, sp->s_login,
896 sizeof(kp->ki_login));
897 if (sp->s_ttyvp)
898 kp->ki_kiflag |= KI_CTTY;
899 if (SESS_LEADER(p))
900 kp->ki_kiflag |= KI_SLEADER;
901 /* XXX proctree_lock */
902 tp = sp->s_ttyp;
903 SESS_UNLOCK(sp);
904 }
905 }
906 if ((p->p_flag & P_CONTROLT) && tp != NULL) {
907 kp->ki_tdev = tty_udev(tp);
908 kp->ki_tpgid = tp->t_pgrp ? tp->t_pgrp->pg_id : NO_PID;
909 if (tp->t_session)
910 kp->ki_tsid = tp->t_session->s_sid;
911 } else
912 kp->ki_tdev = NODEV;
913 if (p->p_comm[0] != '\0')
914 strlcpy(kp->ki_comm, p->p_comm, sizeof(kp->ki_comm));
915 if (p->p_sysent && p->p_sysent->sv_name != NULL &&
916 p->p_sysent->sv_name[0] != '\0')
917 strlcpy(kp->ki_emul, p->p_sysent->sv_name, sizeof(kp->ki_emul));
918 kp->ki_siglist = p->p_siglist;
919 kp->ki_xstat = p->p_xstat;
920 kp->ki_acflag = p->p_acflag;
921 kp->ki_lock = p->p_lock;
922 if (p->p_pptr)
923 kp->ki_ppid = p->p_pptr->p_pid;
924 }
925
926 /*
927 * Fill in information that is thread specific. Must be called with
928 * target process locked. If 'preferthread' is set, overwrite certain
929 * process-related fields that are maintained for both threads and
930 * processes.
931 */
932 static void
fill_kinfo_thread(struct thread * td,struct kinfo_proc * kp,int preferthread)933 fill_kinfo_thread(struct thread *td, struct kinfo_proc *kp, int preferthread)
934 {
935 struct proc *p;
936
937 p = td->td_proc;
938 kp->ki_tdaddr = td;
939 PROC_LOCK_ASSERT(p, MA_OWNED);
940
941 if (preferthread)
942 PROC_SLOCK(p);
943 thread_lock(td);
944 if (td->td_wmesg != NULL)
945 strlcpy(kp->ki_wmesg, td->td_wmesg, sizeof(kp->ki_wmesg));
946 else
947 bzero(kp->ki_wmesg, sizeof(kp->ki_wmesg));
948 strlcpy(kp->ki_tdname, td->td_name, sizeof(kp->ki_tdname));
949 if (TD_ON_LOCK(td)) {
950 kp->ki_kiflag |= KI_LOCKBLOCK;
951 strlcpy(kp->ki_lockname, td->td_lockname,
952 sizeof(kp->ki_lockname));
953 } else {
954 kp->ki_kiflag &= ~KI_LOCKBLOCK;
955 bzero(kp->ki_lockname, sizeof(kp->ki_lockname));
956 }
957
958 if (p->p_state == PRS_NORMAL) { /* approximate. */
959 if (TD_ON_RUNQ(td) ||
960 TD_CAN_RUN(td) ||
961 TD_IS_RUNNING(td)) {
962 kp->ki_stat = SRUN;
963 } else if (P_SHOULDSTOP(p)) {
964 kp->ki_stat = SSTOP;
965 } else if (TD_IS_SLEEPING(td)) {
966 kp->ki_stat = SSLEEP;
967 } else if (TD_ON_LOCK(td)) {
968 kp->ki_stat = SLOCK;
969 } else {
970 kp->ki_stat = SWAIT;
971 }
972 } else if (p->p_state == PRS_ZOMBIE) {
973 kp->ki_stat = SZOMB;
974 } else {
975 kp->ki_stat = SIDL;
976 }
977
978 /* Things in the thread */
979 kp->ki_wchan = td->td_wchan;
980 kp->ki_pri.pri_level = td->td_priority;
981 kp->ki_pri.pri_native = td->td_base_pri;
982 kp->ki_lastcpu = td->td_lastcpu;
983 kp->ki_oncpu = td->td_oncpu;
984 kp->ki_tdflags = td->td_flags;
985 kp->ki_tid = td->td_tid;
986 kp->ki_numthreads = p->p_numthreads;
987 kp->ki_pcb = td->td_pcb;
988 kp->ki_kstack = (void *)td->td_kstack;
989 kp->ki_slptime = (ticks - td->td_slptick) / hz;
990 kp->ki_pri.pri_class = td->td_pri_class;
991 kp->ki_pri.pri_user = td->td_user_pri;
992
993 if (preferthread) {
994 rufetchtd(td, &kp->ki_rusage);
995 kp->ki_runtime = cputick2usec(td->td_rux.rux_runtime);
996 kp->ki_pctcpu = sched_pctcpu(td);
997 kp->ki_estcpu = td->td_estcpu;
998 kp->ki_cow = td->td_cow;
999 }
1000
1001 /* We can't get this anymore but ps etc never used it anyway. */
1002 kp->ki_rqindex = 0;
1003
1004 if (preferthread)
1005 kp->ki_siglist = td->td_siglist;
1006 kp->ki_sigmask = td->td_sigmask;
1007 thread_unlock(td);
1008 if (preferthread)
1009 PROC_SUNLOCK(p);
1010 }
1011
1012 /*
1013 * Fill in a kinfo_proc structure for the specified process.
1014 * Must be called with the target process locked.
1015 */
1016 void
fill_kinfo_proc(struct proc * p,struct kinfo_proc * kp)1017 fill_kinfo_proc(struct proc *p, struct kinfo_proc *kp)
1018 {
1019
1020 MPASS(FIRST_THREAD_IN_PROC(p) != NULL);
1021
1022 fill_kinfo_proc_only(p, kp);
1023 fill_kinfo_thread(FIRST_THREAD_IN_PROC(p), kp, 0);
1024 fill_kinfo_aggregate(p, kp);
1025 }
1026
1027 struct pstats *
pstats_alloc(void)1028 pstats_alloc(void)
1029 {
1030
1031 return (malloc(sizeof(struct pstats), M_SUBPROC, M_ZERO|M_WAITOK));
1032 }
1033
1034 /*
1035 * Copy parts of p_stats; zero the rest of p_stats (statistics).
1036 */
1037 void
pstats_fork(struct pstats * src,struct pstats * dst)1038 pstats_fork(struct pstats *src, struct pstats *dst)
1039 {
1040
1041 bzero(&dst->pstat_startzero,
1042 __rangeof(struct pstats, pstat_startzero, pstat_endzero));
1043 bcopy(&src->pstat_startcopy, &dst->pstat_startcopy,
1044 __rangeof(struct pstats, pstat_startcopy, pstat_endcopy));
1045 }
1046
1047 void
pstats_free(struct pstats * ps)1048 pstats_free(struct pstats *ps)
1049 {
1050
1051 free(ps, M_SUBPROC);
1052 }
1053
1054 static struct proc *
zpfind_locked(pid_t pid)1055 zpfind_locked(pid_t pid)
1056 {
1057 struct proc *p;
1058
1059 sx_assert(&allproc_lock, SX_LOCKED);
1060 LIST_FOREACH(p, &zombproc, p_list) {
1061 if (p->p_pid == pid) {
1062 PROC_LOCK(p);
1063 break;
1064 }
1065 }
1066 return (p);
1067 }
1068
1069 /*
1070 * Locate a zombie process by number
1071 */
1072 struct proc *
zpfind(pid_t pid)1073 zpfind(pid_t pid)
1074 {
1075 struct proc *p;
1076
1077 sx_slock(&allproc_lock);
1078 p = zpfind_locked(pid);
1079 sx_sunlock(&allproc_lock);
1080 return (p);
1081 }
1082
1083 #ifdef COMPAT_FREEBSD32
1084
1085 /*
1086 * This function is typically used to copy out the kernel address, so
1087 * it can be replaced by assignment of zero.
1088 */
1089 static inline uint32_t
ptr32_trim(void * ptr)1090 ptr32_trim(void *ptr)
1091 {
1092 uintptr_t uptr;
1093
1094 uptr = (uintptr_t)ptr;
1095 return ((uptr > UINT_MAX) ? 0 : uptr);
1096 }
1097
1098 #define PTRTRIM_CP(src,dst,fld) \
1099 do { (dst).fld = ptr32_trim((src).fld); } while (0)
1100
1101 static void
freebsd32_kinfo_proc_out(const struct kinfo_proc * ki,struct kinfo_proc32 * ki32)1102 freebsd32_kinfo_proc_out(const struct kinfo_proc *ki, struct kinfo_proc32 *ki32)
1103 {
1104 int i;
1105
1106 bzero(ki32, sizeof(struct kinfo_proc32));
1107 ki32->ki_structsize = sizeof(struct kinfo_proc32);
1108 CP(*ki, *ki32, ki_layout);
1109 PTRTRIM_CP(*ki, *ki32, ki_args);
1110 PTRTRIM_CP(*ki, *ki32, ki_paddr);
1111 PTRTRIM_CP(*ki, *ki32, ki_addr);
1112 PTRTRIM_CP(*ki, *ki32, ki_tracep);
1113 PTRTRIM_CP(*ki, *ki32, ki_textvp);
1114 PTRTRIM_CP(*ki, *ki32, ki_fd);
1115 PTRTRIM_CP(*ki, *ki32, ki_vmspace);
1116 PTRTRIM_CP(*ki, *ki32, ki_wchan);
1117 CP(*ki, *ki32, ki_pid);
1118 CP(*ki, *ki32, ki_ppid);
1119 CP(*ki, *ki32, ki_pgid);
1120 CP(*ki, *ki32, ki_tpgid);
1121 CP(*ki, *ki32, ki_sid);
1122 CP(*ki, *ki32, ki_tsid);
1123 CP(*ki, *ki32, ki_jobc);
1124 CP(*ki, *ki32, ki_tdev);
1125 CP(*ki, *ki32, ki_siglist);
1126 CP(*ki, *ki32, ki_sigmask);
1127 CP(*ki, *ki32, ki_sigignore);
1128 CP(*ki, *ki32, ki_sigcatch);
1129 CP(*ki, *ki32, ki_uid);
1130 CP(*ki, *ki32, ki_ruid);
1131 CP(*ki, *ki32, ki_svuid);
1132 CP(*ki, *ki32, ki_rgid);
1133 CP(*ki, *ki32, ki_svgid);
1134 CP(*ki, *ki32, ki_ngroups);
1135 for (i = 0; i < KI_NGROUPS; i++)
1136 CP(*ki, *ki32, ki_groups[i]);
1137 CP(*ki, *ki32, ki_size);
1138 CP(*ki, *ki32, ki_rssize);
1139 CP(*ki, *ki32, ki_swrss);
1140 CP(*ki, *ki32, ki_tsize);
1141 CP(*ki, *ki32, ki_dsize);
1142 CP(*ki, *ki32, ki_ssize);
1143 CP(*ki, *ki32, ki_xstat);
1144 CP(*ki, *ki32, ki_acflag);
1145 CP(*ki, *ki32, ki_pctcpu);
1146 CP(*ki, *ki32, ki_estcpu);
1147 CP(*ki, *ki32, ki_slptime);
1148 CP(*ki, *ki32, ki_swtime);
1149 CP(*ki, *ki32, ki_cow);
1150 CP(*ki, *ki32, ki_runtime);
1151 TV_CP(*ki, *ki32, ki_start);
1152 TV_CP(*ki, *ki32, ki_childtime);
1153 CP(*ki, *ki32, ki_flag);
1154 CP(*ki, *ki32, ki_kiflag);
1155 CP(*ki, *ki32, ki_traceflag);
1156 CP(*ki, *ki32, ki_stat);
1157 CP(*ki, *ki32, ki_nice);
1158 CP(*ki, *ki32, ki_lock);
1159 CP(*ki, *ki32, ki_rqindex);
1160 CP(*ki, *ki32, ki_oncpu);
1161 CP(*ki, *ki32, ki_lastcpu);
1162 bcopy(ki->ki_tdname, ki32->ki_tdname, TDNAMLEN + 1);
1163 bcopy(ki->ki_wmesg, ki32->ki_wmesg, WMESGLEN + 1);
1164 bcopy(ki->ki_login, ki32->ki_login, LOGNAMELEN + 1);
1165 bcopy(ki->ki_lockname, ki32->ki_lockname, LOCKNAMELEN + 1);
1166 bcopy(ki->ki_comm, ki32->ki_comm, COMMLEN + 1);
1167 bcopy(ki->ki_emul, ki32->ki_emul, KI_EMULNAMELEN + 1);
1168 bcopy(ki->ki_loginclass, ki32->ki_loginclass, LOGINCLASSLEN + 1);
1169 CP(*ki, *ki32, ki_flag2);
1170 CP(*ki, *ki32, ki_fibnum);
1171 CP(*ki, *ki32, ki_cr_flags);
1172 CP(*ki, *ki32, ki_jid);
1173 CP(*ki, *ki32, ki_numthreads);
1174 CP(*ki, *ki32, ki_tid);
1175 CP(*ki, *ki32, ki_pri);
1176 freebsd32_rusage_out(&ki->ki_rusage, &ki32->ki_rusage);
1177 freebsd32_rusage_out(&ki->ki_rusage_ch, &ki32->ki_rusage_ch);
1178 PTRTRIM_CP(*ki, *ki32, ki_pcb);
1179 PTRTRIM_CP(*ki, *ki32, ki_kstack);
1180 PTRTRIM_CP(*ki, *ki32, ki_udata);
1181 CP(*ki, *ki32, ki_sflag);
1182 CP(*ki, *ki32, ki_tdflags);
1183 }
1184 #endif
1185
1186 int
kern_proc_out(struct proc * p,struct sbuf * sb,int flags)1187 kern_proc_out(struct proc *p, struct sbuf *sb, int flags)
1188 {
1189 struct thread *td;
1190 struct kinfo_proc ki;
1191 #ifdef COMPAT_FREEBSD32
1192 struct kinfo_proc32 ki32;
1193 #endif
1194 int error;
1195
1196 PROC_LOCK_ASSERT(p, MA_OWNED);
1197 MPASS(FIRST_THREAD_IN_PROC(p) != NULL);
1198
1199 error = 0;
1200 fill_kinfo_proc(p, &ki);
1201 if ((flags & KERN_PROC_NOTHREADS) != 0) {
1202 #ifdef COMPAT_FREEBSD32
1203 if ((flags & KERN_PROC_MASK32) != 0) {
1204 freebsd32_kinfo_proc_out(&ki, &ki32);
1205 if (sbuf_bcat(sb, &ki32, sizeof(ki32)) != 0)
1206 error = ENOMEM;
1207 } else
1208 #endif
1209 if (sbuf_bcat(sb, &ki, sizeof(ki)) != 0)
1210 error = ENOMEM;
1211 } else {
1212 FOREACH_THREAD_IN_PROC(p, td) {
1213 fill_kinfo_thread(td, &ki, 1);
1214 #ifdef COMPAT_FREEBSD32
1215 if ((flags & KERN_PROC_MASK32) != 0) {
1216 freebsd32_kinfo_proc_out(&ki, &ki32);
1217 if (sbuf_bcat(sb, &ki32, sizeof(ki32)) != 0)
1218 error = ENOMEM;
1219 } else
1220 #endif
1221 if (sbuf_bcat(sb, &ki, sizeof(ki)) != 0)
1222 error = ENOMEM;
1223 if (error != 0)
1224 break;
1225 }
1226 }
1227 PROC_UNLOCK(p);
1228 return (error);
1229 }
1230
1231 static int
sysctl_out_proc(struct proc * p,struct sysctl_req * req,int flags,int doingzomb)1232 sysctl_out_proc(struct proc *p, struct sysctl_req *req, int flags,
1233 int doingzomb)
1234 {
1235 struct sbuf sb;
1236 struct kinfo_proc ki;
1237 struct proc *np;
1238 int error, error2;
1239 pid_t pid;
1240
1241 pid = p->p_pid;
1242 sbuf_new_for_sysctl(&sb, (char *)&ki, sizeof(ki), req);
1243 error = kern_proc_out(p, &sb, flags);
1244 error2 = sbuf_finish(&sb);
1245 sbuf_delete(&sb);
1246 if (error != 0)
1247 return (error);
1248 else if (error2 != 0)
1249 return (error2);
1250 if (doingzomb)
1251 np = zpfind(pid);
1252 else {
1253 if (pid == 0)
1254 return (0);
1255 np = pfind(pid);
1256 }
1257 if (np == NULL)
1258 return (ESRCH);
1259 if (np != p) {
1260 PROC_UNLOCK(np);
1261 return (ESRCH);
1262 }
1263 PROC_UNLOCK(np);
1264 return (0);
1265 }
1266
1267 static int
sysctl_kern_proc(SYSCTL_HANDLER_ARGS)1268 sysctl_kern_proc(SYSCTL_HANDLER_ARGS)
1269 {
1270 int *name = (int *)arg1;
1271 u_int namelen = arg2;
1272 struct proc *p;
1273 int flags, doingzomb, oid_number;
1274 int error = 0;
1275
1276 oid_number = oidp->oid_number;
1277 if (oid_number != KERN_PROC_ALL &&
1278 (oid_number & KERN_PROC_INC_THREAD) == 0)
1279 flags = KERN_PROC_NOTHREADS;
1280 else {
1281 flags = 0;
1282 oid_number &= ~KERN_PROC_INC_THREAD;
1283 }
1284 #ifdef COMPAT_FREEBSD32
1285 if (req->flags & SCTL_MASK32)
1286 flags |= KERN_PROC_MASK32;
1287 #endif
1288 if (oid_number == KERN_PROC_PID) {
1289 if (namelen != 1)
1290 return (EINVAL);
1291 error = sysctl_wire_old_buffer(req, 0);
1292 if (error)
1293 return (error);
1294 error = pget((pid_t)name[0], PGET_CANSEE, &p);
1295 if (error != 0)
1296 return (error);
1297 error = sysctl_out_proc(p, req, flags, 0);
1298 return (error);
1299 }
1300
1301 switch (oid_number) {
1302 case KERN_PROC_ALL:
1303 if (namelen != 0)
1304 return (EINVAL);
1305 break;
1306 case KERN_PROC_PROC:
1307 if (namelen != 0 && namelen != 1)
1308 return (EINVAL);
1309 break;
1310 default:
1311 if (namelen != 1)
1312 return (EINVAL);
1313 break;
1314 }
1315
1316 if (!req->oldptr) {
1317 /* overestimate by 5 procs */
1318 error = SYSCTL_OUT(req, 0, sizeof (struct kinfo_proc) * 5);
1319 if (error)
1320 return (error);
1321 }
1322 error = sysctl_wire_old_buffer(req, 0);
1323 if (error != 0)
1324 return (error);
1325 sx_slock(&allproc_lock);
1326 for (doingzomb=0 ; doingzomb < 2 ; doingzomb++) {
1327 if (!doingzomb)
1328 p = LIST_FIRST(&allproc);
1329 else
1330 p = LIST_FIRST(&zombproc);
1331 for (; p != 0; p = LIST_NEXT(p, p_list)) {
1332 /*
1333 * Skip embryonic processes.
1334 */
1335 PROC_LOCK(p);
1336 if (p->p_state == PRS_NEW) {
1337 PROC_UNLOCK(p);
1338 continue;
1339 }
1340 KASSERT(p->p_ucred != NULL,
1341 ("process credential is NULL for non-NEW proc"));
1342 /*
1343 * Show a user only appropriate processes.
1344 */
1345 if (p_cansee(curthread, p)) {
1346 PROC_UNLOCK(p);
1347 continue;
1348 }
1349 /*
1350 * TODO - make more efficient (see notes below).
1351 * do by session.
1352 */
1353 switch (oid_number) {
1354
1355 case KERN_PROC_GID:
1356 if (p->p_ucred->cr_gid != (gid_t)name[0]) {
1357 PROC_UNLOCK(p);
1358 continue;
1359 }
1360 break;
1361
1362 case KERN_PROC_PGRP:
1363 /* could do this by traversing pgrp */
1364 if (p->p_pgrp == NULL ||
1365 p->p_pgrp->pg_id != (pid_t)name[0]) {
1366 PROC_UNLOCK(p);
1367 continue;
1368 }
1369 break;
1370
1371 case KERN_PROC_RGID:
1372 if (p->p_ucred->cr_rgid != (gid_t)name[0]) {
1373 PROC_UNLOCK(p);
1374 continue;
1375 }
1376 break;
1377
1378 case KERN_PROC_SESSION:
1379 if (p->p_session == NULL ||
1380 p->p_session->s_sid != (pid_t)name[0]) {
1381 PROC_UNLOCK(p);
1382 continue;
1383 }
1384 break;
1385
1386 case KERN_PROC_TTY:
1387 if ((p->p_flag & P_CONTROLT) == 0 ||
1388 p->p_session == NULL) {
1389 PROC_UNLOCK(p);
1390 continue;
1391 }
1392 /* XXX proctree_lock */
1393 SESS_LOCK(p->p_session);
1394 if (p->p_session->s_ttyp == NULL ||
1395 tty_udev(p->p_session->s_ttyp) !=
1396 (dev_t)name[0]) {
1397 SESS_UNLOCK(p->p_session);
1398 PROC_UNLOCK(p);
1399 continue;
1400 }
1401 SESS_UNLOCK(p->p_session);
1402 break;
1403
1404 case KERN_PROC_UID:
1405 if (p->p_ucred->cr_uid != (uid_t)name[0]) {
1406 PROC_UNLOCK(p);
1407 continue;
1408 }
1409 break;
1410
1411 case KERN_PROC_RUID:
1412 if (p->p_ucred->cr_ruid != (uid_t)name[0]) {
1413 PROC_UNLOCK(p);
1414 continue;
1415 }
1416 break;
1417
1418 case KERN_PROC_PROC:
1419 break;
1420
1421 default:
1422 break;
1423
1424 }
1425
1426 error = sysctl_out_proc(p, req, flags, doingzomb);
1427 if (error) {
1428 sx_sunlock(&allproc_lock);
1429 return (error);
1430 }
1431 }
1432 }
1433 sx_sunlock(&allproc_lock);
1434 return (0);
1435 }
1436
1437 struct pargs *
pargs_alloc(int len)1438 pargs_alloc(int len)
1439 {
1440 struct pargs *pa;
1441
1442 pa = malloc(sizeof(struct pargs) + len, M_PARGS,
1443 M_WAITOK);
1444 refcount_init(&pa->ar_ref, 1);
1445 pa->ar_length = len;
1446 return (pa);
1447 }
1448
1449 static void
pargs_free(struct pargs * pa)1450 pargs_free(struct pargs *pa)
1451 {
1452
1453 free(pa, M_PARGS);
1454 }
1455
1456 void
pargs_hold(struct pargs * pa)1457 pargs_hold(struct pargs *pa)
1458 {
1459
1460 if (pa == NULL)
1461 return;
1462 refcount_acquire(&pa->ar_ref);
1463 }
1464
1465 void
pargs_drop(struct pargs * pa)1466 pargs_drop(struct pargs *pa)
1467 {
1468
1469 if (pa == NULL)
1470 return;
1471 if (refcount_release(&pa->ar_ref))
1472 pargs_free(pa);
1473 }
1474
1475 static int
proc_read_mem(struct thread * td,struct proc * p,vm_offset_t offset,void * buf,size_t len)1476 proc_read_mem(struct thread *td, struct proc *p, vm_offset_t offset, void* buf,
1477 size_t len)
1478 {
1479 struct iovec iov;
1480 struct uio uio;
1481
1482 iov.iov_base = (caddr_t)buf;
1483 iov.iov_len = len;
1484 uio.uio_iov = &iov;
1485 uio.uio_iovcnt = 1;
1486 uio.uio_offset = offset;
1487 uio.uio_resid = (ssize_t)len;
1488 uio.uio_segflg = UIO_SYSSPACE;
1489 uio.uio_rw = UIO_READ;
1490 uio.uio_td = td;
1491
1492 return (proc_rwmem(p, &uio));
1493 }
1494
1495 static int
proc_read_string(struct thread * td,struct proc * p,const char * sptr,char * buf,size_t len)1496 proc_read_string(struct thread *td, struct proc *p, const char *sptr, char *buf,
1497 size_t len)
1498 {
1499 size_t i;
1500 int error;
1501
1502 error = proc_read_mem(td, p, (vm_offset_t)sptr, buf, len);
1503 /*
1504 * Reading the chunk may validly return EFAULT if the string is shorter
1505 * than the chunk and is aligned at the end of the page, assuming the
1506 * next page is not mapped. So if EFAULT is returned do a fallback to
1507 * one byte read loop.
1508 */
1509 if (error == EFAULT) {
1510 for (i = 0; i < len; i++, buf++, sptr++) {
1511 error = proc_read_mem(td, p, (vm_offset_t)sptr, buf, 1);
1512 if (error != 0)
1513 return (error);
1514 if (*buf == '\0')
1515 break;
1516 }
1517 error = 0;
1518 }
1519 return (error);
1520 }
1521
1522 #define PROC_AUXV_MAX 256 /* Safety limit on auxv size. */
1523
1524 enum proc_vector_type {
1525 PROC_ARG,
1526 PROC_ENV,
1527 PROC_AUX,
1528 };
1529
1530 #ifdef COMPAT_FREEBSD32
1531 static int
get_proc_vector32(struct thread * td,struct proc * p,char *** proc_vectorp,size_t * vsizep,enum proc_vector_type type)1532 get_proc_vector32(struct thread *td, struct proc *p, char ***proc_vectorp,
1533 size_t *vsizep, enum proc_vector_type type)
1534 {
1535 struct freebsd32_ps_strings pss;
1536 Elf32_Auxinfo aux;
1537 vm_offset_t vptr, ptr;
1538 uint32_t *proc_vector32;
1539 char **proc_vector;
1540 size_t vsize, size;
1541 int i, error;
1542
1543 error = proc_read_mem(td, p, (vm_offset_t)(p->p_sysent->sv_psstrings),
1544 &pss, sizeof(pss));
1545 if (error != 0)
1546 return (error);
1547 switch (type) {
1548 case PROC_ARG:
1549 vptr = (vm_offset_t)PTRIN(pss.ps_argvstr);
1550 vsize = pss.ps_nargvstr;
1551 if (vsize > ARG_MAX)
1552 return (ENOEXEC);
1553 size = vsize * sizeof(int32_t);
1554 break;
1555 case PROC_ENV:
1556 vptr = (vm_offset_t)PTRIN(pss.ps_envstr);
1557 vsize = pss.ps_nenvstr;
1558 if (vsize > ARG_MAX)
1559 return (ENOEXEC);
1560 size = vsize * sizeof(int32_t);
1561 break;
1562 case PROC_AUX:
1563 vptr = (vm_offset_t)PTRIN(pss.ps_envstr) +
1564 (pss.ps_nenvstr + 1) * sizeof(int32_t);
1565 if (vptr % 4 != 0)
1566 return (ENOEXEC);
1567 for (ptr = vptr, i = 0; i < PROC_AUXV_MAX; i++) {
1568 error = proc_read_mem(td, p, ptr, &aux, sizeof(aux));
1569 if (error != 0)
1570 return (error);
1571 if (aux.a_type == AT_NULL)
1572 break;
1573 ptr += sizeof(aux);
1574 }
1575 if (aux.a_type != AT_NULL)
1576 return (ENOEXEC);
1577 vsize = i + 1;
1578 size = vsize * sizeof(aux);
1579 break;
1580 default:
1581 KASSERT(0, ("Wrong proc vector type: %d", type));
1582 return (EINVAL);
1583 }
1584 proc_vector32 = malloc(size, M_TEMP, M_WAITOK);
1585 error = proc_read_mem(td, p, vptr, proc_vector32, size);
1586 if (error != 0)
1587 goto done;
1588 if (type == PROC_AUX) {
1589 *proc_vectorp = (char **)proc_vector32;
1590 *vsizep = vsize;
1591 return (0);
1592 }
1593 proc_vector = malloc(vsize * sizeof(char *), M_TEMP, M_WAITOK);
1594 for (i = 0; i < (int)vsize; i++)
1595 proc_vector[i] = PTRIN(proc_vector32[i]);
1596 *proc_vectorp = proc_vector;
1597 *vsizep = vsize;
1598 done:
1599 free(proc_vector32, M_TEMP);
1600 return (error);
1601 }
1602 #endif
1603
1604 static int
get_proc_vector(struct thread * td,struct proc * p,char *** proc_vectorp,size_t * vsizep,enum proc_vector_type type)1605 get_proc_vector(struct thread *td, struct proc *p, char ***proc_vectorp,
1606 size_t *vsizep, enum proc_vector_type type)
1607 {
1608 struct ps_strings pss;
1609 Elf_Auxinfo aux;
1610 vm_offset_t vptr, ptr;
1611 char **proc_vector;
1612 size_t vsize, size;
1613 int error, i;
1614
1615 #ifdef COMPAT_FREEBSD32
1616 if (SV_PROC_FLAG(p, SV_ILP32) != 0)
1617 return (get_proc_vector32(td, p, proc_vectorp, vsizep, type));
1618 #endif
1619 error = proc_read_mem(td, p, (vm_offset_t)(p->p_sysent->sv_psstrings),
1620 &pss, sizeof(pss));
1621 if (error != 0)
1622 return (error);
1623 switch (type) {
1624 case PROC_ARG:
1625 vptr = (vm_offset_t)pss.ps_argvstr;
1626 vsize = pss.ps_nargvstr;
1627 if (vsize > ARG_MAX)
1628 return (ENOEXEC);
1629 size = vsize * sizeof(char *);
1630 break;
1631 case PROC_ENV:
1632 vptr = (vm_offset_t)pss.ps_envstr;
1633 vsize = pss.ps_nenvstr;
1634 if (vsize > ARG_MAX)
1635 return (ENOEXEC);
1636 size = vsize * sizeof(char *);
1637 break;
1638 case PROC_AUX:
1639 /*
1640 * The aux array is just above env array on the stack. Check
1641 * that the address is naturally aligned.
1642 */
1643 vptr = (vm_offset_t)pss.ps_envstr + (pss.ps_nenvstr + 1)
1644 * sizeof(char *);
1645 #if __ELF_WORD_SIZE == 64
1646 if (vptr % sizeof(uint64_t) != 0)
1647 #else
1648 if (vptr % sizeof(uint32_t) != 0)
1649 #endif
1650 return (ENOEXEC);
1651 /*
1652 * We count the array size reading the aux vectors from the
1653 * stack until AT_NULL vector is returned. So (to keep the code
1654 * simple) we read the process stack twice: the first time here
1655 * to find the size and the second time when copying the vectors
1656 * to the allocated proc_vector.
1657 */
1658 for (ptr = vptr, i = 0; i < PROC_AUXV_MAX; i++) {
1659 error = proc_read_mem(td, p, ptr, &aux, sizeof(aux));
1660 if (error != 0)
1661 return (error);
1662 if (aux.a_type == AT_NULL)
1663 break;
1664 ptr += sizeof(aux);
1665 }
1666 /*
1667 * If the PROC_AUXV_MAX entries are iterated over, and we have
1668 * not reached AT_NULL, it is most likely we are reading wrong
1669 * data: either the process doesn't have auxv array or data has
1670 * been modified. Return the error in this case.
1671 */
1672 if (aux.a_type != AT_NULL)
1673 return (ENOEXEC);
1674 vsize = i + 1;
1675 size = vsize * sizeof(aux);
1676 break;
1677 default:
1678 KASSERT(0, ("Wrong proc vector type: %d", type));
1679 return (EINVAL); /* In case we are built without INVARIANTS. */
1680 }
1681 proc_vector = malloc(size, M_TEMP, M_WAITOK);
1682 if (proc_vector == NULL)
1683 return (ENOMEM);
1684 error = proc_read_mem(td, p, vptr, proc_vector, size);
1685 if (error != 0) {
1686 free(proc_vector, M_TEMP);
1687 return (error);
1688 }
1689 *proc_vectorp = proc_vector;
1690 *vsizep = vsize;
1691
1692 return (0);
1693 }
1694
1695 #define GET_PS_STRINGS_CHUNK_SZ 256 /* Chunk size (bytes) for ps_strings operations. */
1696
1697 static int
get_ps_strings(struct thread * td,struct proc * p,struct sbuf * sb,enum proc_vector_type type)1698 get_ps_strings(struct thread *td, struct proc *p, struct sbuf *sb,
1699 enum proc_vector_type type)
1700 {
1701 size_t done, len, nchr, vsize;
1702 int error, i;
1703 char **proc_vector, *sptr;
1704 char pss_string[GET_PS_STRINGS_CHUNK_SZ];
1705
1706 PROC_ASSERT_HELD(p);
1707
1708 /*
1709 * We are not going to read more than 2 * (PATH_MAX + ARG_MAX) bytes.
1710 */
1711 nchr = 2 * (PATH_MAX + ARG_MAX);
1712
1713 error = get_proc_vector(td, p, &proc_vector, &vsize, type);
1714 if (error != 0)
1715 return (error);
1716 for (done = 0, i = 0; i < (int)vsize && done < nchr; i++) {
1717 /*
1718 * The program may have scribbled into its argv array, e.g. to
1719 * remove some arguments. If that has happened, break out
1720 * before trying to read from NULL.
1721 */
1722 if (proc_vector[i] == NULL)
1723 break;
1724 for (sptr = proc_vector[i]; ; sptr += GET_PS_STRINGS_CHUNK_SZ) {
1725 error = proc_read_string(td, p, sptr, pss_string,
1726 sizeof(pss_string));
1727 if (error != 0)
1728 goto done;
1729 len = strnlen(pss_string, GET_PS_STRINGS_CHUNK_SZ);
1730 if (done + len >= nchr)
1731 len = nchr - done - 1;
1732 sbuf_bcat(sb, pss_string, len);
1733 if (len != GET_PS_STRINGS_CHUNK_SZ)
1734 break;
1735 done += GET_PS_STRINGS_CHUNK_SZ;
1736 }
1737 sbuf_bcat(sb, "", 1);
1738 done += len + 1;
1739 }
1740 done:
1741 free(proc_vector, M_TEMP);
1742 return (error);
1743 }
1744
1745 int
proc_getargv(struct thread * td,struct proc * p,struct sbuf * sb)1746 proc_getargv(struct thread *td, struct proc *p, struct sbuf *sb)
1747 {
1748
1749 return (get_ps_strings(curthread, p, sb, PROC_ARG));
1750 }
1751
1752 int
proc_getenvv(struct thread * td,struct proc * p,struct sbuf * sb)1753 proc_getenvv(struct thread *td, struct proc *p, struct sbuf *sb)
1754 {
1755
1756 return (get_ps_strings(curthread, p, sb, PROC_ENV));
1757 }
1758
1759 int
proc_getauxv(struct thread * td,struct proc * p,struct sbuf * sb)1760 proc_getauxv(struct thread *td, struct proc *p, struct sbuf *sb)
1761 {
1762 size_t vsize, size;
1763 char **auxv;
1764 int error;
1765
1766 error = get_proc_vector(td, p, &auxv, &vsize, PROC_AUX);
1767 if (error == 0) {
1768 #ifdef COMPAT_FREEBSD32
1769 if (SV_PROC_FLAG(p, SV_ILP32) != 0)
1770 size = vsize * sizeof(Elf32_Auxinfo);
1771 else
1772 #endif
1773 size = vsize * sizeof(Elf_Auxinfo);
1774 if (sbuf_bcat(sb, auxv, size) != 0)
1775 error = ENOMEM;
1776 free(auxv, M_TEMP);
1777 }
1778 return (error);
1779 }
1780
1781 /*
1782 * This sysctl allows a process to retrieve the argument list or process
1783 * title for another process without groping around in the address space
1784 * of the other process. It also allow a process to set its own "process
1785 * title to a string of its own choice.
1786 */
1787 static int
sysctl_kern_proc_args(SYSCTL_HANDLER_ARGS)1788 sysctl_kern_proc_args(SYSCTL_HANDLER_ARGS)
1789 {
1790 int *name = (int *)arg1;
1791 u_int namelen = arg2;
1792 struct pargs *newpa, *pa;
1793 struct proc *p;
1794 struct sbuf sb;
1795 int flags, error = 0, error2;
1796
1797 if (namelen != 1)
1798 return (EINVAL);
1799
1800 flags = PGET_CANSEE;
1801 if (req->newptr != NULL)
1802 flags |= PGET_ISCURRENT;
1803 error = pget((pid_t)name[0], flags, &p);
1804 if (error)
1805 return (error);
1806
1807 pa = p->p_args;
1808 if (pa != NULL) {
1809 pargs_hold(pa);
1810 PROC_UNLOCK(p);
1811 error = SYSCTL_OUT(req, pa->ar_args, pa->ar_length);
1812 pargs_drop(pa);
1813 } else if ((p->p_flag & (P_WEXIT | P_SYSTEM)) == 0) {
1814 _PHOLD(p);
1815 PROC_UNLOCK(p);
1816 sbuf_new_for_sysctl(&sb, NULL, GET_PS_STRINGS_CHUNK_SZ, req);
1817 error = proc_getargv(curthread, p, &sb);
1818 error2 = sbuf_finish(&sb);
1819 PRELE(p);
1820 sbuf_delete(&sb);
1821 if (error == 0 && error2 != 0)
1822 error = error2;
1823 } else {
1824 PROC_UNLOCK(p);
1825 }
1826 if (error != 0 || req->newptr == NULL)
1827 return (error);
1828
1829 if (req->newlen + sizeof(struct pargs) > ps_arg_cache_limit)
1830 return (ENOMEM);
1831 newpa = pargs_alloc(req->newlen);
1832 error = SYSCTL_IN(req, newpa->ar_args, req->newlen);
1833 if (error != 0) {
1834 pargs_free(newpa);
1835 return (error);
1836 }
1837 PROC_LOCK(p);
1838 pa = p->p_args;
1839 p->p_args = newpa;
1840 PROC_UNLOCK(p);
1841 pargs_drop(pa);
1842 return (0);
1843 }
1844
1845 /*
1846 * This sysctl allows a process to retrieve environment of another process.
1847 */
1848 static int
sysctl_kern_proc_env(SYSCTL_HANDLER_ARGS)1849 sysctl_kern_proc_env(SYSCTL_HANDLER_ARGS)
1850 {
1851 int *name = (int *)arg1;
1852 u_int namelen = arg2;
1853 struct proc *p;
1854 struct sbuf sb;
1855 int error, error2;
1856
1857 if (namelen != 1)
1858 return (EINVAL);
1859
1860 error = pget((pid_t)name[0], PGET_WANTREAD, &p);
1861 if (error != 0)
1862 return (error);
1863 if ((p->p_flag & P_SYSTEM) != 0) {
1864 PRELE(p);
1865 return (0);
1866 }
1867
1868 sbuf_new_for_sysctl(&sb, NULL, GET_PS_STRINGS_CHUNK_SZ, req);
1869 error = proc_getenvv(curthread, p, &sb);
1870 error2 = sbuf_finish(&sb);
1871 PRELE(p);
1872 sbuf_delete(&sb);
1873 return (error != 0 ? error : error2);
1874 }
1875
1876 /*
1877 * This sysctl allows a process to retrieve ELF auxiliary vector of
1878 * another process.
1879 */
1880 static int
sysctl_kern_proc_auxv(SYSCTL_HANDLER_ARGS)1881 sysctl_kern_proc_auxv(SYSCTL_HANDLER_ARGS)
1882 {
1883 int *name = (int *)arg1;
1884 u_int namelen = arg2;
1885 struct proc *p;
1886 struct sbuf sb;
1887 int error, error2;
1888
1889 if (namelen != 1)
1890 return (EINVAL);
1891
1892 error = pget((pid_t)name[0], PGET_WANTREAD, &p);
1893 if (error != 0)
1894 return (error);
1895 if ((p->p_flag & P_SYSTEM) != 0) {
1896 PRELE(p);
1897 return (0);
1898 }
1899 sbuf_new_for_sysctl(&sb, NULL, GET_PS_STRINGS_CHUNK_SZ, req);
1900 error = proc_getauxv(curthread, p, &sb);
1901 error2 = sbuf_finish(&sb);
1902 PRELE(p);
1903 sbuf_delete(&sb);
1904 return (error != 0 ? error : error2);
1905 }
1906
1907 /*
1908 * This sysctl allows a process to retrieve the path of the executable for
1909 * itself or another process.
1910 */
1911 static int
sysctl_kern_proc_pathname(SYSCTL_HANDLER_ARGS)1912 sysctl_kern_proc_pathname(SYSCTL_HANDLER_ARGS)
1913 {
1914 pid_t *pidp = (pid_t *)arg1;
1915 unsigned int arglen = arg2;
1916 struct proc *p;
1917 struct vnode *vp;
1918 char *retbuf, *freebuf;
1919 int error;
1920
1921 if (arglen != 1)
1922 return (EINVAL);
1923 if (*pidp == -1) { /* -1 means this process */
1924 p = req->td->td_proc;
1925 } else {
1926 error = pget(*pidp, PGET_CANSEE, &p);
1927 if (error != 0)
1928 return (error);
1929 }
1930
1931 vp = p->p_textvp;
1932 if (vp == NULL) {
1933 if (*pidp != -1)
1934 PROC_UNLOCK(p);
1935 return (0);
1936 }
1937 vref(vp);
1938 if (*pidp != -1)
1939 PROC_UNLOCK(p);
1940 error = vn_fullpath(req->td, vp, &retbuf, &freebuf);
1941 vrele(vp);
1942 if (error)
1943 return (error);
1944 error = SYSCTL_OUT(req, retbuf, strlen(retbuf) + 1);
1945 free(freebuf, M_TEMP);
1946 return (error);
1947 }
1948
1949 static int
sysctl_kern_proc_sv_name(SYSCTL_HANDLER_ARGS)1950 sysctl_kern_proc_sv_name(SYSCTL_HANDLER_ARGS)
1951 {
1952 struct proc *p;
1953 char *sv_name;
1954 int *name;
1955 int namelen;
1956 int error;
1957
1958 namelen = arg2;
1959 if (namelen != 1)
1960 return (EINVAL);
1961
1962 name = (int *)arg1;
1963 error = pget((pid_t)name[0], PGET_CANSEE, &p);
1964 if (error != 0)
1965 return (error);
1966 sv_name = p->p_sysent->sv_name;
1967 PROC_UNLOCK(p);
1968 return (sysctl_handle_string(oidp, sv_name, 0, req));
1969 }
1970
1971 #ifdef KINFO_OVMENTRY_SIZE
1972 CTASSERT(sizeof(struct kinfo_ovmentry) == KINFO_OVMENTRY_SIZE);
1973 #endif
1974
1975 #ifdef COMPAT_FREEBSD7
1976 static int
sysctl_kern_proc_ovmmap(SYSCTL_HANDLER_ARGS)1977 sysctl_kern_proc_ovmmap(SYSCTL_HANDLER_ARGS)
1978 {
1979 vm_map_entry_t entry, tmp_entry;
1980 unsigned int last_timestamp;
1981 char *fullpath, *freepath;
1982 struct kinfo_ovmentry *kve;
1983 struct vattr va;
1984 struct ucred *cred;
1985 int error, *name;
1986 struct vnode *vp;
1987 struct proc *p;
1988 vm_map_t map;
1989 struct vmspace *vm;
1990
1991 name = (int *)arg1;
1992 error = pget((pid_t)name[0], PGET_WANTREAD, &p);
1993 if (error != 0)
1994 return (error);
1995 vm = vmspace_acquire_ref(p);
1996 if (vm == NULL) {
1997 PRELE(p);
1998 return (ESRCH);
1999 }
2000 kve = malloc(sizeof(*kve), M_TEMP, M_WAITOK);
2001
2002 map = &vm->vm_map;
2003 vm_map_lock_read(map);
2004 for (entry = map->header.next; entry != &map->header;
2005 entry = entry->next) {
2006 vm_object_t obj, tobj, lobj;
2007 vm_offset_t addr;
2008
2009 if (entry->eflags & MAP_ENTRY_IS_SUB_MAP)
2010 continue;
2011
2012 bzero(kve, sizeof(*kve));
2013 kve->kve_structsize = sizeof(*kve);
2014
2015 kve->kve_private_resident = 0;
2016 obj = entry->object.vm_object;
2017 if (obj != NULL) {
2018 VM_OBJECT_RLOCK(obj);
2019 if (obj->shadow_count == 1)
2020 kve->kve_private_resident =
2021 obj->resident_page_count;
2022 }
2023 kve->kve_resident = 0;
2024 addr = entry->start;
2025 while (addr < entry->end) {
2026 if (pmap_extract(map->pmap, addr))
2027 kve->kve_resident++;
2028 addr += PAGE_SIZE;
2029 }
2030
2031 for (lobj = tobj = obj; tobj; tobj = tobj->backing_object) {
2032 if (tobj != obj)
2033 VM_OBJECT_RLOCK(tobj);
2034 if (lobj != obj)
2035 VM_OBJECT_RUNLOCK(lobj);
2036 lobj = tobj;
2037 }
2038
2039 kve->kve_start = (void*)entry->start;
2040 kve->kve_end = (void*)entry->end;
2041 kve->kve_offset = (off_t)entry->offset;
2042
2043 if (entry->protection & VM_PROT_READ)
2044 kve->kve_protection |= KVME_PROT_READ;
2045 if (entry->protection & VM_PROT_WRITE)
2046 kve->kve_protection |= KVME_PROT_WRITE;
2047 if (entry->protection & VM_PROT_EXECUTE)
2048 kve->kve_protection |= KVME_PROT_EXEC;
2049
2050 if (entry->eflags & MAP_ENTRY_COW)
2051 kve->kve_flags |= KVME_FLAG_COW;
2052 if (entry->eflags & MAP_ENTRY_NEEDS_COPY)
2053 kve->kve_flags |= KVME_FLAG_NEEDS_COPY;
2054 if (entry->eflags & MAP_ENTRY_NOCOREDUMP)
2055 kve->kve_flags |= KVME_FLAG_NOCOREDUMP;
2056
2057 last_timestamp = map->timestamp;
2058 vm_map_unlock_read(map);
2059
2060 kve->kve_fileid = 0;
2061 kve->kve_fsid = 0;
2062 freepath = NULL;
2063 fullpath = "";
2064 if (lobj) {
2065 vp = NULL;
2066 switch (lobj->type) {
2067 case OBJT_DEFAULT:
2068 kve->kve_type = KVME_TYPE_DEFAULT;
2069 break;
2070 case OBJT_VNODE:
2071 kve->kve_type = KVME_TYPE_VNODE;
2072 vp = lobj->handle;
2073 vref(vp);
2074 break;
2075 case OBJT_SWAP:
2076 kve->kve_type = KVME_TYPE_SWAP;
2077 break;
2078 case OBJT_DEVICE:
2079 kve->kve_type = KVME_TYPE_DEVICE;
2080 break;
2081 case OBJT_PHYS:
2082 kve->kve_type = KVME_TYPE_PHYS;
2083 break;
2084 case OBJT_DEAD:
2085 kve->kve_type = KVME_TYPE_DEAD;
2086 break;
2087 case OBJT_SG:
2088 kve->kve_type = KVME_TYPE_SG;
2089 break;
2090 default:
2091 kve->kve_type = KVME_TYPE_UNKNOWN;
2092 break;
2093 }
2094 if (lobj != obj)
2095 VM_OBJECT_RUNLOCK(lobj);
2096
2097 kve->kve_ref_count = obj->ref_count;
2098 kve->kve_shadow_count = obj->shadow_count;
2099 VM_OBJECT_RUNLOCK(obj);
2100 if (vp != NULL) {
2101 vn_fullpath(curthread, vp, &fullpath,
2102 &freepath);
2103 cred = curthread->td_ucred;
2104 vn_lock(vp, LK_SHARED | LK_RETRY);
2105 if (VOP_GETATTR(vp, &va, cred) == 0) {
2106 kve->kve_fileid = va.va_fileid;
2107 kve->kve_fsid = va.va_fsid;
2108 }
2109 vput(vp);
2110 }
2111 } else {
2112 kve->kve_type = KVME_TYPE_NONE;
2113 kve->kve_ref_count = 0;
2114 kve->kve_shadow_count = 0;
2115 }
2116
2117 strlcpy(kve->kve_path, fullpath, sizeof(kve->kve_path));
2118 if (freepath != NULL)
2119 free(freepath, M_TEMP);
2120
2121 error = SYSCTL_OUT(req, kve, sizeof(*kve));
2122 vm_map_lock_read(map);
2123 if (error)
2124 break;
2125 if (last_timestamp != map->timestamp) {
2126 vm_map_lookup_entry(map, addr - 1, &tmp_entry);
2127 entry = tmp_entry;
2128 }
2129 }
2130 vm_map_unlock_read(map);
2131 vmspace_free(vm);
2132 PRELE(p);
2133 free(kve, M_TEMP);
2134 return (error);
2135 }
2136 #endif /* COMPAT_FREEBSD7 */
2137
2138 #ifdef KINFO_VMENTRY_SIZE
2139 CTASSERT(sizeof(struct kinfo_vmentry) == KINFO_VMENTRY_SIZE);
2140 #endif
2141
2142 static void
kern_proc_vmmap_resident(vm_map_t map,vm_map_entry_t entry,struct kinfo_vmentry * kve)2143 kern_proc_vmmap_resident(vm_map_t map, vm_map_entry_t entry,
2144 struct kinfo_vmentry *kve)
2145 {
2146 vm_object_t obj, tobj;
2147 vm_page_t m, m_adv;
2148 vm_offset_t addr;
2149 vm_paddr_t locked_pa;
2150 vm_pindex_t pi, pi_adv, pindex;
2151
2152 locked_pa = 0;
2153 obj = entry->object.vm_object;
2154 addr = entry->start;
2155 m_adv = NULL;
2156 pi = OFF_TO_IDX(entry->offset);
2157 for (; addr < entry->end; addr += IDX_TO_OFF(pi_adv), pi += pi_adv) {
2158 if (m_adv != NULL) {
2159 m = m_adv;
2160 } else {
2161 pi_adv = OFF_TO_IDX(entry->end - addr);
2162 pindex = pi;
2163 for (tobj = obj;; tobj = tobj->backing_object) {
2164 m = vm_page_find_least(tobj, pindex);
2165 if (m != NULL) {
2166 if (m->pindex == pindex)
2167 break;
2168 if (pi_adv > m->pindex - pindex) {
2169 pi_adv = m->pindex - pindex;
2170 m_adv = m;
2171 }
2172 }
2173 if (tobj->backing_object == NULL)
2174 goto next;
2175 pindex += OFF_TO_IDX(tobj->
2176 backing_object_offset);
2177 }
2178 }
2179 m_adv = NULL;
2180 if (m->psind != 0 && addr + pagesizes[1] <= entry->end &&
2181 (addr & (pagesizes[1] - 1)) == 0 &&
2182 (pmap_mincore(map->pmap, addr, &locked_pa) &
2183 MINCORE_SUPER) != 0) {
2184 kve->kve_flags |= KVME_FLAG_SUPER;
2185 pi_adv = OFF_TO_IDX(pagesizes[1]);
2186 } else {
2187 /*
2188 * We do not test the found page on validity.
2189 * Either the page is busy and being paged in,
2190 * or it was invalidated. The first case
2191 * should be counted as resident, the second
2192 * is not so clear; we do account both.
2193 */
2194 pi_adv = 1;
2195 }
2196 kve->kve_resident += pi_adv;
2197 next:;
2198 }
2199 PA_UNLOCK_COND(locked_pa);
2200 }
2201
2202 /*
2203 * Must be called with the process locked and will return unlocked.
2204 */
2205 int
kern_proc_vmmap_out(struct proc * p,struct sbuf * sb)2206 kern_proc_vmmap_out(struct proc *p, struct sbuf *sb)
2207 {
2208 vm_map_entry_t entry, tmp_entry;
2209 struct vattr va;
2210 vm_map_t map;
2211 vm_object_t obj, tobj, lobj;
2212 char *fullpath, *freepath;
2213 struct kinfo_vmentry *kve;
2214 struct ucred *cred;
2215 struct vnode *vp;
2216 struct vmspace *vm;
2217 vm_offset_t addr;
2218 unsigned int last_timestamp;
2219 int error;
2220
2221 PROC_LOCK_ASSERT(p, MA_OWNED);
2222
2223 _PHOLD(p);
2224 PROC_UNLOCK(p);
2225 vm = vmspace_acquire_ref(p);
2226 if (vm == NULL) {
2227 PRELE(p);
2228 return (ESRCH);
2229 }
2230 kve = malloc(sizeof(*kve), M_TEMP, M_WAITOK);
2231
2232 error = 0;
2233 map = &vm->vm_map;
2234 vm_map_lock_read(map);
2235 for (entry = map->header.next; entry != &map->header;
2236 entry = entry->next) {
2237 if (entry->eflags & MAP_ENTRY_IS_SUB_MAP)
2238 continue;
2239
2240 addr = entry->end;
2241 bzero(kve, sizeof(*kve));
2242 obj = entry->object.vm_object;
2243 if (obj != NULL) {
2244 for (tobj = obj; tobj != NULL;
2245 tobj = tobj->backing_object) {
2246 VM_OBJECT_RLOCK(tobj);
2247 lobj = tobj;
2248 }
2249 if (obj->backing_object == NULL)
2250 kve->kve_private_resident =
2251 obj->resident_page_count;
2252 if (!vmmap_skip_res_cnt)
2253 kern_proc_vmmap_resident(map, entry, kve);
2254 for (tobj = obj; tobj != NULL;
2255 tobj = tobj->backing_object) {
2256 if (tobj != obj && tobj != lobj)
2257 VM_OBJECT_RUNLOCK(tobj);
2258 }
2259 } else {
2260 lobj = NULL;
2261 }
2262
2263 kve->kve_start = entry->start;
2264 kve->kve_end = entry->end;
2265 kve->kve_offset = entry->offset;
2266
2267 if (entry->protection & VM_PROT_READ)
2268 kve->kve_protection |= KVME_PROT_READ;
2269 if (entry->protection & VM_PROT_WRITE)
2270 kve->kve_protection |= KVME_PROT_WRITE;
2271 if (entry->protection & VM_PROT_EXECUTE)
2272 kve->kve_protection |= KVME_PROT_EXEC;
2273
2274 if (entry->eflags & MAP_ENTRY_COW)
2275 kve->kve_flags |= KVME_FLAG_COW;
2276 if (entry->eflags & MAP_ENTRY_NEEDS_COPY)
2277 kve->kve_flags |= KVME_FLAG_NEEDS_COPY;
2278 if (entry->eflags & MAP_ENTRY_NOCOREDUMP)
2279 kve->kve_flags |= KVME_FLAG_NOCOREDUMP;
2280 if (entry->eflags & MAP_ENTRY_GROWS_UP)
2281 kve->kve_flags |= KVME_FLAG_GROWS_UP;
2282 if (entry->eflags & MAP_ENTRY_GROWS_DOWN)
2283 kve->kve_flags |= KVME_FLAG_GROWS_DOWN;
2284
2285 last_timestamp = map->timestamp;
2286 vm_map_unlock_read(map);
2287
2288 freepath = NULL;
2289 fullpath = "";
2290 if (lobj != NULL) {
2291 vp = NULL;
2292 switch (lobj->type) {
2293 case OBJT_DEFAULT:
2294 kve->kve_type = KVME_TYPE_DEFAULT;
2295 break;
2296 case OBJT_VNODE:
2297 kve->kve_type = KVME_TYPE_VNODE;
2298 vp = lobj->handle;
2299 vref(vp);
2300 break;
2301 case OBJT_SWAP:
2302 kve->kve_type = KVME_TYPE_SWAP;
2303 break;
2304 case OBJT_DEVICE:
2305 kve->kve_type = KVME_TYPE_DEVICE;
2306 break;
2307 case OBJT_PHYS:
2308 kve->kve_type = KVME_TYPE_PHYS;
2309 break;
2310 case OBJT_DEAD:
2311 kve->kve_type = KVME_TYPE_DEAD;
2312 break;
2313 case OBJT_SG:
2314 kve->kve_type = KVME_TYPE_SG;
2315 break;
2316 case OBJT_MGTDEVICE:
2317 kve->kve_type = KVME_TYPE_MGTDEVICE;
2318 break;
2319 default:
2320 kve->kve_type = KVME_TYPE_UNKNOWN;
2321 break;
2322 }
2323 if (lobj != obj)
2324 VM_OBJECT_RUNLOCK(lobj);
2325
2326 kve->kve_ref_count = obj->ref_count;
2327 kve->kve_shadow_count = obj->shadow_count;
2328 VM_OBJECT_RUNLOCK(obj);
2329 if (vp != NULL) {
2330 vn_fullpath(curthread, vp, &fullpath,
2331 &freepath);
2332 kve->kve_vn_type = vntype_to_kinfo(vp->v_type);
2333 cred = curthread->td_ucred;
2334 vn_lock(vp, LK_SHARED | LK_RETRY);
2335 if (VOP_GETATTR(vp, &va, cred) == 0) {
2336 kve->kve_vn_fileid = va.va_fileid;
2337 kve->kve_vn_fsid = va.va_fsid;
2338 kve->kve_vn_mode =
2339 MAKEIMODE(va.va_type, va.va_mode);
2340 kve->kve_vn_size = va.va_size;
2341 kve->kve_vn_rdev = va.va_rdev;
2342 kve->kve_status = KF_ATTR_VALID;
2343 }
2344 vput(vp);
2345 }
2346 } else {
2347 kve->kve_type = KVME_TYPE_NONE;
2348 kve->kve_ref_count = 0;
2349 kve->kve_shadow_count = 0;
2350 }
2351
2352 strlcpy(kve->kve_path, fullpath, sizeof(kve->kve_path));
2353 if (freepath != NULL)
2354 free(freepath, M_TEMP);
2355
2356 /* Pack record size down */
2357 kve->kve_structsize = offsetof(struct kinfo_vmentry, kve_path) +
2358 strlen(kve->kve_path) + 1;
2359 kve->kve_structsize = roundup(kve->kve_structsize,
2360 sizeof(uint64_t));
2361 if (sbuf_bcat(sb, kve, kve->kve_structsize) != 0)
2362 error = ENOMEM;
2363 vm_map_lock_read(map);
2364 if (error != 0)
2365 break;
2366 if (last_timestamp != map->timestamp) {
2367 vm_map_lookup_entry(map, addr - 1, &tmp_entry);
2368 entry = tmp_entry;
2369 }
2370 }
2371 vm_map_unlock_read(map);
2372 vmspace_free(vm);
2373 PRELE(p);
2374 free(kve, M_TEMP);
2375 return (error);
2376 }
2377
2378 static int
sysctl_kern_proc_vmmap(SYSCTL_HANDLER_ARGS)2379 sysctl_kern_proc_vmmap(SYSCTL_HANDLER_ARGS)
2380 {
2381 struct proc *p;
2382 struct sbuf sb;
2383 int error, error2, *name;
2384
2385 name = (int *)arg1;
2386 sbuf_new_for_sysctl(&sb, NULL, sizeof(struct kinfo_vmentry), req);
2387 error = pget((pid_t)name[0], PGET_CANDEBUG | PGET_NOTWEXIT, &p);
2388 if (error != 0) {
2389 sbuf_delete(&sb);
2390 return (error);
2391 }
2392 error = kern_proc_vmmap_out(p, &sb);
2393 error2 = sbuf_finish(&sb);
2394 sbuf_delete(&sb);
2395 return (error != 0 ? error : error2);
2396 }
2397
2398 #if defined(STACK) || defined(DDB)
2399 static int
sysctl_kern_proc_kstack(SYSCTL_HANDLER_ARGS)2400 sysctl_kern_proc_kstack(SYSCTL_HANDLER_ARGS)
2401 {
2402 struct kinfo_kstack *kkstp;
2403 int error, i, *name, numthreads;
2404 lwpid_t *lwpidarray;
2405 struct thread *td;
2406 struct stack *st;
2407 struct sbuf sb;
2408 struct proc *p;
2409
2410 name = (int *)arg1;
2411 error = pget((pid_t)name[0], PGET_NOTINEXEC | PGET_WANTREAD, &p);
2412 if (error != 0)
2413 return (error);
2414
2415 kkstp = malloc(sizeof(*kkstp), M_TEMP, M_WAITOK);
2416 st = stack_create();
2417
2418 lwpidarray = NULL;
2419 numthreads = 0;
2420 PROC_LOCK(p);
2421 repeat:
2422 if (numthreads < p->p_numthreads) {
2423 if (lwpidarray != NULL) {
2424 free(lwpidarray, M_TEMP);
2425 lwpidarray = NULL;
2426 }
2427 numthreads = p->p_numthreads;
2428 PROC_UNLOCK(p);
2429 lwpidarray = malloc(sizeof(*lwpidarray) * numthreads, M_TEMP,
2430 M_WAITOK | M_ZERO);
2431 PROC_LOCK(p);
2432 goto repeat;
2433 }
2434 i = 0;
2435
2436 /*
2437 * XXXRW: During the below loop, execve(2) and countless other sorts
2438 * of changes could have taken place. Should we check to see if the
2439 * vmspace has been replaced, or the like, in order to prevent
2440 * giving a snapshot that spans, say, execve(2), with some threads
2441 * before and some after? Among other things, the credentials could
2442 * have changed, in which case the right to extract debug info might
2443 * no longer be assured.
2444 */
2445 FOREACH_THREAD_IN_PROC(p, td) {
2446 KASSERT(i < numthreads,
2447 ("sysctl_kern_proc_kstack: numthreads"));
2448 lwpidarray[i] = td->td_tid;
2449 i++;
2450 }
2451 numthreads = i;
2452 for (i = 0; i < numthreads; i++) {
2453 td = thread_find(p, lwpidarray[i]);
2454 if (td == NULL) {
2455 continue;
2456 }
2457 bzero(kkstp, sizeof(*kkstp));
2458 (void)sbuf_new(&sb, kkstp->kkst_trace,
2459 sizeof(kkstp->kkst_trace), SBUF_FIXEDLEN);
2460 thread_lock(td);
2461 kkstp->kkst_tid = td->td_tid;
2462 if (TD_IS_SWAPPED(td))
2463 kkstp->kkst_state = KKST_STATE_SWAPPED;
2464 else if (TD_IS_RUNNING(td))
2465 kkstp->kkst_state = KKST_STATE_RUNNING;
2466 else {
2467 kkstp->kkst_state = KKST_STATE_STACKOK;
2468 stack_save_td(st, td);
2469 }
2470 thread_unlock(td);
2471 PROC_UNLOCK(p);
2472 stack_sbuf_print(&sb, st);
2473 sbuf_finish(&sb);
2474 sbuf_delete(&sb);
2475 error = SYSCTL_OUT(req, kkstp, sizeof(*kkstp));
2476 PROC_LOCK(p);
2477 if (error)
2478 break;
2479 }
2480 _PRELE(p);
2481 PROC_UNLOCK(p);
2482 if (lwpidarray != NULL)
2483 free(lwpidarray, M_TEMP);
2484 stack_destroy(st);
2485 free(kkstp, M_TEMP);
2486 return (error);
2487 }
2488 #endif
2489
2490 /*
2491 * This sysctl allows a process to retrieve the full list of groups from
2492 * itself or another process.
2493 */
2494 static int
sysctl_kern_proc_groups(SYSCTL_HANDLER_ARGS)2495 sysctl_kern_proc_groups(SYSCTL_HANDLER_ARGS)
2496 {
2497 pid_t *pidp = (pid_t *)arg1;
2498 unsigned int arglen = arg2;
2499 struct proc *p;
2500 struct ucred *cred;
2501 int error;
2502
2503 if (arglen != 1)
2504 return (EINVAL);
2505 if (*pidp == -1) { /* -1 means this process */
2506 p = req->td->td_proc;
2507 } else {
2508 error = pget(*pidp, PGET_CANSEE, &p);
2509 if (error != 0)
2510 return (error);
2511 }
2512
2513 cred = crhold(p->p_ucred);
2514 if (*pidp != -1)
2515 PROC_UNLOCK(p);
2516
2517 error = SYSCTL_OUT(req, cred->cr_groups,
2518 cred->cr_ngroups * sizeof(gid_t));
2519 crfree(cred);
2520 return (error);
2521 }
2522
2523 /*
2524 * This sysctl allows a process to retrieve or/and set the resource limit for
2525 * another process.
2526 */
2527 static int
sysctl_kern_proc_rlimit(SYSCTL_HANDLER_ARGS)2528 sysctl_kern_proc_rlimit(SYSCTL_HANDLER_ARGS)
2529 {
2530 int *name = (int *)arg1;
2531 u_int namelen = arg2;
2532 struct rlimit rlim;
2533 struct proc *p;
2534 u_int which;
2535 int flags, error;
2536
2537 if (namelen != 2)
2538 return (EINVAL);
2539
2540 which = (u_int)name[1];
2541 if (which >= RLIM_NLIMITS)
2542 return (EINVAL);
2543
2544 if (req->newptr != NULL && req->newlen != sizeof(rlim))
2545 return (EINVAL);
2546
2547 flags = PGET_HOLD | PGET_NOTWEXIT;
2548 if (req->newptr != NULL)
2549 flags |= PGET_CANDEBUG;
2550 else
2551 flags |= PGET_CANSEE;
2552 error = pget((pid_t)name[0], flags, &p);
2553 if (error != 0)
2554 return (error);
2555
2556 /*
2557 * Retrieve limit.
2558 */
2559 if (req->oldptr != NULL) {
2560 PROC_LOCK(p);
2561 lim_rlimit(p, which, &rlim);
2562 PROC_UNLOCK(p);
2563 }
2564 error = SYSCTL_OUT(req, &rlim, sizeof(rlim));
2565 if (error != 0)
2566 goto errout;
2567
2568 /*
2569 * Set limit.
2570 */
2571 if (req->newptr != NULL) {
2572 error = SYSCTL_IN(req, &rlim, sizeof(rlim));
2573 if (error == 0)
2574 error = kern_proc_setrlimit(curthread, p, which, &rlim);
2575 }
2576
2577 errout:
2578 PRELE(p);
2579 return (error);
2580 }
2581
2582 /*
2583 * This sysctl allows a process to retrieve ps_strings structure location of
2584 * another process.
2585 */
2586 static int
sysctl_kern_proc_ps_strings(SYSCTL_HANDLER_ARGS)2587 sysctl_kern_proc_ps_strings(SYSCTL_HANDLER_ARGS)
2588 {
2589 int *name = (int *)arg1;
2590 u_int namelen = arg2;
2591 struct proc *p;
2592 vm_offset_t ps_strings;
2593 int error;
2594 #ifdef COMPAT_FREEBSD32
2595 uint32_t ps_strings32;
2596 #endif
2597
2598 if (namelen != 1)
2599 return (EINVAL);
2600
2601 error = pget((pid_t)name[0], PGET_CANDEBUG, &p);
2602 if (error != 0)
2603 return (error);
2604 #ifdef COMPAT_FREEBSD32
2605 if ((req->flags & SCTL_MASK32) != 0) {
2606 /*
2607 * We return 0 if the 32 bit emulation request is for a 64 bit
2608 * process.
2609 */
2610 ps_strings32 = SV_PROC_FLAG(p, SV_ILP32) != 0 ?
2611 PTROUT(p->p_sysent->sv_psstrings) : 0;
2612 PROC_UNLOCK(p);
2613 error = SYSCTL_OUT(req, &ps_strings32, sizeof(ps_strings32));
2614 return (error);
2615 }
2616 #endif
2617 ps_strings = p->p_sysent->sv_psstrings;
2618 PROC_UNLOCK(p);
2619 error = SYSCTL_OUT(req, &ps_strings, sizeof(ps_strings));
2620 return (error);
2621 }
2622
2623 /*
2624 * This sysctl allows a process to retrieve umask of another process.
2625 */
2626 static int
sysctl_kern_proc_umask(SYSCTL_HANDLER_ARGS)2627 sysctl_kern_proc_umask(SYSCTL_HANDLER_ARGS)
2628 {
2629 int *name = (int *)arg1;
2630 u_int namelen = arg2;
2631 struct proc *p;
2632 int error;
2633 u_short fd_cmask;
2634
2635 if (namelen != 1)
2636 return (EINVAL);
2637
2638 error = pget((pid_t)name[0], PGET_WANTREAD, &p);
2639 if (error != 0)
2640 return (error);
2641
2642 FILEDESC_SLOCK(p->p_fd);
2643 fd_cmask = p->p_fd->fd_cmask;
2644 FILEDESC_SUNLOCK(p->p_fd);
2645 PRELE(p);
2646 error = SYSCTL_OUT(req, &fd_cmask, sizeof(fd_cmask));
2647 return (error);
2648 }
2649
2650 /*
2651 * This sysctl allows a process to set and retrieve binary osreldate of
2652 * another process.
2653 */
2654 static int
sysctl_kern_proc_osrel(SYSCTL_HANDLER_ARGS)2655 sysctl_kern_proc_osrel(SYSCTL_HANDLER_ARGS)
2656 {
2657 int *name = (int *)arg1;
2658 u_int namelen = arg2;
2659 struct proc *p;
2660 int flags, error, osrel;
2661
2662 if (namelen != 1)
2663 return (EINVAL);
2664
2665 if (req->newptr != NULL && req->newlen != sizeof(osrel))
2666 return (EINVAL);
2667
2668 flags = PGET_HOLD | PGET_NOTWEXIT;
2669 if (req->newptr != NULL)
2670 flags |= PGET_CANDEBUG;
2671 else
2672 flags |= PGET_CANSEE;
2673 error = pget((pid_t)name[0], flags, &p);
2674 if (error != 0)
2675 return (error);
2676
2677 error = SYSCTL_OUT(req, &p->p_osrel, sizeof(p->p_osrel));
2678 if (error != 0)
2679 goto errout;
2680
2681 if (req->newptr != NULL) {
2682 error = SYSCTL_IN(req, &osrel, sizeof(osrel));
2683 if (error != 0)
2684 goto errout;
2685 if (osrel < 0) {
2686 error = EINVAL;
2687 goto errout;
2688 }
2689 p->p_osrel = osrel;
2690 }
2691 errout:
2692 PRELE(p);
2693 return (error);
2694 }
2695
2696 static int
sysctl_kern_proc_sigtramp(SYSCTL_HANDLER_ARGS)2697 sysctl_kern_proc_sigtramp(SYSCTL_HANDLER_ARGS)
2698 {
2699 int *name = (int *)arg1;
2700 u_int namelen = arg2;
2701 struct proc *p;
2702 struct kinfo_sigtramp kst;
2703 const struct sysentvec *sv;
2704 int error;
2705 #ifdef COMPAT_FREEBSD32
2706 struct kinfo_sigtramp32 kst32;
2707 #endif
2708
2709 if (namelen != 1)
2710 return (EINVAL);
2711
2712 error = pget((pid_t)name[0], PGET_CANDEBUG, &p);
2713 if (error != 0)
2714 return (error);
2715 sv = p->p_sysent;
2716 #ifdef COMPAT_FREEBSD32
2717 if ((req->flags & SCTL_MASK32) != 0) {
2718 bzero(&kst32, sizeof(kst32));
2719 if (SV_PROC_FLAG(p, SV_ILP32)) {
2720 if (sv->sv_sigcode_base != 0) {
2721 kst32.ksigtramp_start = sv->sv_sigcode_base;
2722 kst32.ksigtramp_end = sv->sv_sigcode_base +
2723 *sv->sv_szsigcode;
2724 } else {
2725 kst32.ksigtramp_start = sv->sv_psstrings -
2726 *sv->sv_szsigcode;
2727 kst32.ksigtramp_end = sv->sv_psstrings;
2728 }
2729 }
2730 PROC_UNLOCK(p);
2731 error = SYSCTL_OUT(req, &kst32, sizeof(kst32));
2732 return (error);
2733 }
2734 #endif
2735 bzero(&kst, sizeof(kst));
2736 if (sv->sv_sigcode_base != 0) {
2737 kst.ksigtramp_start = (char *)sv->sv_sigcode_base;
2738 kst.ksigtramp_end = (char *)sv->sv_sigcode_base +
2739 *sv->sv_szsigcode;
2740 } else {
2741 kst.ksigtramp_start = (char *)sv->sv_psstrings -
2742 *sv->sv_szsigcode;
2743 kst.ksigtramp_end = (char *)sv->sv_psstrings;
2744 }
2745 PROC_UNLOCK(p);
2746 error = SYSCTL_OUT(req, &kst, sizeof(kst));
2747 return (error);
2748 }
2749
2750 SYSCTL_NODE(_kern, KERN_PROC, proc, CTLFLAG_RD, 0, "Process table");
2751
2752 SYSCTL_PROC(_kern_proc, KERN_PROC_ALL, all, CTLFLAG_RD|CTLTYPE_STRUCT|
2753 CTLFLAG_MPSAFE, 0, 0, sysctl_kern_proc, "S,proc",
2754 "Return entire process table");
2755
2756 static SYSCTL_NODE(_kern_proc, KERN_PROC_GID, gid, CTLFLAG_RD | CTLFLAG_MPSAFE,
2757 sysctl_kern_proc, "Process table");
2758
2759 static SYSCTL_NODE(_kern_proc, KERN_PROC_PGRP, pgrp, CTLFLAG_RD | CTLFLAG_MPSAFE,
2760 sysctl_kern_proc, "Process table");
2761
2762 static SYSCTL_NODE(_kern_proc, KERN_PROC_RGID, rgid, CTLFLAG_RD | CTLFLAG_MPSAFE,
2763 sysctl_kern_proc, "Process table");
2764
2765 static SYSCTL_NODE(_kern_proc, KERN_PROC_SESSION, sid, CTLFLAG_RD |
2766 CTLFLAG_MPSAFE, sysctl_kern_proc, "Process table");
2767
2768 static SYSCTL_NODE(_kern_proc, KERN_PROC_TTY, tty, CTLFLAG_RD | CTLFLAG_MPSAFE,
2769 sysctl_kern_proc, "Process table");
2770
2771 static SYSCTL_NODE(_kern_proc, KERN_PROC_UID, uid, CTLFLAG_RD | CTLFLAG_MPSAFE,
2772 sysctl_kern_proc, "Process table");
2773
2774 static SYSCTL_NODE(_kern_proc, KERN_PROC_RUID, ruid, CTLFLAG_RD | CTLFLAG_MPSAFE,
2775 sysctl_kern_proc, "Process table");
2776
2777 static SYSCTL_NODE(_kern_proc, KERN_PROC_PID, pid, CTLFLAG_RD | CTLFLAG_MPSAFE,
2778 sysctl_kern_proc, "Process table");
2779
2780 static SYSCTL_NODE(_kern_proc, KERN_PROC_PROC, proc, CTLFLAG_RD | CTLFLAG_MPSAFE,
2781 sysctl_kern_proc, "Return process table, no threads");
2782
2783 static SYSCTL_NODE(_kern_proc, KERN_PROC_ARGS, args,
2784 CTLFLAG_RW | CTLFLAG_ANYBODY | CTLFLAG_MPSAFE,
2785 sysctl_kern_proc_args, "Process argument list");
2786
2787 static SYSCTL_NODE(_kern_proc, KERN_PROC_ENV, env, CTLFLAG_RD | CTLFLAG_MPSAFE,
2788 sysctl_kern_proc_env, "Process environment");
2789
2790 static SYSCTL_NODE(_kern_proc, KERN_PROC_AUXV, auxv, CTLFLAG_RD |
2791 CTLFLAG_MPSAFE, sysctl_kern_proc_auxv, "Process ELF auxiliary vector");
2792
2793 static SYSCTL_NODE(_kern_proc, KERN_PROC_PATHNAME, pathname, CTLFLAG_RD |
2794 CTLFLAG_MPSAFE, sysctl_kern_proc_pathname, "Process executable path");
2795
2796 static SYSCTL_NODE(_kern_proc, KERN_PROC_SV_NAME, sv_name, CTLFLAG_RD |
2797 CTLFLAG_MPSAFE, sysctl_kern_proc_sv_name,
2798 "Process syscall vector name (ABI type)");
2799
2800 static SYSCTL_NODE(_kern_proc, (KERN_PROC_GID | KERN_PROC_INC_THREAD), gid_td,
2801 CTLFLAG_RD | CTLFLAG_MPSAFE, sysctl_kern_proc, "Process table");
2802
2803 static SYSCTL_NODE(_kern_proc, (KERN_PROC_PGRP | KERN_PROC_INC_THREAD), pgrp_td,
2804 CTLFLAG_RD | CTLFLAG_MPSAFE, sysctl_kern_proc, "Process table");
2805
2806 static SYSCTL_NODE(_kern_proc, (KERN_PROC_RGID | KERN_PROC_INC_THREAD), rgid_td,
2807 CTLFLAG_RD | CTLFLAG_MPSAFE, sysctl_kern_proc, "Process table");
2808
2809 static SYSCTL_NODE(_kern_proc, (KERN_PROC_SESSION | KERN_PROC_INC_THREAD),
2810 sid_td, CTLFLAG_RD | CTLFLAG_MPSAFE, sysctl_kern_proc, "Process table");
2811
2812 static SYSCTL_NODE(_kern_proc, (KERN_PROC_TTY | KERN_PROC_INC_THREAD), tty_td,
2813 CTLFLAG_RD | CTLFLAG_MPSAFE, sysctl_kern_proc, "Process table");
2814
2815 static SYSCTL_NODE(_kern_proc, (KERN_PROC_UID | KERN_PROC_INC_THREAD), uid_td,
2816 CTLFLAG_RD | CTLFLAG_MPSAFE, sysctl_kern_proc, "Process table");
2817
2818 static SYSCTL_NODE(_kern_proc, (KERN_PROC_RUID | KERN_PROC_INC_THREAD), ruid_td,
2819 CTLFLAG_RD | CTLFLAG_MPSAFE, sysctl_kern_proc, "Process table");
2820
2821 static SYSCTL_NODE(_kern_proc, (KERN_PROC_PID | KERN_PROC_INC_THREAD), pid_td,
2822 CTLFLAG_RD | CTLFLAG_MPSAFE, sysctl_kern_proc, "Process table");
2823
2824 static SYSCTL_NODE(_kern_proc, (KERN_PROC_PROC | KERN_PROC_INC_THREAD), proc_td,
2825 CTLFLAG_RD | CTLFLAG_MPSAFE, sysctl_kern_proc,
2826 "Return process table, no threads");
2827
2828 #ifdef COMPAT_FREEBSD7
2829 static SYSCTL_NODE(_kern_proc, KERN_PROC_OVMMAP, ovmmap, CTLFLAG_RD |
2830 CTLFLAG_MPSAFE, sysctl_kern_proc_ovmmap, "Old Process vm map entries");
2831 #endif
2832
2833 static SYSCTL_NODE(_kern_proc, KERN_PROC_VMMAP, vmmap, CTLFLAG_RD |
2834 CTLFLAG_MPSAFE, sysctl_kern_proc_vmmap, "Process vm map entries");
2835
2836 #if defined(STACK) || defined(DDB)
2837 static SYSCTL_NODE(_kern_proc, KERN_PROC_KSTACK, kstack, CTLFLAG_RD |
2838 CTLFLAG_MPSAFE, sysctl_kern_proc_kstack, "Process kernel stacks");
2839 #endif
2840
2841 static SYSCTL_NODE(_kern_proc, KERN_PROC_GROUPS, groups, CTLFLAG_RD |
2842 CTLFLAG_MPSAFE, sysctl_kern_proc_groups, "Process groups");
2843
2844 static SYSCTL_NODE(_kern_proc, KERN_PROC_RLIMIT, rlimit, CTLFLAG_RW |
2845 CTLFLAG_ANYBODY | CTLFLAG_MPSAFE, sysctl_kern_proc_rlimit,
2846 "Process resource limits");
2847
2848 static SYSCTL_NODE(_kern_proc, KERN_PROC_PS_STRINGS, ps_strings, CTLFLAG_RD |
2849 CTLFLAG_MPSAFE, sysctl_kern_proc_ps_strings,
2850 "Process ps_strings location");
2851
2852 static SYSCTL_NODE(_kern_proc, KERN_PROC_UMASK, umask, CTLFLAG_RD |
2853 CTLFLAG_MPSAFE, sysctl_kern_proc_umask, "Process umask");
2854
2855 static SYSCTL_NODE(_kern_proc, KERN_PROC_OSREL, osrel, CTLFLAG_RW |
2856 CTLFLAG_ANYBODY | CTLFLAG_MPSAFE, sysctl_kern_proc_osrel,
2857 "Process binary osreldate");
2858
2859 static SYSCTL_NODE(_kern_proc, KERN_PROC_SIGTRAMP, sigtramp, CTLFLAG_RD |
2860 CTLFLAG_MPSAFE, sysctl_kern_proc_sigtramp,
2861 "Process signal trampoline location");
2862
2863 int allproc_gen;
2864
2865 void
stop_all_proc(void)2866 stop_all_proc(void)
2867 {
2868 struct proc *cp, *p;
2869 int r, gen;
2870 bool restart, seen_stopped, seen_exiting, stopped_some;
2871
2872 cp = curproc;
2873 /*
2874 * stop_all_proc() assumes that all process which have
2875 * usermode must be stopped, except current process, for
2876 * obvious reasons. Since other threads in the process
2877 * establishing global stop could unstop something, disable
2878 * calls from multithreaded processes as precaution. The
2879 * service must not be user-callable anyway.
2880 */
2881 KASSERT((cp->p_flag & P_HADTHREADS) == 0 ||
2882 (cp->p_flag & P_KTHREAD) != 0, ("mt stop_all_proc"));
2883
2884 allproc_loop:
2885 sx_xlock(&allproc_lock);
2886 gen = allproc_gen;
2887 seen_exiting = seen_stopped = stopped_some = restart = false;
2888 LIST_REMOVE(cp, p_list);
2889 LIST_INSERT_HEAD(&allproc, cp, p_list);
2890 for (;;) {
2891 p = LIST_NEXT(cp, p_list);
2892 if (p == NULL)
2893 break;
2894 LIST_REMOVE(cp, p_list);
2895 LIST_INSERT_AFTER(p, cp, p_list);
2896 PROC_LOCK(p);
2897 if ((p->p_flag & (P_KTHREAD | P_SYSTEM |
2898 P_TOTAL_STOP)) != 0) {
2899 PROC_UNLOCK(p);
2900 continue;
2901 }
2902 if ((p->p_flag & P_WEXIT) != 0) {
2903 seen_exiting = true;
2904 PROC_UNLOCK(p);
2905 continue;
2906 }
2907 if (P_SHOULDSTOP(p) == P_STOPPED_SINGLE) {
2908 /*
2909 * Stopped processes are tolerated when there
2910 * are no other processes which might continue
2911 * them. P_STOPPED_SINGLE but not
2912 * P_TOTAL_STOP process still has at least one
2913 * thread running.
2914 */
2915 seen_stopped = true;
2916 PROC_UNLOCK(p);
2917 continue;
2918 }
2919 _PHOLD(p);
2920 sx_xunlock(&allproc_lock);
2921 r = thread_single(p, SINGLE_ALLPROC);
2922 if (r != 0)
2923 restart = true;
2924 else
2925 stopped_some = true;
2926 _PRELE(p);
2927 PROC_UNLOCK(p);
2928 sx_xlock(&allproc_lock);
2929 }
2930 /* Catch forked children we did not see in iteration. */
2931 if (gen != allproc_gen)
2932 restart = true;
2933 sx_xunlock(&allproc_lock);
2934 if (restart || stopped_some || seen_exiting || seen_stopped) {
2935 kern_yield(PRI_USER);
2936 goto allproc_loop;
2937 }
2938 }
2939
2940 void
resume_all_proc(void)2941 resume_all_proc(void)
2942 {
2943 struct proc *cp, *p;
2944
2945 cp = curproc;
2946 sx_xlock(&allproc_lock);
2947 LIST_REMOVE(cp, p_list);
2948 LIST_INSERT_HEAD(&allproc, cp, p_list);
2949 for (;;) {
2950 p = LIST_NEXT(cp, p_list);
2951 if (p == NULL)
2952 break;
2953 LIST_REMOVE(cp, p_list);
2954 LIST_INSERT_AFTER(p, cp, p_list);
2955 PROC_LOCK(p);
2956 if ((p->p_flag & P_TOTAL_STOP) != 0) {
2957 sx_xunlock(&allproc_lock);
2958 _PHOLD(p);
2959 thread_single_end(p, SINGLE_ALLPROC);
2960 _PRELE(p);
2961 PROC_UNLOCK(p);
2962 sx_xlock(&allproc_lock);
2963 } else {
2964 PROC_UNLOCK(p);
2965 }
2966 }
2967 sx_xunlock(&allproc_lock);
2968 }
2969
2970 #define TOTAL_STOP_DEBUG 1
2971 #ifdef TOTAL_STOP_DEBUG
2972 volatile static int ap_resume;
2973 #include <sys/mount.h>
2974
2975 static int
sysctl_debug_stop_all_proc(SYSCTL_HANDLER_ARGS)2976 sysctl_debug_stop_all_proc(SYSCTL_HANDLER_ARGS)
2977 {
2978 int error, val;
2979
2980 val = 0;
2981 ap_resume = 0;
2982 error = sysctl_handle_int(oidp, &val, 0, req);
2983 if (error != 0 || req->newptr == NULL)
2984 return (error);
2985 if (val != 0) {
2986 stop_all_proc();
2987 syncer_suspend();
2988 while (ap_resume == 0)
2989 ;
2990 syncer_resume();
2991 resume_all_proc();
2992 }
2993 return (0);
2994 }
2995
2996 SYSCTL_PROC(_debug, OID_AUTO, stop_all_proc, CTLTYPE_INT | CTLFLAG_RW |
2997 CTLFLAG_MPSAFE, __DEVOLATILE(int *, &ap_resume), 0,
2998 sysctl_debug_stop_all_proc, "I",
2999 "");
3000 #endif
3001