On 20/10/17(Fri) 11:50, Martin Pieuchot wrote:
> On 14/10/17(Sat) 22:07, Philip Guenther wrote:
> > 
> > The diff below adds proctreelk, an rwlock protecting the links of the 
> > process tree and related bits, as well as uidinfolk, an rwlock protecting 
> > the uidinfo hash table.
> > 
> > Parts of this are based on FreeBSD's proctree_lock, particularly the 
> > reorganization of enterpgrp() into enternewpgrp() and enterthispgrp() and 
> > the splitting out of killjobc() from exit1().
> > 
> > This diff should address the previously reported crashes seen when using 
> > ktrace(2) while creating/exiting processes.
> > 
> > This has been stable for quite a while under my usage; please test and 
> > report any issues.
> 
> First of all, I'm very happy to see this diff.  Thanks Philip.
> 
> I have been running this diff on my amd64 NFS client/server build
> machine since you posted it.  So far no issue, so it is stable for
> this usage as well.
> 
> I'd however appreciate it if you could commit the killjobc() and
> enter*grp() refactoring first, because in case of a revert this
> would be less painful.

I've done that.

> It's also for this reason that I introduced a macro for the
> NET_LOCK().  So I could enable/disable it without having to revert
> N files.  No idea if this could be useful there too.
> 
> I like the way you annotate the protected elements in the structure.
> I'll try to do the same for bpf.
> 
> I'm also suggesting you commit the `uidinfolk' bits first.  This seems
> quite safe.  In this exact part, what about introducing a uid_release(),
> a wrapper around rw_exit_write(&uidinfolk), to be called after uid_find()?
> This way you can keep the lock local.

And that too; here's an updated/rebased diff.

Index: sys/proc.h
===================================================================
RCS file: /cvs/src/sys/sys/proc.h,v
retrieving revision 1.247
diff -u -p -r1.247 proc.h
--- sys/proc.h  26 Feb 2018 13:43:51 -0000      1.247
+++ sys/proc.h  26 Feb 2018 16:47:58 -0000
@@ -44,6 +44,7 @@
 #include <sys/selinfo.h>               /* For struct selinfo */
 #include <sys/syslimits.h>             /* For LOGIN_NAME_MAX */
 #include <sys/queue.h>
+#include <sys/rwlock.h>                        /* For struct rwlock */
 #include <sys/timeout.h>               /* For struct timeout */
 #include <sys/event.h>                 /* For struct klist */
 #include <sys/mutex.h>                 /* For struct mutex */
@@ -55,16 +56,25 @@
 #endif
 
 /*
+ * Locks used to protect struct members in this file:
+ *     I       immutable after creation
+ *     t       proctreelk
+ *
+ * If multiple locks are listed then all are required for writes,
+ * but any one of them is sufficient for reads.
+ */
+
+/*
  * One structure allocated per session.
  */
 struct process;
 struct session {
        int     s_count;                /* Ref cnt; pgrps in session. */
-       struct  process *s_leader;      /* Session leader. */
+       struct  process *s_leader;      /* [t] Session leader. */
        struct  vnode *s_ttyvp;         /* Vnode of controlling terminal. */
-       struct  tty *s_ttyp;            /* Controlling terminal. */
-       char    s_login[LOGIN_NAME_MAX];        /* Setlogin() name. */
-       pid_t   s_verauthppid;
+       struct  tty *s_ttyp;            /* [t] Controlling terminal. */
+       char    s_login[LOGIN_NAME_MAX];/* setlogin() name. */
+       pid_t   s_verauthppid;          /* TIOCSETVERAUTH info */
        uid_t   s_verauthuid;
        struct timeout s_verauthto;
 };
@@ -75,10 +85,10 @@ void zapverauth(/* struct session */ voi
  * One structure allocated per process group.
  */
 struct pgrp {
-       LIST_ENTRY(pgrp) pg_hash;       /* Hash chain. */
-       LIST_HEAD(, process) pg_members;/* Pointer to pgrp members. */
-       struct  session *pg_session;    /* Pointer to session. */
-       pid_t   pg_id;                  /* Pgrp id. */
+       LIST_ENTRY(pgrp) pg_hash;       /* [t] Hash chain. */
+       LIST_HEAD(, process) pg_members;/* [t] Pointer to pgrp members. */
+       struct  session *pg_session;    /* [I] Pointer to session. */
+       pid_t   pg_id;                  /* [I] Pgrp id. */
        int     pg_jobc;        /* # procs qualifying pgrp for job control */
 };
 
@@ -156,17 +166,17 @@ struct process {
        LIST_ENTRY(process) ps_list;    /* List of all processes. */
        TAILQ_HEAD(,proc) ps_threads;   /* Threads in this process. */
 
-       LIST_ENTRY(process) ps_pglist;  /* List of processes in pgrp. */
-       struct  process *ps_pptr;       /* Pointer to parent process. */
-       LIST_ENTRY(process) ps_sibling; /* List of sibling processes. */
-       LIST_HEAD(, process) ps_children;/* Pointer to list of children. */
+       LIST_ENTRY(process) ps_pglist;  /* [t] List of processes in pgrp. */
+       struct  process *ps_pptr;       /* [t] Pointer to parent process. */
+       LIST_ENTRY(process) ps_sibling; /* [t] List of sibling processes. */
+       LIST_HEAD(, process) ps_children;/* [t] Pointer to list of children. */
        LIST_ENTRY(process) ps_hash;    /* Hash chain. */
 
        struct  sigacts *ps_sigacts;    /* Signal actions, state */
        struct  vnode *ps_textvp;       /* Vnode of executable. */
        struct  filedesc *ps_fd;        /* Ptr to open files structure */
        struct  vmspace *ps_vmspace;    /* Address space */
-       pid_t   ps_pid;                 /* Process identifier. */
+       pid_t   ps_pid;                 /* [I] Process identifier. */
 
 /* The following fields are all zeroed upon creation in process_new. */
 #define        ps_startzero    ps_klist
@@ -180,7 +190,7 @@ struct process {
        struct  vnode *ps_tracevp;      /* Trace to vnode. */
        struct  ucred *ps_tracecred;    /* Creds for writing trace */
 
-       pid_t   ps_oppid;               /* Save parent pid during ptrace. */
+       pid_t   ps_oppid;               /* [t] Save parent pid during ptrace. */
        int     ps_ptmask;              /* Ptrace event mask */
        struct  ptrace_state *ps_ptstat;/* Ptrace state */
 
@@ -197,7 +207,7 @@ struct process {
 /* The following fields are all copied upon creation in process_new. */
 #define        ps_startcopy    ps_limit
        struct  plimit *ps_limit;       /* Process limits. */
-       struct  pgrp *ps_pgrp;          /* Pointer to process group. */
+       struct  pgrp *ps_pgrp;          /* [t] Pointer to process group. */
        struct  emul *ps_emul;          /* Emulation information */
 
        char    ps_comm[MAXCOMLEN+1];
@@ -475,6 +485,7 @@ LIST_HEAD(processlist, process);
 extern struct processlist allprocess;  /* List of all processes. */
 extern struct processlist zombprocess; /* List of zombie processes. */
 extern struct proclist allproc;                /* List of all threads. */
+extern struct rwlock proctreelk;       /* parent/child, pgrp, session */
 
 extern struct process *initprocess;    /* Process slot for init. */
 extern struct proc *reaperproc;                /* Thread slot for reaper. */
Index: sys/ucred.h
===================================================================
RCS file: /cvs/src/sys/sys/ucred.h,v
retrieving revision 1.12
diff -u -p -r1.12 ucred.h
--- sys/ucred.h 19 Feb 2018 08:59:53 -0000      1.12
+++ sys/ucred.h 26 Feb 2018 16:47:58 -0000
@@ -67,8 +67,10 @@ struct xucred {
        gid_t   cr_groups[NGROUPS_MAX]; /* groups */
 };
 
-#ifdef _KERNEL
-#define        crhold(cr)      (cr)->cr_ref++
+#if defined(_KERNEL) && !defined(_STANDALONE)
+#include <sys/atomic.h>
+
+#define        crhold(cr)      atomic_inc_int(&(cr)->cr_ref)
 
 int            crfromxucred(struct ucred *, const struct xucred *);
 void           crset(struct ucred *, const struct ucred *);
@@ -79,6 +81,6 @@ struct ucred  *crget(void);
 int            suser(struct proc *p);
 int            suser_ucred(struct ucred *cred);
 
-#endif /* _KERNEL */
+#endif /* _KERNEL && !_STANDALONE */
 
 #endif /* !_SYS_UCRED_H_ */
Index: kern/exec_elf.c
===================================================================
RCS file: /cvs/src/sys/kern/exec_elf.c,v
retrieving revision 1.142
diff -u -p -r1.142 exec_elf.c
--- kern/exec_elf.c     30 Dec 2017 23:08:29 -0000      1.142
+++ kern/exec_elf.c     26 Feb 2018 16:47:57 -0000
@@ -1168,12 +1168,14 @@ coredump_notes_elf(struct proc *p, void 
                cpi.cpi_sigcatch = pr->ps_sigacts->ps_sigcatch;
 
                cpi.cpi_pid = pr->ps_pid;
+               rw_enter_read(&proctreelk);
                cpi.cpi_ppid = pr->ps_pptr->ps_pid;
                cpi.cpi_pgrp = pr->ps_pgid;
                if (pr->ps_session->s_leader)
                        cpi.cpi_sid = pr->ps_session->s_leader->ps_pid;
                else
                        cpi.cpi_sid = 0;
+               rw_exit_read(&proctreelk);
 
                cpi.cpi_ruid = p->p_ucred->cr_ruid;
                cpi.cpi_euid = p->p_ucred->cr_uid;
Index: kern/kern_acct.c
===================================================================
RCS file: /cvs/src/sys/kern/kern_acct.c,v
retrieving revision 1.35
diff -u -p -r1.35 kern_acct.c
--- kern/kern_acct.c    19 Feb 2018 08:59:52 -0000      1.35
+++ kern/kern_acct.c    26 Feb 2018 16:47:57 -0000
@@ -206,11 +206,13 @@ acct_process(struct proc *p)
        acct.ac_gid = pr->ps_ucred->cr_rgid;
 
        /* (7) The terminal from which the process was started */
+       rw_enter_read(&proctreelk);
        if ((pr->ps_flags & PS_CONTROLT) &&
            pr->ps_pgrp->pg_session->s_ttyp)
                acct.ac_tty = pr->ps_pgrp->pg_session->s_ttyp->t_dev;
        else
                acct.ac_tty = NODEV;
+       rw_exit_read(&proctreelk);
 
        /* (8) The boolean flags that tell how the process terminated, etc. */
        acct.ac_flag = pr->ps_acflag;
Index: kern/kern_exec.c
===================================================================
RCS file: /cvs/src/sys/kern/kern_exec.c,v
retrieving revision 1.193
diff -u -p -r1.193 kern_exec.c
--- kern/kern_exec.c    2 Jan 2018 06:38:45 -0000       1.193
+++ kern/kern_exec.c    26 Feb 2018 16:47:57 -0000
@@ -509,9 +509,11 @@ sys_execve(struct proc *p, void *v, regi
 
        atomic_setbits_int(&pr->ps_flags, PS_EXEC);
        if (pr->ps_flags & PS_PPWAIT) {
+               rw_enter_read(&proctreelk);
                atomic_clearbits_int(&pr->ps_flags, PS_PPWAIT);
                atomic_clearbits_int(&pr->ps_pptr->ps_flags, PS_ISPWAIT);
                wakeup(pr->ps_pptr);
+               rw_exit_read(&proctreelk);
        }
 
        /*
Index: kern/kern_exit.c
===================================================================
RCS file: /cvs/src/sys/kern/kern_exit.c,v
retrieving revision 1.164
diff -u -p -r1.164 kern_exit.c
--- kern/kern_exit.c    10 Feb 2018 10:32:51 -0000      1.164
+++ kern/kern_exit.c    26 Feb 2018 16:47:58 -0000
@@ -212,11 +212,7 @@ exit1(struct proc *p, int rv, int flags)
         * thread of a process that isn't PS_NOZOMBIE, we'll put
         * the process on the zombprocess list below.
         */
-       /*
-        * NOTE: WE ARE NO LONGER ALLOWED TO SLEEP!
-        */
-       p->p_stat = SDEAD;
-
+       rw_enter_write(&proctreelk);
        LIST_REMOVE(p, p_hash);
        LIST_REMOVE(p, p_list);
 
@@ -264,6 +260,7 @@ exit1(struct proc *p, int rv, int flags)
                        }
                }
        }
+       rw_exit_write(&proctreelk);
 
        /* add thread's accumulated rusage into the process's total */
        ruadd(rup, &p->p_ru);
@@ -292,9 +289,13 @@ exit1(struct proc *p, int rv, int flags)
                 * wait4() to return ECHILD.
                 */
                if (pr->ps_flags & PS_NOZOMBIE) {
-                       struct process *ppr = pr->ps_pptr;
+                       struct process *ppr;
+
+                       rw_enter_write(&proctreelk);
+                       ppr = pr->ps_pptr;
                        proc_reparent(pr, initprocess);
                        wakeup(ppr);
+                       rw_exit_write(&proctreelk);
                }
 
                /*
@@ -312,6 +313,11 @@ exit1(struct proc *p, int rv, int flags)
        }
 
        /*
+        * NOTE: WE ARE NO LONGER ALLOWED TO SLEEP!
+        */
+       p->p_stat = SDEAD;
+
+       /*
         * Other substructures are freed from reaper and wait().
         */
 
@@ -413,6 +419,7 @@ reaper(void)
                        /* Release the rest of the process's vmspace */
                        uvm_exit(pr);
 
+                       rw_enter_write(&proctreelk);
                        if ((pr->ps_flags & PS_NOZOMBIE) == 0) {
                                /* Process is now a true zombie. */
                                atomic_setbits_int(&pr->ps_flags, PS_ZOMBIE);
@@ -420,6 +427,7 @@ reaper(void)
 
                                 /* Wake up the parent so it can get exit status. */
                                wakeup(pr->ps_pptr);
+                               rw_exit_write(&proctreelk);
                        } else {
                                 /* No one will wait for us. Just zap the process now */
                                process_zap(pr);
@@ -473,6 +481,7 @@ dowait4(struct proc *q, pid_t pid, int *
                return (EINVAL);
 
 loop:
+       rw_enter_write(&proctreelk);
        nfound = 0;
        LIST_FOREACH(pr, &q->p_p->ps_children, ps_sibling) {
                if ((pr->ps_flags & PS_NOZOMBIE) ||
@@ -498,6 +507,7 @@ loop:
                    (pr->ps_flags & PS_WAITED) == 0 && pr->ps_single &&
                    pr->ps_single->p_stat == SSTOP &&
                    (pr->ps_single->p_flag & P_SUSPSINGLE) == 0) {
+                       rw_exit_write(&proctreelk);
                        single_thread_wait(pr);
 
                        atomic_setbits_int(&pr->ps_flags, PS_WAITED);
@@ -521,6 +531,7 @@ loop:
                                *statusp = W_STOPCODE(p->p_xstat);
                        if (rusage != NULL)
                                memset(rusage, 0, sizeof(*rusage));
+                       rw_exit_write(&proctreelk);
                        return (0);
                }
                if ((options & WCONTINUED) && (p->p_flag & P_CONTINUED)) {
@@ -531,16 +542,21 @@ loop:
                                *statusp = _WCONTINUED;
                        if (rusage != NULL)
                                memset(rusage, 0, sizeof(*rusage));
+                       rw_exit_write(&proctreelk);
                        return (0);
                }
        }
-       if (nfound == 0)
+       if (nfound == 0) {
+               rw_exit_write(&proctreelk);
                return (ECHILD);
+       }
        if (options & WNOHANG) {
+               rw_exit_write(&proctreelk);
                retval[0] = 0;
                return (0);
        }
-       if ((error = tsleep(q->p_p, PWAIT | PCATCH, "wait", 0)) != 0)
+       if ((error = rwsleep(q->p_p, &proctreelk, PWAIT | PCATCH | PNORELOCK,
+           "wait", 0)) != 0)
                return (error);
        goto loop;
 }
@@ -551,6 +567,8 @@ proc_finish_wait(struct proc *waiter, st
        struct process *pr, *tr;
        struct rusage *rup;
 
+       rw_assert_wrlock(&proctreelk);
+
        /*
         * If we got the child via a ptrace 'attach',
         * we need to give it back to the old parent.
@@ -562,6 +580,7 @@ proc_finish_wait(struct proc *waiter, st
                proc_reparent(pr, tr);
                prsignal(tr, SIGCHLD);
                wakeup(tr);
+               rw_exit_write(&proctreelk);
        } else {
                scheduler_wait_hook(waiter, p);
                p->p_xstat = 0;
@@ -580,6 +599,7 @@ void
 proc_reparent(struct process *child, struct process *parent)
 {
 
+       rw_assert_wrlock(&proctreelk);
        if (child->ps_pptr == parent)
                return;
 
@@ -594,12 +614,15 @@ process_zap(struct process *pr)
        struct vnode *otvp;
        struct proc *p = pr->ps_mainproc;
 
+       rw_assert_wrlock(&proctreelk);
+
        /*
         * Finally finished with old proc entry.
         * Unlink it from its process group and free it.
         */
        leavepgrp(pr);
        LIST_REMOVE(pr, ps_sibling);
+       rw_exit_write(&proctreelk);
 
        /*
         * Decrement the count of procs running with this uid.
Index: kern/kern_fork.c
===================================================================
RCS file: /cvs/src/sys/kern/kern_fork.c,v
retrieving revision 1.202
diff -u -p -r1.202 kern_fork.c
--- kern/kern_fork.c    30 Dec 2017 20:47:00 -0000      1.202
+++ kern/kern_fork.c    26 Feb 2018 16:47:58 -0000
@@ -224,7 +224,6 @@ process_new(struct proc *p, struct proce
            (caddr_t)&pr->ps_endcopy - (caddr_t)&pr->ps_startcopy);
 
        process_initialize(pr, p);
-       pr->ps_pid = allocpid();
 
        /* post-copy fixups */
        pr->ps_pptr = parent;
@@ -269,10 +268,9 @@ process_new(struct proc *p, struct proce
        /* mark as embryo to protect against others */
        pr->ps_flags |= PS_EMBRYO;
 
-       /* Force visibility of all of the above changes */
-       membar_producer();
-
        /* it's sufficiently inited to be globally visible */
+       rw_enter_write(&proctreelk);
+       pr->ps_pid = allocpid();
        LIST_INSERT_HEAD(&allprocess, pr, ps_list);
 
        return pr;
@@ -373,6 +371,7 @@ fork1(struct proc *curp, int flags, void
 
        /*
         * From now on, we're committed to the fork and cannot fail.
+        * process_new() returns with proctreelk held!
         */
        p = thread_new(curp, uaddr);
        pr = process_new(p, curpr, flags);
@@ -447,6 +446,7 @@ fork1(struct proc *curp, int flags, void
                        pr->ps_ptstat->pe_other_pid = curpr->ps_pid;
                }
        }
+       rw_exit_write(&proctreelk);
 
        /*
         * For new processes, set accounting bits and mark as complete.
Index: kern/kern_ktrace.c
===================================================================
RCS file: /cvs/src/sys/kern/kern_ktrace.c,v
retrieving revision 1.95
diff -u -p -r1.95 kern_ktrace.c
--- kern/kern_ktrace.c  19 Feb 2018 08:59:52 -0000      1.95
+++ kern/kern_ktrace.c  26 Feb 2018 16:47:58 -0000
@@ -448,6 +448,7 @@ doktrace(struct vnode *vp, int ops, int 
        /*
         * do it
         */
+       rw_enter_read(&proctreelk);
        if (pid < 0) {
                /*
                 * by process group
@@ -455,7 +456,7 @@ doktrace(struct vnode *vp, int ops, int 
                pg = pgfind(-pid);
                if (pg == NULL) {
                        error = ESRCH;
-                       goto done;
+                       goto done2;
                }
                LIST_FOREACH(pr, &pg->pg_members, ps_pglist) {
                        if (descend)
@@ -471,7 +472,7 @@ doktrace(struct vnode *vp, int ops, int 
                pr = prfind(pid);
                if (pr == NULL) {
                        error = ESRCH;
-                       goto done;
+                       goto done2;
                }
                if (descend)
                        ret |= ktrsetchildren(p, pr, ops, facs, vp, cred);
@@ -480,6 +481,8 @@ doktrace(struct vnode *vp, int ops, int 
        }
        if (!ret)
                error = EPERM;
+done2:
+       rw_exit_read(&proctreelk);
 done:
        return (error);
 }
@@ -548,6 +551,8 @@ ktrsetchildren(struct proc *curp, struct
 {
        struct process *pr;
        int ret = 0;
+
+       rw_assert_rdlock(&proctreelk);
 
        pr = top;
        for (;;) {
Index: kern/kern_proc.c
===================================================================
RCS file: /cvs/src/sys/kern/kern_proc.c,v
retrieving revision 1.82
diff -u -p -r1.82 kern_proc.c
--- kern/kern_proc.c    26 Feb 2018 13:43:51 -0000      1.82
+++ kern/kern_proc.c    26 Feb 2018 16:47:58 -0000
@@ -67,6 +67,8 @@ u_long pgrphash;
 struct processlist allprocess;
 struct processlist zombprocess;
 struct proclist allproc;
+struct rwlock proctreelk;
+struct rwlock uidinfolk;
 
 struct pool proc_pool;
 struct pool process_pool;
@@ -93,6 +95,7 @@ procinit(void)
        LIST_INIT(&zombprocess);
        LIST_INIT(&allproc);
 
+       rw_init(&proctreelk, "proctree");
        rw_init(&uidinfolk, "uidinfo");
 
        tidhashtbl = hashinit(maxthread / 4, M_PROC, M_NOWAIT, &tidhash);
@@ -140,6 +143,7 @@ uid_find(uid_t uid)
                if (uip->ui_uid == uid)
                        break;
        if (uip) {
+               /* XXX unlock uidinfolk across the free()? */
                free(nuip, M_PROC, sizeof(*nuip));
                return (uip);
        }
@@ -180,6 +184,7 @@ int
 inferior(struct process *pr, struct process *parent)
 {
 
+       rw_assert_wrlock(&proctreelk);
        for (; pr != parent; pr = pr->ps_pptr)
                if (pr->ps_pid == 0 || pr->ps_pid == 1)
                        return (0);
@@ -222,6 +227,7 @@ pgfind(pid_t pgid)
 {
        struct pgrp *pgrp;
 
+       rw_assert_anylock(&proctreelk);
        LIST_FOREACH(pgrp, PGRPHASH(pgid), pg_hash)
                if (pgrp->pg_id == pgid)
                        return (pgrp);
@@ -250,6 +256,8 @@ zombiefind(pid_t pid)
 void
 enternewpgrp(struct process *pr, struct pgrp *pgrp, struct session *newsess)
 {
+       rw_assert_wrlock(&proctreelk);
+
 #ifdef DIAGNOSTIC
        if (SESS_LEADER(pr))
                panic("%s: session leader attempted setpgrp", __func__);
@@ -292,6 +300,8 @@ enterthispgrp(struct process *pr, struct
 {
        struct pgrp *savepgrp = pr->ps_pgrp;
 
+       rw_assert_wrlock(&proctreelk);
+
        /*
         * Adjust eligibility of affected pgrps to participate in job control.
         * Increment eligibility counts before decrementing, otherwise we
@@ -302,6 +312,7 @@ enterthispgrp(struct process *pr, struct
 
        LIST_REMOVE(pr, ps_pglist);
        pr->ps_pgrp = pgrp;
+
        LIST_INSERT_HEAD(&pgrp->pg_members, pr, ps_pglist);
        if (LIST_EMPTY(&savepgrp->pg_members))
                pgdelete(savepgrp);
@@ -314,6 +325,7 @@ void
 leavepgrp(struct process *pr)
 {
 
+       rw_assert_wrlock(&proctreelk);
        if (pr->ps_session->s_verauthppid == pr->ps_pid)
                zapverauth(pr->ps_session);
        LIST_REMOVE(pr, ps_pglist);
@@ -329,6 +341,7 @@ void
 pgdelete(struct pgrp *pgrp)
 {
 
+       rw_assert_wrlock(&proctreelk);
        if (pgrp->pg_session->s_ttyp != NULL && 
            pgrp->pg_session->s_ttyp->t_pgrp == pgrp)
                pgrp->pg_session->s_ttyp->t_pgrp = NULL;
@@ -362,6 +375,8 @@ fixjobc(struct process *pr, struct pgrp 
        struct pgrp *hispgrp;
        struct session *mysession = pgrp->pg_session;
 
+       rw_assert_wrlock(&proctreelk);
+
        /*
         * Check pr's parent to see whether pr qualifies its own process
         * group; if so, adjust count for pr's process group.
@@ -393,6 +408,7 @@ fixjobc(struct process *pr, struct pgrp 
 void
 killjobc(struct process *pr)
 {
+       rw_enter_write(&proctreelk);
        if (SESS_LEADER(pr)) {
                struct session *sp = pr->ps_session;
 
@@ -430,6 +446,7 @@ killjobc(struct process *pr)
                sp->s_leader = NULL;
        }
        fixjobc(pr, pr->ps_pgrp, 0);
+       rw_exit_write(&proctreelk);
 }
 
 /* 
@@ -442,6 +459,7 @@ orphanpg(struct pgrp *pg)
 {
        struct process *pr;
 
+       rw_assert_wrlock(&proctreelk);
        LIST_FOREACH(pr, &pg->pg_members, ps_pglist) {
                if (pr->ps_mainproc->p_stat == SSTOP) {
                        LIST_FOREACH(pr, &pg->pg_members, ps_pglist) {
Index: kern/kern_prot.c
===================================================================
RCS file: /cvs/src/sys/kern/kern_prot.c,v
retrieving revision 1.73
diff -u -p -r1.73 kern_prot.c
--- kern/kern_prot.c    20 Feb 2018 12:38:58 -0000      1.73
+++ kern/kern_prot.c    26 Feb 2018 16:47:58 -0000
@@ -83,7 +83,9 @@ int
 sys_getppid(struct proc *p, void *v, register_t *retval)
 {
 
+       rw_enter_read(&proctreelk);
        *retval = p->p_p->ps_pptr->ps_pid;
+       rw_exit_read(&proctreelk);
        return (0);
 }
 
@@ -92,7 +94,9 @@ int
 sys_getpgrp(struct proc *p, void *v, register_t *retval)
 {
 
+       rw_enter_read(&proctreelk);
        *retval = p->p_p->ps_pgrp->pg_id;
+       rw_exit_read(&proctreelk);
        return (0);
 }
 
@@ -106,16 +110,23 @@ sys_getpgid(struct proc *curp, void *v, 
                syscallarg(pid_t) pid;
        } */ *uap = v;
        struct process *targpr = curp->p_p;
+       int error = 0;
 
-       if (SCARG(uap, pid) == 0 || SCARG(uap, pid) == targpr->ps_pid)
-               goto found;
+       if (SCARG(uap, pid) == 0 || SCARG(uap, pid) == targpr->ps_pid) {
+               rw_enter_read(&proctreelk);
+               *retval = targpr->ps_pgid;
+               rw_exit_read(&proctreelk);
+               return 0;
+       }
+       rw_enter_read(&proctreelk);
        if ((targpr = prfind(SCARG(uap, pid))) == NULL)
-               return (ESRCH);
-       if (targpr->ps_session != curp->p_p->ps_session)
-               return (EPERM);
-found:
-       *retval = targpr->ps_pgid;
-       return (0);
+               error = ESRCH;
+       else if (targpr->ps_session != curp->p_p->ps_session)
+               error = EPERM;
+       else
+               *retval = targpr->ps_pgid;
+       rw_exit_read(&proctreelk);
+       return error;
 }
 
 int
@@ -125,7 +136,9 @@ sys_getsid(struct proc *curp, void *v, r
                syscallarg(pid_t) pid;
        } */ *uap = v;
        struct process *targpr = curp->p_p;
+       int error = 0;
 
+       rw_enter_read(&proctreelk);
        if (SCARG(uap, pid) == 0 || SCARG(uap, pid) == targpr->ps_pid)
                goto found;
        if ((targpr = prfind(SCARG(uap, pid))) == NULL)
@@ -135,9 +148,12 @@ sys_getsid(struct proc *curp, void *v, r
 found:
        /* Skip exiting processes */
        if (targpr->ps_pgrp->pg_session->s_leader == NULL)
-               return (ESRCH);
-       *retval = targpr->ps_pgrp->pg_session->s_leader->ps_pid;
-       return (0);
+               error = ESRCH;
+       else
+               *retval = targpr->ps_pgrp->pg_session->s_leader->ps_pid;
+       rw_exit_read(&proctreelk);
+
+       return error;
 }
 
 int
@@ -224,12 +240,15 @@ sys_setsid(struct proc *p, void *v, regi
        newsess = pool_get(&session_pool, PR_WAITOK);
        newpgrp = pool_get(&pgrp_pool, PR_WAITOK);
 
+       rw_enter_write(&proctreelk);
        if (pr->ps_pgid == pid || pgfind(pid) != NULL) {
+               rw_exit_write(&proctreelk);
                pool_put(&pgrp_pool, newpgrp);
                pool_put(&session_pool, newsess);
                return (EPERM);
        } else {
                enternewpgrp(pr, newpgrp, newsess);
+               rw_exit_write(&proctreelk);
                *retval = pid;
                return (0);
        }
@@ -269,6 +288,7 @@ sys_setpgid(struct proc *curp, void *v, 
 
        newpgrp = pool_get(&pgrp_pool, PR_WAITOK);
 
+       rw_enter_write(&proctreelk);
        if (pid != 0 && pid != curpr->ps_pid) {
                if ((targpr = prfind(pid)) == 0 || !inferior(targpr, curpr)) {
                        error = ESRCH;
@@ -307,7 +327,8 @@ sys_setpgid(struct proc *curp, void *v, 
                else
                        enterthispgrp(targpr, pgrp);
        }
- out:
+out:
+       rw_exit_write(&proctreelk);
        if (newpgrp != NULL)
                pool_put(&pgrp_pool, newpgrp);
        return (error);
Index: kern/kern_resource.c
===================================================================
RCS file: /cvs/src/sys/kern/kern_resource.c,v
retrieving revision 1.58
diff -u -p -r1.58 kern_resource.c
--- kern/kern_resource.c        19 Feb 2018 08:59:52 -0000      1.58
+++ kern/kern_resource.c        26 Feb 2018 16:47:58 -0000
@@ -90,13 +90,17 @@ sys_getpriority(struct proc *curp, void 
        case PRIO_PGRP: {
                struct pgrp *pg;
 
+               rw_enter_read(&proctreelk);
                if (SCARG(uap, who) == 0)
                        pg = curp->p_p->ps_pgrp;
-               else if ((pg = pgfind(SCARG(uap, who))) == NULL)
+               else if ((pg = pgfind(SCARG(uap, who))) == NULL) {
+                       rw_exit_read(&proctreelk);
                        break;
+               }
                LIST_FOREACH(pr, &pg->pg_members, ps_pglist)
                        if (pr->ps_nice < low)
                                low = pr->ps_nice;
+               rw_exit_read(&proctreelk);
                break;
        }
 
@@ -145,14 +149,18 @@ sys_setpriority(struct proc *curp, void 
        case PRIO_PGRP: {
                struct pgrp *pg;
                 
+               rw_enter_read(&proctreelk);
                if (SCARG(uap, who) == 0)
                        pg = curp->p_p->ps_pgrp;
-               else if ((pg = pgfind(SCARG(uap, who))) == NULL)
+               else if ((pg = pgfind(SCARG(uap, who))) == NULL) {
+                       rw_exit_read(&proctreelk);
                        break;
+               }
                LIST_FOREACH(pr, &pg->pg_members, ps_pglist) {
                        error = donice(curp, pr, SCARG(uap, prio));
                        found++;
                }
+               rw_exit_read(&proctreelk);
                break;
        }
 
Index: kern/kern_sig.c
===================================================================
RCS file: /cvs/src/sys/kern/kern_sig.c,v
retrieving revision 1.216
diff -u -p -r1.216 kern_sig.c
--- kern/kern_sig.c     26 Feb 2018 13:33:25 -0000      1.216
+++ kern/kern_sig.c     26 Feb 2018 16:47:58 -0000
@@ -662,6 +662,7 @@ killpg1(struct proc *cp, int signum, int
                                prsignal(pr, signum);
                }
        } else {
+               rw_enter_read(&proctreelk);
                if (pgid == 0)
                        /*
                         * zero pgid means send to my process group.
@@ -669,8 +670,10 @@ killpg1(struct proc *cp, int signum, int
                        pgrp = cp->p_p->ps_pgrp;
                else {
                        pgrp = pgfind(pgid);
-                       if (pgrp == NULL)
+                       if (pgrp == NULL) {
+                               rw_exit_read(&proctreelk);
                                return (ESRCH);
+                       }
                }
                LIST_FOREACH(pr, &pgrp->pg_members, ps_pglist) {
                        if (pr->ps_pid <= 1 || pr->ps_flags & PS_SYSTEM ||
@@ -680,6 +683,7 @@ killpg1(struct proc *cp, int signum, int
                        if (signum)
                                prsignal(pr, signum);
                }
+               rw_exit_read(&proctreelk);
        }
        return (nfound ? 0 : ESRCH);
 }
@@ -1329,6 +1333,7 @@ proc_stop_sweep(void *v)
 {
        struct process *pr;
 
+       rw_enter_read(&proctreelk);
        LIST_FOREACH(pr, &allprocess, ps_list) {
                if ((pr->ps_flags & PS_STOPPED) == 0)
                        continue;
@@ -1338,6 +1343,7 @@ proc_stop_sweep(void *v)
                        prsignal(pr->ps_pptr, SIGCHLD);
                wakeup(pr->ps_pptr);
        }
+       rw_exit_read(&proctreelk);
 }
 
 /*
Index: kern/kern_sysctl.c
===================================================================
RCS file: /cvs/src/sys/kern/kern_sysctl.c,v
retrieving revision 1.332
diff -u -p -r1.332 kern_sysctl.c
--- kern/kern_sysctl.c  19 Feb 2018 08:59:52 -0000      1.332
+++ kern/kern_sysctl.c  26 Feb 2018 16:47:58 -0000
@@ -1507,6 +1507,7 @@ again:
                        break;
 
                case KERN_PROC_TTY:
+                       /* XXX proctreelk? */
                        if ((pr->ps_flags & PS_CONTROLT) == 0 ||
                            pr->ps_session->s_ttyp == NULL ||
                            pr->ps_session->s_ttyp->t_dev != (dev_t)arg)
@@ -1613,6 +1614,7 @@ fill_kproc(struct process *pr, struct ki
        if (s->s_leader)
                ki->p_sid = s->s_leader->ps_pid;
 
+       /* XXX proctreelk */
        if ((pr->ps_flags & PS_CONTROLT) && (tp = s->s_ttyp)) {
                ki->p_tdev = tp->t_dev;
                ki->p_tpgid = tp->t_pgrp ? tp->t_pgrp->pg_id : -1;
Index: kern/subr_prf.c
===================================================================
RCS file: /cvs/src/sys/kern/subr_prf.c,v
retrieving revision 1.93
diff -u -p -r1.93 subr_prf.c
--- kern/subr_prf.c     5 Jan 2018 11:10:25 -0000       1.93
+++ kern/subr_prf.c     26 Feb 2018 16:47:58 -0000
@@ -362,6 +362,7 @@ uprintf(const char *fmt, ...)
        struct process *pr = curproc->p_p;
        va_list ap;
 
+       /* XXX proctreelk? */
        if (pr->ps_flags & PS_CONTROLT && pr->ps_session->s_ttyvp) {
                va_start(ap, fmt);
                kprintf(fmt, TOTTY, pr->ps_session->s_ttyp, NULL, ap);
Index: kern/sys_process.c
===================================================================
RCS file: /cvs/src/sys/kern/sys_process.c,v
retrieving revision 1.80
diff -u -p -r1.80 sys_process.c
--- kern/sys_process.c  19 Feb 2018 09:25:13 -0000      1.80
+++ kern/sys_process.c  26 Feb 2018 16:47:58 -0000
@@ -276,8 +276,13 @@ ptrace_ctrl(struct proc *p, int req, pid
        struct proc *t;                         /* target thread */
        struct process *tr;                     /* target process */
        int error = 0;
+       int proctree_locked;
        int s;
 
+       /* Lock proctree before looking up the process. */
+       rw_enter_write(&proctreelk);
+       proctree_locked = 1;
+
        switch (req) {
        case PT_TRACE_ME:
                /* Just set the trace flag. */
@@ -288,6 +293,7 @@ ptrace_ctrl(struct proc *p, int req, pid
                        tr->ps_ptstat = malloc(sizeof(*tr->ps_ptstat),
                            M_SUBPROC, M_WAITOK);
                memset(tr->ps_ptstat, 0, sizeof(*tr->ps_ptstat));
+               rw_exit_write(&proctreelk);
                return 0;
 
        /* calls that only operate on the PID */
@@ -487,6 +493,10 @@ ptrace_ctrl(struct proc *p, int req, pid
                atomic_clearbits_int(&tr->ps_flags, PS_TRACED|PS_WAITED);
 
        sendsig:
+               KASSERT(proctree_locked);
+               proctree_locked = 0;
+               rw_exit_write(&proctreelk);
+
                memset(tr->ps_ptstat, 0, sizeof(*tr->ps_ptstat));
 
                /* Finally, deliver the requested signal (or none). */
@@ -534,6 +544,8 @@ ptrace_ctrl(struct proc *p, int req, pid
        }
 
 fail:
+       if (proctree_locked)
+               rw_exit_write(&proctreelk);
        return error;
 }
 
Index: kern/syscalls.master
===================================================================
RCS file: /cvs/src/sys/kern/syscalls.master,v
retrieving revision 1.180
diff -u -p -r1.180 syscalls.master
--- kern/syscalls.master        12 Dec 2017 01:12:34 -0000      1.180
+++ kern/syscalls.master        26 Feb 2018 16:47:58 -0000
@@ -107,7 +107,7 @@
 36     STD             { void sys_sync(void); }
 37     OBSOL           o58_kill
 38     STD             { int sys_stat(const char *path, struct stat *ub); }
-39     STD             { pid_t sys_getppid(void); }
+39     STD NOLOCK      { pid_t sys_getppid(void); }
 40     STD             { int sys_lstat(const char *path, struct stat *ub); }
 41     STD             { int sys_dup(int fd); }
 42     STD             { int sys_fstatat(int fd, const char *path, \
@@ -185,7 +185,7 @@
                            gid_t *gidset); }
 80     STD             { int sys_setgroups(int gidsetsize, \
                            const gid_t *gidset); }
-81     STD             { int sys_getpgrp(void); }
+81     STD NOLOCK      { int sys_getpgrp(void); }
 82     STD             { int sys_setpgid(pid_t pid, pid_t pgid); }
 83     STD NOLOCK      { int sys_futex(uint32_t *f, int op, int val, \
                            const struct timespec *timeout, uint32_t *g); }
Index: kern/tty.c
===================================================================
RCS file: /cvs/src/sys/kern/tty.c,v
retrieving revision 1.137
diff -u -p -r1.137 tty.c
--- kern/tty.c  19 Feb 2018 08:59:52 -0000      1.137
+++ kern/tty.c  26 Feb 2018 16:47:58 -0000
@@ -973,10 +973,13 @@ ttioctl(struct tty *tp, u_long cmd, cadd
                break;
        case TIOCSCTTY:                 /* become controlling tty */
                /* Session ctty vnode pointer set in vnode layer. */
+               rw_enter_write(&proctreelk);
                if (!SESS_LEADER(pr) ||
                    ((pr->ps_session->s_ttyvp || tp->t_session) &&
-                    (tp->t_session != pr->ps_session)))
+                    (tp->t_session != pr->ps_session))) {
+                       rw_exit_write(&proctreelk);
                        return (EPERM);
+               }
                if (tp->t_session)
                        SESSRELE(tp->t_session);
                SESSHOLD(pr->ps_session);
@@ -984,10 +987,14 @@ ttioctl(struct tty *tp, u_long cmd, cadd
                tp->t_pgrp = pr->ps_pgrp;
                pr->ps_session->s_ttyp = tp;
                atomic_setbits_int(&pr->ps_flags, PS_CONTROLT);
+               rw_exit_write(&proctreelk);
                break;
        case TIOCSPGRP: {               /* set pgrp of tty */
-               struct pgrp *pgrp = pgfind(*(int *)data);
+               struct pgrp *pgrp;
 
+               rw_enter_write(&proctreelk);
+               pgrp = pgfind(*(int *)data);
+               rw_exit_write(&proctreelk);
                if (!isctty(pr, tp))
                        return (ENOTTY);
                else if (pgrp == NULL)
@@ -2126,6 +2133,7 @@ process_sum(struct process *pr, fixpt_t 
 
 /*
  * Report on state of foreground process group.
+ * XXX needs proctreelk?
  */
 void
 ttyinfo(struct tty *tp)

Reply via email to