exit1(9): do not deadlock if exit is called due to PT_SC_REMOTERQ

The remote syscall is executed in the context where debugger owns a
p_lock hold on the target.  Due to this, exit1() waiting for p_lock
going to zero, never happen.

Postpone the exit1() call to ast then, saving the provided rval and
signo in the struct proc.  Mark the async-exiting proc with the new
p_flag P_ASYNC_EXIT.

While p_xexit can be reused, p_xsig can be only set by actual exit1(),
otherwise it breaks the ptrace mechanism. Allocate a dedicated p_asig
for it.

Reviewed by:	markj
Sponsored by:	The FreeBSD Foundation
MFC after:	1 week
Differential revision:	https://reviews.freebsd.org/D57482
This commit is contained in:
Konstantin Belousov
2026-06-05 23:21:59 +03:00
parent 9f378397ee
commit a2cfe53577
9 changed files with 72 additions and 20 deletions
+2 -2
View File
@@ -486,8 +486,8 @@ linux_exit(struct thread *td, struct linux_exit_args *args)
* exit via pthread_exit() try thr_exit() first. * exit via pthread_exit() try thr_exit() first.
*/ */
kern_thr_exit(td); kern_thr_exit(td);
exit1(td, args->rval, 0); kern_exit(td, args->rval, 0);
/* NOTREACHED */ return (0);
} }
int int
+2 -2
View File
@@ -1545,8 +1545,8 @@ linux_exit_group(struct thread *td, struct linux_exit_group_args *args)
* SIGNAL_EXIT_GROUP is set. We ignore that (temporarily?) * SIGNAL_EXIT_GROUP is set. We ignore that (temporarily?)
* as it doesnt occur often. * as it doesnt occur often.
*/ */
exit1(td, args->error_code, 0); kern_exit(td, args->error_code, 0);
/* NOTREACHED */ return (0);
} }
#define _LINUX_CAPABILITY_VERSION_1 0x19980330 #define _LINUX_CAPABILITY_VERSION_1 0x19980330
+6 -7
View File
@@ -341,11 +341,11 @@ post_execve(struct thread *td, int error, struct vmspace *oldvmspace)
} }
/* /*
* kern_execve() has the astonishing property of not always returning to * kern_execve() has the astonishing property of not always returning
* the caller. If sufficiently bad things happen during the call to * to the caller. If sufficiently bad things happen during the call
* do_execve(), it can end up calling exit1(); as a result, callers must * to do_execve(), it can end up calling exit2(). Callers must avoid
* avoid doing anything which they might need to undo (e.g., allocating * doing anything which they might need to undo (e.g., allocating
* memory). * memory), unless called from the ptrace(PT_SC_REMOTERQ) handler.
*/ */
int int
kern_execve(struct thread *td, struct image_args *args, struct mac *mac_p, kern_execve(struct thread *td, struct image_args *args, struct mac *mac_p,
@@ -1042,8 +1042,7 @@ do_execve(struct thread *td, struct image_args *args, struct mac *mac_p,
if (error && imgp->vmspace_destroyed) { if (error && imgp->vmspace_destroyed) {
/* sorry, no more process anymore. exit gracefully */ /* sorry, no more process anymore. exit gracefully */
exec_cleanup(td, oldvmspace); exec_cleanup(td, oldvmspace);
exit1(td, 0, SIGABRT); kern_exit(td, 0, SIGABRT);
/* NOT REACHED */
} }
#ifdef KTRACE #ifdef KTRACE
+53 -4
View File
@@ -204,9 +204,8 @@ exit_onexit(struct proc *p)
int int
sys__exit(struct thread *td, struct _exit_args *uap) sys__exit(struct thread *td, struct _exit_args *uap)
{ {
kern_exit(td, uap->rval, 0);
exit1(td, uap->rval, 0); return (0);
__unreachable();
} }
void void
@@ -216,6 +215,48 @@ proc_set_p2_wexit(struct proc *p)
p->p_flag2 |= P2_WEXIT; p->p_flag2 |= P2_WEXIT;
} }
static void
ast_async_exit(struct thread *td, int asts)
{
struct proc *p;
p = td->td_proc;
if ((p->p_flag & P_ASYNC_EXIT) != 0)
exit1(td, p->p_xexit, p->p_asig);
}
/*
* The variation on exit1() intended to be used in the syscall
* handlers. Unlike exit1(), it might delay the current process exit
* to ast. This is needed e.g. when _exit(2) is executed due to the
* ptrace(PT_SC_REMOTERQ), which must do more work after the syscall
* handler call.
*/
void
kern_exit(struct thread *td, int rval, int signo)
{
struct proc *p;
KASSERT(rval == 0 || signo == 0,
("kern_exit rv %d sig %d", rval, signo));
p = td->td_proc;
if ((td->td_dbgflags & TDB_SCREMOTEREQ) != 0) {
PROC_LOCK(p);
p->p_xexit = rval;
p->p_asig = signo;
p->p_flag |= P_ASYNC_EXIT;
ast_sched(td, TDA_ASYNC_EXIT);
PROC_UNLOCK(p);
return;
}
if ((p->p_flag & P_ASYNC_EXIT) != 0) {
rval = p->p_xexit;
signo = p->p_asig;
}
exit1(td, rval, signo);
}
/* /*
* Exit: deallocate address space and other resources, change proc state to * Exit: deallocate address space and other resources, change proc state to
* zombie, and unlink proc from allproc and parent's lists. Save exit status * zombie, and unlink proc from allproc and parent's lists. Save exit status
@@ -231,6 +272,7 @@ exit1(struct thread *td, int rval, int signo)
mtx_assert(&Giant, MA_NOTOWNED); mtx_assert(&Giant, MA_NOTOWNED);
KASSERT(rval == 0 || signo == 0, ("exit1 rv %d sig %d", rval, signo)); KASSERT(rval == 0 || signo == 0, ("exit1 rv %d sig %d", rval, signo));
MPASS((td->td_dbgflags & TDB_SCREMOTEREQ) == 0);
TSPROCEXIT(td->td_proc->p_pid); TSPROCEXIT(td->td_proc->p_pid);
p = td->td_proc; p = td->td_proc;
@@ -828,7 +870,7 @@ kern_abort2(struct thread *td, const char *why, int nargs, void **uargs)
sbuf_delete(sb); sbuf_delete(sb);
PROC_LOCK(p); PROC_LOCK(p);
sigexit(td, sig); sigexit(td, sig);
/* NOTREACHED */ return (0);
} }
#ifdef COMPAT_43 #ifdef COMPAT_43
@@ -1627,3 +1669,10 @@ proc_reparent(struct proc *child, struct proc *parent, bool set_oppid)
if (set_oppid) if (set_oppid)
child->p_oppid = parent->p_pid; child->p_oppid = parent->p_pid;
} }
static void
initexit(void *dummy __unused)
{
ast_register(TDA_ASYNC_EXIT, ASTR_ASTF_REQUIRED, 0, ast_async_exit);
}
SYSINIT(exit, SI_SUB_EXEC, SI_ORDER_ANY, initexit, NULL);
+2 -1
View File
@@ -66,6 +66,7 @@
#include <sys/signalvar.h> #include <sys/signalvar.h>
#include <sys/sx.h> #include <sys/sx.h>
#include <sys/syscall.h> #include <sys/syscall.h>
#include <sys/syscallsubr.h>
#include <sys/sysent.h> #include <sys/sysent.h>
#include <sys/sysproto.h> #include <sys/sysproto.h>
#include <sys/vmmeter.h> #include <sys/vmmeter.h>
@@ -1258,7 +1259,7 @@ fork_return(struct thread *td, struct trapframe *frame)
* If the prison was killed mid-fork, die along with it. * If the prison was killed mid-fork, die along with it.
*/ */
if (!prison_isalive(td->td_ucred->cr_prison)) if (!prison_isalive(td->td_ucred->cr_prison))
exit1(td, 0, SIGKILL); kern_exit(td, 0, SIGKILL);
#ifdef KTRACE #ifdef KTRACE
if (KTRPOINT(td, KTR_SYSRET)) if (KTRPOINT(td, KTR_SYSRET))
+2 -2
View File
@@ -46,6 +46,7 @@
#include <sys/racct.h> #include <sys/racct.h>
#include <sys/resourcevar.h> #include <sys/resourcevar.h>
#include <sys/rmlock.h> #include <sys/rmlock.h>
#include <sys/syscallsubr.h>
#include <sys/sysctl.h> #include <sys/sysctl.h>
#include <sys/syslog.h> #include <sys/syslog.h>
#include <sys/ucoredump.h> #include <sys/ucoredump.h>
@@ -197,8 +198,7 @@ sigexit(struct thread *td, int sig)
err != NULL ? err : ""); err != NULL ? err : "");
} else } else
PROC_UNLOCK(p); PROC_UNLOCK(p);
exit1(td, 0, sig); kern_exit(td, 0, sig);
/* NOTREACHED */
} }
+3 -1
View File
@@ -504,6 +504,7 @@ enum {
TDA_MOD3, /* .. and after */ TDA_MOD3, /* .. and after */
TDA_MOD4, TDA_MOD4,
TDA_SCHED_PRIV, TDA_SCHED_PRIV,
TDA_ASYNC_EXIT,
TDA_MAX, TDA_MAX,
}; };
#define TDAI(tda) (1U << (tda)) #define TDAI(tda) (1U << (tda))
@@ -777,6 +778,7 @@ struct proc {
TAILQ_HEAD(, kq_timer_cb_data) p_kqtim_stop; /* (c) */ TAILQ_HEAD(, kq_timer_cb_data) p_kqtim_stop; /* (c) */
LIST_ENTRY(proc) p_jaillist; /* (d) Jail process linkage. */ LIST_ENTRY(proc) p_jaillist; /* (d) Jail process linkage. */
u_int p_asig; /* (c) ASYNCEXIT pending signal. */
}; };
#define p_session p_pgrp->pg_session #define p_session p_pgrp->pg_session
@@ -842,7 +844,7 @@ struct proc {
#define P_INEXEC 0x04000000 /* Process is in execve(). */ #define P_INEXEC 0x04000000 /* Process is in execve(). */
#define P_STATCHILD 0x08000000 /* Child process stopped or exited. */ #define P_STATCHILD 0x08000000 /* Child process stopped or exited. */
#define P_INMEM 0x10000000 /* Loaded into memory, always set. */ #define P_INMEM 0x10000000 /* Loaded into memory, always set. */
#define P_UNUSED1 0x20000000 /* --available-- */ #define P_ASYNC_EXIT 0x20000000 /* XXX */
#define P_UNUSED2 0x40000000 /* --available-- */ #define P_UNUSED2 0x40000000 /* --available-- */
#define P_PPTRACE 0x80000000 /* PT_TRACEME by vforked child. */ #define P_PPTRACE 0x80000000 /* PT_TRACEME by vforked child. */
+1 -1
View File
@@ -399,7 +399,7 @@ int sigacts_shared(struct sigacts *ps);
int sig_ast_checksusp(struct thread *td); int sig_ast_checksusp(struct thread *td);
int sig_ast_needsigchk(struct thread *td); int sig_ast_needsigchk(struct thread *td);
void sig_drop_caught(struct proc *p); void sig_drop_caught(struct proc *p);
void sigexit(struct thread *td, int sig) __dead2; void sigexit(struct thread *td, int sig);
int sigev_findtd(struct proc *p, struct sigevent *sigev, struct thread **); int sigev_findtd(struct proc *p, struct sigevent *sigev, struct thread **);
void sigfastblock_clear(struct thread *td); void sigfastblock_clear(struct thread *td);
void sigfastblock_fetch(struct thread *td); void sigfastblock_fetch(struct thread *td);
+1
View File
@@ -136,6 +136,7 @@ int kern_cpuset_setid(struct thread *td, cpuwhich_t which,
int kern_dup(struct thread *td, u_int mode, int flags, int old, int new); int kern_dup(struct thread *td, u_int mode, int flags, int old, int new);
int kern_execve(struct thread *td, struct image_args *args, int kern_execve(struct thread *td, struct image_args *args,
struct mac *mac_p, struct vmspace *oldvmspace); struct mac *mac_p, struct vmspace *oldvmspace);
void kern_exit(struct thread *, int, int);
int kern_extattr_delete_fd(struct thread *td, int fd, int attrnamespace, int kern_extattr_delete_fd(struct thread *td, int fd, int attrnamespace,
const char *attrname); const char *attrname);
int kern_extattr_delete_path(struct thread *td, const char *path, int kern_extattr_delete_path(struct thread *td, const char *path,