// rust/library/std/src/sys/pal/unix/process/process_unix.rs

use crate::fmt;
use crate::io::{self, Error, ErrorKind};
use crate::mem;
use crate::num::NonZero;
use crate::sys;
use crate::sys::cvt;
use crate::sys::process::process_common::*;

#[cfg(target_os = "linux")]
use crate::sys::pal::unix::linux::pidfd::PidFd;

#[cfg(target_os = "vxworks")]
use libc::RTP_ID as pid_t;

#[cfg(not(target_os = "vxworks"))]
use libc::{c_int, pid_t};

#[cfg(not(any(
    target_os = "vxworks",
    target_os = "l4re",
    target_os = "tvos",
    target_os = "watchos",
)))]
use libc::{gid_t, uid_t};

cfg_if::cfg_if! {
    if #[cfg(all(target_os = "nto", target_env = "nto71"))] {
        use crate::thread;
        use libc::{c_char, posix_spawn_file_actions_t, posix_spawnattr_t};
        use crate::time::Duration;
        use crate::sync::LazyLock;
        // Smallest amount of time we can meaningfully sleep, taken from the
        // resolution of the monotonic clock. The value is computed once and
        // cached; if the resolution cannot be queried, 1 ms is assumed.
        fn get_clock_resolution() -> Duration {
            static MIN_DELAY: LazyLock<Duration, fn() -> Duration> = LazyLock::new(|| {
                let mut resolution = libc::timespec { tv_sec: 0, tv_nsec: 0 };
                let rc = unsafe { libc::clock_getres(libc::CLOCK_MONOTONIC, &mut resolution) };
                match rc {
                    // NOTE(review): only `tv_nsec` is used, `tv_sec` is ignored;
                    // presumably the resolution is always below one second.
                    0 => Duration::from_nanos(resolution.tv_nsec as u64),
                    _ => Duration::from_millis(1),
                }
            });
            *MIN_DELAY
        }
        // Arbitrary initial delay used when retrying fork/spawn after EBADF.
        // The retry loops in this file double the delay after every failed attempt.
        const MIN_FORKSPAWN_SLEEP: Duration = Duration::from_nanos(1);
        // Upper bound for the retry delay: once the delay has grown to this value
        // the retry loops stop sleeping, give up, and return an error.
        const MAX_FORKSPAWN_SLEEP: Duration = Duration::from_millis(1000);
    }
}

////////////////////////////////////////////////////////////////////////////////
// Command
////////////////////////////////////////////////////////////////////////////////

impl Command {
    /// Spawns the child process described by this `Command`.
    ///
    /// `posix_spawn` is tried first; when it declines (returns `None`) the
    /// fork + exec path below is used. On that path the child reports an exec
    /// failure to the parent as an 8-byte message: the errno as a big-endian
    /// `u32` followed by the `NOEX` footer. The parent treats a 0-byte read on
    /// the channel as a successful exec.
    ///
    /// On success returns the `Process` handle together with the parent's
    /// ends of the stdio pipes.
    ///
    /// # Errors
    ///
    /// Returns `InvalidInput` if a nul byte was seen in the provided data, and
    /// otherwise propagates errors from stdio setup, `posix_spawn`, creation
    /// of the parent/child channel, `fork`, or the errno reported by the child.
    ///
    /// # Panics
    ///
    /// Panics in the parent if reading the channel fails with anything other
    /// than an interruption, if the read is short, or if the footer of the
    /// child's message does not match.
    pub fn spawn(
        &mut self,
        default: Stdio,
        needs_stdin: bool,
    ) -> io::Result<(Process, StdioPipes)> {
        // Trailer appended to the errno message so the parent can validate it.
        const CLOEXEC_MSG_FOOTER: [u8; 4] = *b"NOEX";

        let envp = self.capture_env();

        if self.saw_nul() {
            return Err(io::const_io_error!(
                ErrorKind::InvalidInput,
                "nul byte found in provided data",
            ));
        }

        let (ours, theirs) = self.setup_io(default, needs_stdin)?;

        // Fast path: `Some` means the child was already created via posix_spawn.
        if let Some(ret) = self.posix_spawn(&theirs, envp.as_ref())? {
            return Ok((ret, ours));
        }

        // Channel used by the child to report an exec failure (and, on Linux,
        // to pass the pidfd): `input` is read by the parent, `output` is
        // written by the child.
        #[cfg(target_os = "linux")]
        let (input, output) = sys::net::Socket::new_pair(libc::AF_UNIX, libc::SOCK_SEQPACKET)?;

        #[cfg(not(target_os = "linux"))]
        let (input, output) = sys::pipe::anon_pipe()?;

        // Whatever happens after the fork is almost for sure going to touch or
        // look at the environment in one way or another (PATH in `execvp` or
        // accessing the `environ` pointer ourselves). Make sure no other thread
        // is accessing the environment when we do the fork itself.
        //
        // Note that as soon as we're done with the fork there's no need to hold
        // a lock any more because the parent won't do anything and the child is
        // in its own process. Thus the parent drops the lock guard immediately.
        // The child calls `mem::forget` to leak the lock, which is crucial because
        // releasing a lock is not async-signal-safe.
        let env_lock = sys::os::env_read_lock();
        let pid = unsafe { self.do_fork()? };

        // Child side: this branch never returns to the caller.
        if pid == 0 {
            crate::panic::always_abort();
            mem::forget(env_lock); // avoid non-async-signal-safe unlocking
            drop(input);
            #[cfg(target_os = "linux")]
            if self.get_create_pidfd() {
                self.send_pidfd(&output);
            }
            // `do_exec` only ever returns on failure, hence the irrefutable `Err`.
            let Err(err) = unsafe { self.do_exec(theirs, envp.as_ref()) };
            let errno = err.raw_os_error().unwrap_or(libc::EINVAL) as u32;
            let errno = errno.to_be_bytes();
            let bytes = [
                errno[0],
                errno[1],
                errno[2],
                errno[3],
                CLOEXEC_MSG_FOOTER[0],
                CLOEXEC_MSG_FOOTER[1],
                CLOEXEC_MSG_FOOTER[2],
                CLOEXEC_MSG_FOOTER[3],
            ];
            // pipe I/O up to PIPE_BUF bytes should be atomic, and then
            // we want to be sure we *don't* run at_exit destructors as
            // we're being torn down regardless
            rtassert!(output.write(&bytes).is_ok());
            unsafe { libc::_exit(1) }
        }

        // Parent side from here on.
        drop(env_lock);
        drop(output);

        // -1 means "no pidfd"; `Process::new` maps it to `None` on Linux.
        #[cfg(target_os = "linux")]
        let pidfd = if self.get_create_pidfd() { self.recv_pidfd(&input) } else { -1 };

        #[cfg(not(target_os = "linux"))]
        let pidfd = -1;

        // Safety: We obtained the pidfd (on Linux) using SOCK_SEQPACKET, so it's valid.
        let mut p = unsafe { Process::new(pid, pidfd) };
        let mut bytes = [0; 8];

        // loop to handle EINTR
        loop {
            match input.read(&mut bytes) {
                // Nothing was written by the child: treated as a successful exec.
                Ok(0) => return Ok((p, ours)),
                // A full error report: validate the footer, reap the child, and
                // surface the child's errno to the caller.
                Ok(8) => {
                    let (errno, footer) = bytes.split_at(4);
                    assert_eq!(
                        CLOEXEC_MSG_FOOTER, footer,
                        "Validation on the CLOEXEC pipe failed: {:?}",
                        bytes
                    );
                    let errno = i32::from_be_bytes(errno.try_into().unwrap());
                    assert!(p.wait().is_ok(), "wait() should either return Ok or panic");
                    return Err(Error::from_raw_os_error(errno));
                }
                Err(ref e) if e.is_interrupted() => {}
                Err(e) => {
                    assert!(p.wait().is_ok(), "wait() should either return Ok or panic");
                    panic!("the CLOEXEC pipe failed: {e:?}")
                }
                Ok(..) => {
                    // pipe I/O up to PIPE_BUF bytes should be atomic
                    // similarly SOCK_SEQPACKET messages should arrive whole
                    assert!(p.wait().is_ok(), "wait() should either return Ok or panic");
                    panic!("short read on the CLOEXEC pipe")
                }
            }
        }
    }

    /// Spawns the command with `Stdio::MakePipe` as the default stdio and
    /// without requesting stdin, then hands the child and its pipes to
    /// `wait_with_output`.
    ///
    /// Returns the exit status and two byte buffers (presumably the captured
    /// stdout and stderr, in that order; see `wait_with_output`).
    pub fn output(&mut self) -> io::Result<(ExitStatus, Vec<u8>, Vec<u8>)> {
        self.spawn(Stdio::MakePipe, false).and_then(|(child, child_pipes)| {
            crate::sys_common::process::wait_with_output(child, child_pipes)
        })
    }

    // WatchOS and TVOS headers mark the `fork`/`exec*` functions with
    // `__WATCHOS_PROHIBITED __TVOS_PROHIBITED`, and indicate that the
    // `posix_spawn*` functions should be used instead. It isn't entirely clear
    // what `PROHIBITED` means here (e.g. if calls to these functions are
    // allowed to exist in dead code), but it sounds bad, so we go out of our
    // way to avoid that altogether.
    //
    // This is the error returned by the `do_fork`/`do_exec` variants compiled
    // for those targets.
    #[cfg(any(target_os = "tvos", target_os = "watchos"))]
    const ERR_APPLE_TV_WATCH_NO_FORK_EXEC: Error = io::const_io_error!(
        ErrorKind::Unsupported,
        "`fork`+`exec`-based process spawning is not supported on this target",
    );

    // `fork` must not be used on tvOS/watchOS, so this variant never forks and
    // always reports the shared "unsupported" error.
    #[cfg(any(target_os = "tvos", target_os = "watchos"))]
    unsafe fn do_fork(&mut self) -> Result<pid_t, io::Error> {
        Err(Self::ERR_APPLE_TV_WATCH_NO_FORK_EXEC)
    }

    // Attempts to fork the process. If successful, returns Ok(0)
    // in the child, and Ok(child_pid) in the parent. The raw return value of
    // `fork` is passed through `cvt`, which produces the `Err` on failure.
    #[cfg(not(any(
        target_os = "watchos",
        target_os = "tvos",
        all(target_os = "nto", target_env = "nto71"),
    )))]
    unsafe fn do_fork(&mut self) -> Result<pid_t, io::Error> {
        cvt(libc::fork())
    }

    // QNX Neutrino variant of `do_fork`.
    //
    // On QNX Neutrino, fork can fail with EBADF in case "another thread might have opened
    // or closed a file descriptor while the fork() was occurring".
    // Documentation says "... or try calling fork() again", so the call is retried
    // with a doubling delay until the delay reaches MAX_FORKSPAWN_SLEEP.
    // See also https://www.qnx.com/developers/docs/7.1/#com.qnx.doc.neutrino.lib_ref/topic/f/fork.html
    #[cfg(all(target_os = "nto", target_env = "nto71"))]
    unsafe fn do_fork(&mut self) -> Result<pid_t, io::Error> {
        use crate::sys::os::errno;

        let mut backoff = MIN_FORKSPAWN_SLEEP;

        loop {
            let forked = libc::fork();
            let transient_ebadf =
                forked == -1 as libc::pid_t && errno() as libc::c_int == libc::EBADF;

            // Success, or a failure other than EBADF: report it as-is.
            if !transient_ebadf {
                return cvt(forked);
            }

            if backoff < get_clock_resolution() {
                // A sleep this short would be rounded up to the clock
                // resolution, so just give up the time slice instead.
                thread::yield_now();
            } else if backoff < MAX_FORKSPAWN_SLEEP {
                thread::sleep(backoff);
            } else {
                return Err(io::const_io_error!(
                    ErrorKind::WouldBlock,
                    "forking returned EBADF too often",
                ));
            }
            backoff *= 2;
        }
    }

    /// Replaces the current process image with this command (no fork).
    ///
    /// This only ever returns on failure, and the returned value is the
    /// error: `InvalidInput` for a nul byte in the provided data, the error
    /// from setting up stdio, or the error reported by `do_exec`.
    pub fn exec(&mut self, default: Stdio) -> io::Error {
        let envp = self.capture_env();

        if self.saw_nul() {
            return io::const_io_error!(ErrorKind::InvalidInput, "nul byte found in provided data",);
        }

        match self.setup_io(default, true) {
            Err(setup_err) => setup_err,
            Ok((_, theirs)) => {
                // Just like on the fork path, access to the environment has
                // to be synchronized, so the read lock is taken before the
                // exec attempt and held until it has failed.
                let _env_guard = sys::os::env_read_lock();

                // `do_exec` can only come back with an error.
                let Err(exec_err) = unsafe { self.do_exec(theirs, envp.as_ref()) };
                exec_err
            }
        }
    }

    // Applies the configured stdio, credentials, working directory, process
    // group and signal dispositions, runs the user's pre-exec closures, and
    // finally calls `execvp`. It only returns if one of those steps fails,
    // and then the return value is the error.
    //
    // And at this point we've reached a special time in the life of the
    // child. The child must now be considered hamstrung and unable to
    // do anything other than syscalls really. Consider the following
    // scenario:
    //
    //      1. Thread A of process 1 grabs the malloc() mutex
    //      2. Thread B of process 1 forks(), creating thread C
    //      3. Thread C of process 2 then attempts to malloc()
    //      4. The memory of process 2 is the same as the memory of
    //         process 1, so the mutex is locked.
    //
    // This situation looks a lot like deadlock, right? It turns out
    // that this is what pthread_atfork() takes care of, which is
    // presumably implemented across platforms. The first thing that
    // threads do *before* forking is to do things like grab the malloc
    // mutex, and then after the fork they unlock it.
    //
    // Despite this information, libnative's spawn has been witnessed to
    // deadlock on both macOS and FreeBSD. I'm not entirely sure why, but
    // all collected backtraces point at malloc/free traffic in the
    // child spawned process.
    //
    // For this reason, the block of code below should contain 0
    // invocations of either malloc or free (or their related friends).
    //
    // As an example of not having malloc/free traffic, we don't close
    // this file descriptor by dropping the FileDesc (which contains an
    // allocation). Instead we just close it manually. This will never
    // have the drop glue anyway because this code never returns (the
    // child will either exec() or invoke libc::exit)
    #[cfg(not(any(target_os = "tvos", target_os = "watchos")))]
    unsafe fn do_exec(
        &mut self,
        stdio: ChildPipes,
        maybe_envp: Option<&CStringArray>,
    ) -> Result<!, io::Error> {
        use crate::sys::{self, cvt_r};

        // Install the requested descriptors as stdin/stdout/stderr.
        if let Some(fd) = stdio.stdin.fd() {
            cvt_r(|| libc::dup2(fd, libc::STDIN_FILENO))?;
        }
        if let Some(fd) = stdio.stdout.fd() {
            cvt_r(|| libc::dup2(fd, libc::STDOUT_FILENO))?;
        }
        if let Some(fd) = stdio.stderr.fd() {
            cvt_r(|| libc::dup2(fd, libc::STDERR_FILENO))?;
        }

        // Credentials are changed in the order groups, gid, uid.
        #[cfg(not(target_os = "l4re"))]
        {
            if let Some(_g) = self.get_groups() {
                //FIXME: Redox kernel does not support setgroups yet
                #[cfg(not(target_os = "redox"))]
                cvt(libc::setgroups(_g.len().try_into().unwrap(), _g.as_ptr()))?;
            }
            if let Some(u) = self.get_gid() {
                cvt(libc::setgid(u as gid_t))?;
            }
            if let Some(u) = self.get_uid() {
                // When dropping privileges from root, the `setgroups` call
                // will remove any extraneous groups. We only drop groups
                // if we have CAP_SETGID and we weren't given an explicit
                // set of groups. If we don't call this, then even though our
                // uid has dropped, we may still have groups that enable us to
                // do super-user things.
                //FIXME: Redox kernel does not support setgroups yet
                #[cfg(not(target_os = "redox"))]
                if self.get_groups().is_none() {
                    let res = cvt(libc::setgroups(0, crate::ptr::null()));
                    if let Err(e) = res {
                        // Here we ignore the case of not having CAP_SETGID.
                        // An alternative would be to require CAP_SETGID (in
                        // addition to CAP_SETUID) for setting the UID.
                        if e.raw_os_error() != Some(libc::EPERM) {
                            return Err(e.into());
                        }
                    }
                }
                cvt(libc::setuid(u as uid_t))?;
            }
        }
        if let Some(ref cwd) = *self.get_cwd() {
            cvt(libc::chdir(cwd.as_ptr()))?;
        }

        if let Some(pgroup) = self.get_pgroup() {
            cvt(libc::setpgid(0, pgroup))?;
        }

        // emscripten has no signal support.
        #[cfg(not(target_os = "emscripten"))]
        {
            // Inherit the signal mask from the parent rather than resetting it (i.e. do not call
            // pthread_sigmask).

            // If -Zon-broken-pipe is used, don't reset SIGPIPE to SIG_DFL.
            // If -Zon-broken-pipe is not used, reset SIGPIPE to SIG_DFL for backward compatibility.
            //
            // -Zon-broken-pipe is an opportunity to change the default here.
            if !crate::sys::pal::on_broken_pipe_flag_used() {
                #[cfg(target_os = "android")] // see issue #88585
                {
                    let mut action: libc::sigaction = mem::zeroed();
                    action.sa_sigaction = libc::SIG_DFL;
                    cvt(libc::sigaction(libc::SIGPIPE, &action, crate::ptr::null_mut()))?;
                }
                #[cfg(not(target_os = "android"))]
                {
                    let ret = sys::signal(libc::SIGPIPE, libc::SIG_DFL);
                    if ret == libc::SIG_ERR {
                        return Err(io::Error::last_os_error());
                    }
                }
                #[cfg(target_os = "hurd")]
                {
                    let ret = sys::signal(libc::SIGLOST, libc::SIG_DFL);
                    if ret == libc::SIG_ERR {
                        return Err(io::Error::last_os_error());
                    }
                }
            }
        }

        // Run the user-supplied pre-exec closures; the first error aborts the exec.
        for callback in self.get_closures().iter_mut() {
            callback()?;
        }

        // Although we're performing an exec here we may also return with an
        // error from this function (without actually exec'ing) in which case we
        // want to be sure to restore the global environment back to what it
        // once was, ensuring that our temporary override, when free'd, doesn't
        // corrupt our process's environment.
        let mut _reset = None;
        if let Some(envp) = maybe_envp {
            // Guard that puts the saved `environ` pointer back when dropped.
            struct Reset(*const *const libc::c_char);

            impl Drop for Reset {
                fn drop(&mut self) {
                    unsafe {
                        *sys::os::environ() = self.0;
                    }
                }
            }

            _reset = Some(Reset(*sys::os::environ()));
            *sys::os::environ() = envp.as_ptr();
        }

        // Reaching the line after `execvp` means the exec itself failed.
        libc::execvp(self.get_program_cstr().as_ptr(), self.get_argv().as_ptr());
        Err(io::Error::last_os_error())
    }

    // `exec*` must not be used on tvOS/watchOS, so this variant ignores its
    // arguments and always reports the shared "unsupported" error.
    #[cfg(any(target_os = "tvos", target_os = "watchos"))]
    unsafe fn do_exec(
        &mut self,
        _stdio: ChildPipes,
        _maybe_envp: Option<&CStringArray>,
    ) -> Result<!, io::Error> {
        Err(Self::ERR_APPLE_TV_WATCH_NO_FORK_EXEC)
    }

    // Fallback for targets that are not in the list below: `posix_spawn` is
    // never attempted there. Returning `Ok(None)` makes `spawn` continue with
    // its fork + exec path.
    #[cfg(not(any(
        target_os = "freebsd",
        all(target_os = "linux", target_env = "gnu"),
        all(target_os = "linux", target_env = "musl"),
        target_os = "nto",
        target_vendor = "apple",
    )))]
    fn posix_spawn(
        &mut self,
        _: &ChildPipes,
        _: Option<&CStringArray>,
    ) -> io::Result<Option<Process>> {
        Ok(None)
    }

    // Attempts to create the child with `posix_spawnp` instead of fork + exec.
    //
    // Returns `Ok(Some(process))` when the child was spawned, `Ok(None)` when
    // the command uses something this path does not handle (the caller then
    // falls back to fork + exec), and `Err` when setting up or performing the
    // spawn fails.
    //
    // Only support platforms for which posix_spawn() can return ENOENT
    // directly.
    #[cfg(any(
        target_os = "freebsd",
        all(target_os = "linux", target_env = "gnu"),
        all(target_os = "linux", target_env = "musl"),
        target_os = "nto",
        target_vendor = "apple",
    ))]
    fn posix_spawn(
        &mut self,
        stdio: &ChildPipes,
        envp: Option<&CStringArray>,
    ) -> io::Result<Option<Process>> {
        use crate::mem::MaybeUninit;
        use crate::sys::weak::weak;
        use crate::sys::{self, cvt_nz, on_broken_pipe_flag_used};

        // Settings that are not handled below: explicit uid/gid/groups, a
        // custom PATH with a non-path program, pre-exec closures, and pidfd
        // creation. Any of them sends the caller to the fork + exec path.
        if self.get_gid().is_some()
            || self.get_uid().is_some()
            || (self.env_saw_path() && !self.program_is_path())
            || !self.get_closures().is_empty()
            || self.get_groups().is_some()
            || self.get_create_pidfd()
        {
            return Ok(None);
        }

        // Only glibc 2.24+ posix_spawn() supports returning ENOENT directly.
        #[cfg(all(target_os = "linux", target_env = "gnu"))]
        {
            if let Some(version) = sys::os::glibc_version() {
                if version < (2, 24) {
                    return Ok(None);
                }
            } else {
                return Ok(None);
            }
        }

        // On QNX Neutrino, posix_spawnp can fail with EBADF in case "another thread might have opened
        // or closed a file descriptor while the posix_spawn() was occurring".
        // Documentation says "... or try calling posix_spawn() again". This is what we do here.
        // See also http://www.qnx.com/developers/docs/7.1/#com.qnx.doc.neutrino.lib_ref/topic/p/posix_spawn.html
        //
        // NOTE(review): this helper is only compiled for `target_env = "nto71"`,
        // while its use further down is gated on `target_os = "nto"` alone.
        #[cfg(all(target_os = "nto", target_env = "nto71"))]
        unsafe fn retrying_libc_posix_spawnp(
            pid: *mut pid_t,
            file: *const c_char,
            file_actions: *const posix_spawn_file_actions_t,
            attrp: *const posix_spawnattr_t,
            argv: *const *mut c_char,
            envp: *const *mut c_char,
        ) -> io::Result<i32> {
            // Same backoff scheme as the QNX `do_fork`: yield or sleep, then
            // double the delay, and give up once it reaches the maximum.
            let mut delay = MIN_FORKSPAWN_SLEEP;
            loop {
                match libc::posix_spawnp(pid, file, file_actions, attrp, argv, envp) {
                    libc::EBADF => {
                        if delay < get_clock_resolution() {
                            // We cannot sleep this short (it would be longer).
                            // Yield instead.
                            thread::yield_now();
                        } else if delay < MAX_FORKSPAWN_SLEEP {
                            thread::sleep(delay);
                        } else {
                            return Err(io::const_io_error!(
                                ErrorKind::WouldBlock,
                                "posix_spawnp returned EBADF too often",
                            ));
                        }
                        delay *= 2;
                        continue;
                    }
                    // Any other result (including success) is handed back
                    // unchanged for the caller to interpret.
                    r => {
                        return Ok(r);
                    }
                }
            }
        }

        // Solaris, glibc 2.29+, and musl 1.24+ can set a new working directory,
        // and maybe others will gain this non-POSIX function too. We'll check
        // for this weak symbol as soon as it's needed, so we can return early
        // otherwise to do a manual chdir before exec.
        weak! {
            fn posix_spawn_file_actions_addchdir_np(
                *mut libc::posix_spawn_file_actions_t,
                *const libc::c_char
            ) -> libc::c_int
        }
        // `Some((f, cwd))` when a working directory was requested and the
        // addchdir function is available; `None` when no cwd was requested.
        let addchdir = match self.get_cwd() {
            Some(cwd) => {
                if cfg!(target_vendor = "apple") {
                    // There is a bug in macOS where a relative executable
                    // path like "../myprogram" will cause `posix_spawn` to
                    // successfully launch the program, but erroneously return
                    // ENOENT when used with posix_spawn_file_actions_addchdir_np
                    // which was introduced in macOS 10.15.
                    if self.get_program_kind() == ProgramKind::Relative {
                        return Ok(None);
                    }
                }
                match posix_spawn_file_actions_addchdir_np.get() {
                    Some(f) => Some((f, cwd)),
                    None => return Ok(None),
                }
            }
            None => None,
        };

        let pgroup = self.get_pgroup();

        // The pid is a placeholder here; `posix_spawnp` writes the real one
        // through `&mut p.pid` below.
        // Safety: -1 indicates we don't have a pidfd.
        let mut p = unsafe { Process::new(0, -1) };

        // Guard that destroys the initialized file-actions object on drop.
        struct PosixSpawnFileActions<'a>(&'a mut MaybeUninit<libc::posix_spawn_file_actions_t>);

        impl Drop for PosixSpawnFileActions<'_> {
            fn drop(&mut self) {
                unsafe {
                    libc::posix_spawn_file_actions_destroy(self.0.as_mut_ptr());
                }
            }
        }

        // Guard that destroys the initialized spawn-attributes object on drop.
        struct PosixSpawnattr<'a>(&'a mut MaybeUninit<libc::posix_spawnattr_t>);

        impl Drop for PosixSpawnattr<'_> {
            fn drop(&mut self) {
                unsafe {
                    libc::posix_spawnattr_destroy(self.0.as_mut_ptr());
                }
            }
        }

        unsafe {
            // Each object is wrapped in its guard only after a successful
            // init, so a failed init is not followed by a destroy.
            let mut attrs = MaybeUninit::uninit();
            cvt_nz(libc::posix_spawnattr_init(attrs.as_mut_ptr()))?;
            let attrs = PosixSpawnattr(&mut attrs);

            let mut flags = 0;

            let mut file_actions = MaybeUninit::uninit();
            cvt_nz(libc::posix_spawn_file_actions_init(file_actions.as_mut_ptr()))?;
            let file_actions = PosixSpawnFileActions(&mut file_actions);

            // Install the requested descriptors as stdin/stdout/stderr in the child.
            if let Some(fd) = stdio.stdin.fd() {
                cvt_nz(libc::posix_spawn_file_actions_adddup2(
                    file_actions.0.as_mut_ptr(),
                    fd,
                    libc::STDIN_FILENO,
                ))?;
            }
            if let Some(fd) = stdio.stdout.fd() {
                cvt_nz(libc::posix_spawn_file_actions_adddup2(
                    file_actions.0.as_mut_ptr(),
                    fd,
                    libc::STDOUT_FILENO,
                ))?;
            }
            if let Some(fd) = stdio.stderr.fd() {
                cvt_nz(libc::posix_spawn_file_actions_adddup2(
                    file_actions.0.as_mut_ptr(),
                    fd,
                    libc::STDERR_FILENO,
                ))?;
            }
            if let Some((f, cwd)) = addchdir {
                cvt_nz(f(file_actions.0.as_mut_ptr(), cwd.as_ptr()))?;
            }

            if let Some(pgroup) = pgroup {
                flags |= libc::POSIX_SPAWN_SETPGROUP;
                cvt_nz(libc::posix_spawnattr_setpgroup(attrs.0.as_mut_ptr(), pgroup))?;
            }

            // Inherit the signal mask from this process rather than resetting it (i.e. do not call
            // posix_spawnattr_setsigmask).

            // If -Zon-broken-pipe is used, don't reset SIGPIPE to SIG_DFL.
            // If -Zon-broken-pipe is not used, reset SIGPIPE to SIG_DFL for backward compatibility.
            //
            // -Zon-broken-pipe is an opportunity to change the default here.
            if !on_broken_pipe_flag_used() {
                let mut default_set = MaybeUninit::<libc::sigset_t>::uninit();
                cvt(sigemptyset(default_set.as_mut_ptr()))?;
                cvt(sigaddset(default_set.as_mut_ptr(), libc::SIGPIPE))?;
                #[cfg(target_os = "hurd")]
                {
                    cvt(sigaddset(default_set.as_mut_ptr(), libc::SIGLOST))?;
                }
                cvt_nz(libc::posix_spawnattr_setsigdefault(
                    attrs.0.as_mut_ptr(),
                    default_set.as_ptr(),
                ))?;
                flags |= libc::POSIX_SPAWN_SETSIGDEF;
            }

            cvt_nz(libc::posix_spawnattr_setflags(attrs.0.as_mut_ptr(), flags as _))?;

            // Make sure we synchronize access to the global `environ` resource
            let _env_lock = sys::os::env_read_lock();
            // Use the captured environment if there is one, otherwise the
            // current global `environ`.
            let envp = envp.map(|c| c.as_ptr()).unwrap_or_else(|| *sys::os::environ() as *const _);

            #[cfg(not(target_os = "nto"))]
            let spawn_fn = libc::posix_spawnp;
            #[cfg(target_os = "nto")]
            let spawn_fn = retrying_libc_posix_spawnp;

            let spawn_res = spawn_fn(
                &mut p.pid,
                self.get_program_cstr().as_ptr(),
                file_actions.0.as_ptr(),
                attrs.0.as_ptr(),
                self.get_argv().as_ptr() as *const _,
                envp as *const _,
            );

            // The retrying wrapper returns `io::Result<i32>`; unwrap it to
            // the raw return code first.
            #[cfg(target_os = "nto")]
            let spawn_res = spawn_res?;

            cvt_nz(spawn_res)?;
            Ok(Some(p))
        }
    }

    // Child-side half of the pidfd handshake (called from `spawn` after the
    // fork): opens a pidfd for the current process and sends it to the parent
    // over `sock` as an `SCM_RIGHTS` control message attached to a 0-length
    // message. If the pidfd could not be opened, the 0-length message is still
    // sent, without any control data. Aborts via `rtabort!` if the message
    // cannot be sent.
    #[cfg(target_os = "linux")]
    fn send_pidfd(&self, sock: &crate::sys::net::Socket) {
        use crate::io::IoSlice;
        use crate::os::fd::RawFd;
        use crate::sys::cvt_r;
        use libc::{CMSG_DATA, CMSG_FIRSTHDR, CMSG_LEN, CMSG_SPACE, SCM_RIGHTS, SOL_SOCKET};

        unsafe {
            let child_pid = libc::getpid();
            // pidfd_open sets CLOEXEC by default
            let pidfd = libc::syscall(libc::SYS_pidfd_open, child_pid, 0);

            let fds: [c_int; 1] = [pidfd as RawFd];

            // Size of the control message payload: a single file descriptor.
            const SCM_MSG_LEN: usize = mem::size_of::<[c_int; 1]>();

            // Control message buffer; the `cmsghdr` member is never read and
            // only serves to give the byte buffer the header's alignment.
            #[repr(C)]
            union Cmsg {
                buf: [u8; unsafe { CMSG_SPACE(SCM_MSG_LEN as u32) as usize }],
                _align: libc::cmsghdr,
            }

            let mut cmsg: Cmsg = mem::zeroed();

            // 0-length message to send through the socket so we can pass along the fd
            let mut iov = [IoSlice::new(b"")];
            let mut msg: libc::msghdr = mem::zeroed();

            msg.msg_iov = core::ptr::addr_of_mut!(iov) as *mut _;
            msg.msg_iovlen = 1;

            // only attach cmsg if we successfully acquired the pidfd
            if pidfd >= 0 {
                msg.msg_controllen = mem::size_of_val(&cmsg.buf) as _;
                msg.msg_control = core::ptr::addr_of_mut!(cmsg.buf) as *mut _;

                let hdr = CMSG_FIRSTHDR(core::ptr::addr_of_mut!(msg) as *mut _);
                (*hdr).cmsg_level = SOL_SOCKET;
                (*hdr).cmsg_type = SCM_RIGHTS;
                (*hdr).cmsg_len = CMSG_LEN(SCM_MSG_LEN as _) as _;
                let data = CMSG_DATA(hdr);
                // Byte-wise copy of the fd into the control message payload.
                crate::ptr::copy_nonoverlapping(
                    fds.as_ptr().cast::<u8>(),
                    data as *mut _,
                    SCM_MSG_LEN,
                );
            }

            // we send the 0-length message even if we failed to acquire the pidfd
            // so we get a consistent SEQPACKET order
            match cvt_r(|| libc::sendmsg(sock.as_raw(), &msg, 0)) {
                // The payload is empty, so a successful send reports 0 bytes.
                Ok(0) => {}
                other => rtabort!("failed to communicate with parent process. {:?}", other),
            }
        }
    }

    // Parent-side half of the pidfd handshake: receives one message from
    // `sock` and extracts the file descriptor carried in its `SCM_RIGHTS`
    // control message.
    //
    // Returns the received descriptor, or -1 if receiving failed or the
    // message did not carry exactly one well-formed `SCM_RIGHTS` entry.
    #[cfg(target_os = "linux")]
    fn recv_pidfd(&self, sock: &crate::sys::net::Socket) -> pid_t {
        use crate::io::IoSliceMut;
        use crate::sys::cvt_r;

        use libc::{CMSG_DATA, CMSG_FIRSTHDR, CMSG_LEN, CMSG_SPACE, SCM_RIGHTS, SOL_SOCKET};

        unsafe {
            // Size of the expected control message payload: a single fd.
            const SCM_MSG_LEN: usize = mem::size_of::<[c_int; 1]>();

            // Control message buffer; the `cmsghdr` member is never read and
            // only serves to give the byte buffer the header's alignment.
            #[repr(C)]
            union Cmsg {
                _buf: [u8; unsafe { CMSG_SPACE(SCM_MSG_LEN as u32) as usize }],
                _align: libc::cmsghdr,
            }
            let mut control: Cmsg = mem::zeroed();

            // The data part of the message is empty; only the control part matters.
            let mut iov = [IoSliceMut::new(&mut [])];

            let mut header: libc::msghdr = mem::zeroed();
            header.msg_iov = core::ptr::addr_of_mut!(iov) as *mut _;
            header.msg_iovlen = 1;
            header.msg_controllen = mem::size_of::<Cmsg>() as _;
            header.msg_control = core::ptr::addr_of_mut!(control) as *mut _;

            let received =
                cvt_r(|| libc::recvmsg(sock.as_raw(), &mut header, libc::MSG_CMSG_CLOEXEC));
            if received.is_err() {
                return -1;
            }

            let cmsg_hdr = CMSG_FIRSTHDR(core::ptr::addr_of_mut!(header) as *mut _);
            let carries_one_fd = !cmsg_hdr.is_null()
                && (*cmsg_hdr).cmsg_level == SOL_SOCKET
                && (*cmsg_hdr).cmsg_type == SCM_RIGHTS
                && (*cmsg_hdr).cmsg_len == CMSG_LEN(SCM_MSG_LEN as _) as _;
            if !carries_one_fd {
                return -1;
            }

            // Byte-wise copy of the payload into a properly typed fd slot.
            let mut fd_slot = [-1 as c_int];
            crate::ptr::copy_nonoverlapping(
                CMSG_DATA(cmsg_hdr) as *const _,
                fd_slot.as_mut_ptr().cast::<u8>(),
                SCM_MSG_LEN,
            );

            fd_slot[0]
        }
    }
}

////////////////////////////////////////////////////////////////////////////////
// Processes
////////////////////////////////////////////////////////////////////////////////

/// Handle to a child process: its pid, its exit status once known, and
/// (on Linux) an optional pidfd.
pub struct Process {
    /// The unique ID of the process (this should never be negative).
    pid: pid_t,
    /// Exit status cached by `wait`; `None` until the process has been
    /// successfully waited on.
    status: Option<ExitStatus>,
    // On Linux, stores the pidfd created for this child.
    // This is None if the user did not request pidfd creation,
    // or if the pidfd could not be created for some reason
    // (e.g. the `pidfd_open` syscall was not available).
    #[cfg(target_os = "linux")]
    pidfd: Option<PidFd>,
}

impl Process {
    #[cfg(target_os = "linux")]
    unsafe fn new(pid: pid_t, pidfd: pid_t) -> Self {
        use crate::os::unix::io::FromRawFd;
        use crate::sys_common::FromInner;
        // Safety: If `pidfd` is nonnegative, we assume it's valid and otherwise unowned.
        let pidfd = (pidfd >= 0).then(|| PidFd::from_inner(sys::fd::FileDesc::from_raw_fd(pidfd)));
        Process { pid, status: None, pidfd }
    }

    #[cfg(not(target_os = "linux"))]
    unsafe fn new(pid: pid_t, _pidfd: pid_t) -> Self {
        Process { pid, status: None }
    }

    pub fn id(&self) -> u32 {
        self.pid as u32
    }

    pub fn kill(&mut self) -> io::Result<()> {
        // If we've already waited on this process then the pid can be recycled
        // and used for another process, and we probably shouldn't be killing
        // random processes, so return Ok because the process has exited already.
        if self.status.is_some() {
            return Ok(());
        }
        #[cfg(target_os = "linux")]
        if let Some(pid_fd) = self.pidfd.as_ref() {
            // pidfd_send_signal predates pidfd_open. so if we were able to get an fd then sending signals will work too
            return pid_fd.kill();
        }
        cvt(unsafe { libc::kill(self.pid, libc::SIGKILL) }).map(drop)
    }

    pub fn wait(&mut self) -> io::Result<ExitStatus> {
        use crate::sys::cvt_r;
        if let Some(status) = self.status {
            return Ok(status);
        }
        #[cfg(target_os = "linux")]
        if let Some(pid_fd) = self.pidfd.as_ref() {
            let status = pid_fd.wait()?;
            self.status = Some(status);
            return Ok(status);
        }
        let mut status = 0 as c_int;
        cvt_r(|| unsafe { libc::waitpid(self.pid, &mut status, 0) })?;
        self.status = Some(ExitStatus::new(status));
        Ok(ExitStatus::new(status))
    }

    pub fn try_wait(&mut self) -> io::Result<Option<ExitStatus>> {
        if let Some(status) = self.status {
            return Ok(Some(status));
        }
        #[cfg(target_os = "linux")]
        if let Some(pid_fd) = self.pidfd.as_ref() {
            let status = pid_fd.try_wait()?;
            if let Some(status) = status {
                self.status = Some(status)
            }
            return Ok(status);
        }
        let mut status = 0 as c_int;
        let pid = cvt(unsafe { libc::waitpid(self.pid, &mut status, libc::WNOHANG) })?;
        if pid == 0 {
            Ok(None)
        } else {
            self.status = Some(ExitStatus::new(status));
            Ok(Some(ExitStatus::new(status)))
        }
    }
}

/// Unix exit statuses
///
/// Newtype around the raw `c_int` status word; the derived `Default` is a
/// status of `0`.
//
// This is not actually an "exit status" in Unix terminology.  Rather, it is a "wait status".
// See the discussion in comments and doc comments for `std::process::ExitStatus`.
#[derive(PartialEq, Eq, Clone, Copy, Default)]
pub struct ExitStatus(c_int);

impl fmt::Debug for ExitStatus {
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        f.debug_tuple("unix_wait_status").field(&self.0).finish()
    }
}

impl ExitStatus {
    pub fn new(status: c_int) -> ExitStatus {
        ExitStatus(status)
    }

    #[cfg(target_os = "linux")]
    pub fn from_waitid_siginfo(siginfo: libc::siginfo_t) -> ExitStatus {
        let status = unsafe { siginfo.si_status() };

        match siginfo.si_code {
            libc::CLD_EXITED => ExitStatus((status & 0xff) << 8),
            libc::CLD_KILLED => ExitStatus(status),
            libc::CLD_DUMPED => ExitStatus(status | 0x80),
            libc::CLD_CONTINUED => ExitStatus(0xffff),
            libc::CLD_STOPPED | libc::CLD_TRAPPED => ExitStatus(((status & 0xff) << 8) | 0x7f),
            _ => unreachable!("waitid() should only return the above codes"),
        }
    }

    fn exited(&self) -> bool {
        libc::WIFEXITED(self.0)
    }

    pub fn exit_ok(&self) -> Result<(), ExitStatusError> {
        // This assumes that WIFEXITED(status) && WEXITSTATUS==0 corresponds to status==0. This is
        // true on all actual versions of Unix, is widely assumed, and is specified in SuS
        // https://pubs.opengroup.org/onlinepubs/9699919799/functions/wait.html. If it is not
        // true for a platform pretending to be Unix, the tests (our doctests, and also
        // process_unix/tests.rs) will spot it. `ExitStatusError::code` assumes this too.
        match NonZero::try_from(self.0) {
            /* was nonzero */ Ok(failure) => Err(ExitStatusError(failure)),
            /* was zero, couldn't convert */ Err(_) => Ok(()),
        }
    }

    pub fn code(&self) -> Option<i32> {
        self.exited().then(|| libc::WEXITSTATUS(self.0))
    }

    pub fn signal(&self) -> Option<i32> {
        libc::WIFSIGNALED(self.0).then(|| libc::WTERMSIG(self.0))
    }

    pub fn core_dumped(&self) -> bool {
        libc::WIFSIGNALED(self.0) && libc::WCOREDUMP(self.0)
    }

    pub fn stopped_signal(&self) -> Option<i32> {
        libc::WIFSTOPPED(self.0).then(|| libc::WSTOPSIG(self.0))
    }

    pub fn continued(&self) -> bool {
        libc::WIFCONTINUED(self.0)
    }

    pub fn into_raw(&self) -> c_int {
        self.0
    }
}

/// Converts a raw `c_int` to a type-safe `ExitStatus` by wrapping it without copying.
impl From<c_int> for ExitStatus {
    fn from(a: c_int) -> ExitStatus {
        ExitStatus(a)
    }
}

/// Convert a signal number to a readable, searchable name.
///
/// This string should be displayed right after the signal number.
/// If a signal is unrecognized, it returns the empty string, so that
/// you just get the number like "0". If it is recognized, you'll get
/// something like "9 (SIGKILL)".
///
/// Every non-empty result already carries its own leading space and
/// parentheses, so callers can append it to the number verbatim.
fn signal_string(signal: i32) -> &'static str {
    // Which arms exist depends on the target: each `#[cfg]` below removes the
    // arm that follows it on targets where the condition does not hold.
    match signal {
        libc::SIGHUP => " (SIGHUP)",
        libc::SIGINT => " (SIGINT)",
        libc::SIGQUIT => " (SIGQUIT)",
        libc::SIGILL => " (SIGILL)",
        libc::SIGTRAP => " (SIGTRAP)",
        libc::SIGABRT => " (SIGABRT)",
        // Arms gated on `not(target_os = "l4re")` are compiled out on L4Re;
        // presumably those constants are unavailable there — TODO confirm.
        #[cfg(not(target_os = "l4re"))]
        libc::SIGBUS => " (SIGBUS)",
        libc::SIGFPE => " (SIGFPE)",
        libc::SIGKILL => " (SIGKILL)",
        #[cfg(not(target_os = "l4re"))]
        libc::SIGUSR1 => " (SIGUSR1)",
        libc::SIGSEGV => " (SIGSEGV)",
        #[cfg(not(target_os = "l4re"))]
        libc::SIGUSR2 => " (SIGUSR2)",
        libc::SIGPIPE => " (SIGPIPE)",
        libc::SIGALRM => " (SIGALRM)",
        libc::SIGTERM => " (SIGTERM)",
        #[cfg(not(target_os = "l4re"))]
        libc::SIGCHLD => " (SIGCHLD)",
        #[cfg(not(target_os = "l4re"))]
        libc::SIGCONT => " (SIGCONT)",
        #[cfg(not(target_os = "l4re"))]
        libc::SIGSTOP => " (SIGSTOP)",
        #[cfg(not(target_os = "l4re"))]
        libc::SIGTSTP => " (SIGTSTP)",
        #[cfg(not(target_os = "l4re"))]
        libc::SIGTTIN => " (SIGTTIN)",
        #[cfg(not(target_os = "l4re"))]
        libc::SIGTTOU => " (SIGTTOU)",
        #[cfg(not(target_os = "l4re"))]
        libc::SIGURG => " (SIGURG)",
        #[cfg(not(target_os = "l4re"))]
        libc::SIGXCPU => " (SIGXCPU)",
        #[cfg(not(target_os = "l4re"))]
        libc::SIGXFSZ => " (SIGXFSZ)",
        #[cfg(not(target_os = "l4re"))]
        libc::SIGVTALRM => " (SIGVTALRM)",
        #[cfg(not(target_os = "l4re"))]
        libc::SIGPROF => " (SIGPROF)",
        #[cfg(not(target_os = "l4re"))]
        libc::SIGWINCH => " (SIGWINCH)",
        // Haiku gets a `SIGPOLL` arm where the other targets get `SIGIO`.
        #[cfg(not(any(target_os = "haiku", target_os = "l4re")))]
        libc::SIGIO => " (SIGIO)",
        #[cfg(target_os = "haiku")]
        libc::SIGPOLL => " (SIGPOLL)",
        #[cfg(not(target_os = "l4re"))]
        libc::SIGSYS => " (SIGSYS)",
        // For information on Linux signals, run `man 7 signal`
        #[cfg(all(
            target_os = "linux",
            any(
                target_arch = "x86_64",
                target_arch = "x86",
                target_arch = "arm",
                target_arch = "aarch64"
            )
        ))]
        libc::SIGSTKFLT => " (SIGSTKFLT)",
        #[cfg(any(target_os = "linux", target_os = "nto"))]
        libc::SIGPWR => " (SIGPWR)",
        #[cfg(any(
            target_os = "freebsd",
            target_os = "netbsd",
            target_os = "openbsd",
            target_os = "dragonfly",
            target_os = "nto",
            target_vendor = "apple",
        ))]
        libc::SIGEMT => " (SIGEMT)",
        #[cfg(any(
            target_os = "freebsd",
            target_os = "netbsd",
            target_os = "openbsd",
            target_os = "dragonfly",
            target_vendor = "apple",
        ))]
        libc::SIGINFO => " (SIGINFO)",
        #[cfg(target_os = "hurd")]
        libc::SIGLOST => " (SIGLOST)",
        #[cfg(target_os = "freebsd")]
        libc::SIGTHR => " (SIGTHR)",
        #[cfg(target_os = "freebsd")]
        libc::SIGLIBRT => " (SIGLIBRT)",
        // Unrecognized signal: no suffix, so only the bare number gets shown.
        _ => "",
    }
}

impl fmt::Display for ExitStatus {
    /// Describes the wait status in human-readable form.
    ///
    /// The interpretations are tried in order: normal exit, termination by a
    /// signal, stop by a signal, continuation; anything else is printed raw.
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        if let Some(code) = self.code() {
            return write!(f, "exit status: {code}");
        }

        if let Some(signal) = self.signal() {
            let signal_string = signal_string(signal);
            return match self.core_dumped() {
                true => write!(f, "signal: {signal}{signal_string} (core dumped)"),
                false => write!(f, "signal: {signal}{signal_string}"),
            };
        }

        if let Some(signal) = self.stopped_signal() {
            let signal_string = signal_string(signal);
            return write!(f, "stopped (not terminated) by signal: {signal}{signal_string}");
        }

        if self.continued() {
            return write!(f, "continued (WIFCONTINUED)");
        }

        // None of the known interpretations applies: show the raw word in
        // decimal and in hex.
        write!(f, "unrecognised wait status: {} {:#x}", self.0, self.0)
    }
}

/// A wait status that is known to be nonzero.
///
/// Produced by `ExitStatus::exit_ok` when the status is not `0`.
#[derive(PartialEq, Eq, Clone, Copy)]
pub struct ExitStatusError(NonZero<c_int>);

impl Into<ExitStatus> for ExitStatusError {
    fn into(self) -> ExitStatus {
        ExitStatus(self.0.into())
    }
}

impl fmt::Debug for ExitStatusError {
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        f.debug_tuple("unix_wait_status").field(&self.0).finish()
    }
}

impl ExitStatusError {
    pub fn code(self) -> Option<NonZero<i32>> {
        ExitStatus(self.0.into()).code().map(|st| st.try_into().unwrap())
    }
}

#[cfg(target_os = "linux")]
mod linux_child_ext {

    use crate::io;
    use crate::mem;
    use crate::os::linux::process as os;
    use crate::sys::pal::unix::linux::pidfd as imp;
    use crate::sys::pal::unix::ErrorKind;
    use crate::sys_common::FromInner;

    /// Error reported by both accessors when the child holds no pidfd.
    fn no_pidfd() -> io::Error {
        io::Error::new(ErrorKind::Uncategorized, "No pidfd was created.")
    }

    #[unstable(feature = "linux_pidfd", issue = "82971")]
    impl crate::os::linux::process::ChildExt for crate::process::Child {
        /// Borrows the child's pidfd, or fails if the child holds none.
        fn pidfd(&self) -> io::Result<&os::PidFd> {
            match self.handle.pidfd.as_ref() {
                // SAFETY: The os type is a transparent wrapper, therefore we can transmute references
                Some(fd) => Ok(unsafe { mem::transmute::<&imp::PidFd, &os::PidFd>(fd) }),
                None => Err(no_pidfd()),
            }
        }

        /// Moves the pidfd out of the child, leaving `None` behind; fails if the
        /// child holds none.
        fn take_pidfd(&mut self) -> io::Result<os::PidFd> {
            match self.handle.pidfd.take() {
                Some(fd) => Ok(<os::PidFd as FromInner<imp::PidFd>>::from_inner(fd)),
                None => Err(no_pidfd()),
            }
        }
    }
}

#[cfg(test)]
#[path = "process_unix/tests.rs"]
mod tests;

// See [`process_unsupported_wait_status::compare_with_linux`];
#[cfg(all(test, target_os = "linux"))]
#[path = "process_unsupported/wait_status.rs"]
mod process_unsupported_wait_status;
-												Fix ExitStatus on Fuchsia

Fuchsia exit codes don't follow the convention of libc::WEXITSTATUS et
al, and they are 64 bits instead of 32 bits. This gives Fuchsia its own
representation of ExitStatus.

Additionally, the zircon syscall structs were out of date, causing us to
see bogus return codes.

											
										
										
											2019-09-24 21:34:44 -07:00
+								use crate::fmt;
-												libstd => 2018

											
										
										
											2019-02-11 04:23:21 +09:00
+								use crate::io::{self, Error, ErrorKind};
-												Do not attempt to unlock envlock in child process after a fork.

This is a breaking change for cases where the environment is
accessed in a Command::pre_exec closure. Except for
single-threaded programs these uses were not correct
anyway since they aren't async-signal safe.

											
										
										
											2021-03-09 21:42:38 +01:00
+								use crate::mem;
-												Use generic `NonZero` internally.

											
										
										
											2024-01-29 23:59:09 +01:00
+								use crate::num::NonZero;
-												libstd => 2018

											
										
										
											2019-02-11 04:23:21 +09:00
+								use crate::sys;
 								use crate::sys::cvt;
 								use crate::sys::process::process_common::*;
-												Add PidFd type and seal traits

Improve docs

Split do_fork into two

Make do_fork unsafe

Add target attribute to create_pidfd field in Command

Add method to get create_pidfd value

											
										
										
											2021-02-06 14:15:49 +01:00
 								#[cfg(target_os = "linux")]
-												Add PidFd::{kill, wait, try_wait}

											
										
										
											2024-04-18 01:51:06 +02:00
+								use crate::sys::pal::unix::linux::pidfd::PidFd;
-												Add Linux-specific pidfd process extensions

Background:

Over the last year, pidfd support was added to the Linux kernel. This
allows interacting with other processes. In particular, this allows
waiting on a child process with a timeout in a race-free way, bypassing
all of the awful signal-handler tricks that are usually required.

Pidfds can be obtained for a child process (as well as any other
process) via the `pidfd_open` syscall. Unfortunately, this requires
several conditions to hold in order to be race-free (i.e. the pid is not
reused).
Per `man pidfd_open`:

```
· the disposition of SIGCHLD has not been explicitly set to SIG_IGN
 (see sigaction(2));

· the SA_NOCLDWAIT flag was not specified while establishing a han‐
 dler for SIGCHLD or while setting the disposition of that signal to
 SIG_DFL (see sigaction(2)); and

· the zombie process was not reaped elsewhere in the program (e.g.,
 either by an asynchronously executed signal handler or by wait(2)
 or similar in another thread).

If any of these conditions does not hold, then the child process
(along with a PID file descriptor that refers to it) should instead
be created using clone(2) with the CLONE_PIDFD flag.
```

Sadly, these conditions are impossible to guarantee once any libraries
are used. For example, C code running in a different thread could call
`wait()`, which is impossible to detect from Rust code trying to open a
pidfd.

While pid reuse issues should (hopefully) be rare in practice, we can do
better. By passing the `CLONE_PIDFD` flag to `clone()` or `clone3()`, we
can obtain a pidfd for the child process in a guaranteed race-free
manner.

This PR:

This PR adds Linux-specific process extension methods to allow obtaining
pidfds for processes spawned via the standard `Command` API. Other than
being made available to user code, the standard library does not make
use of these pidfds in any way. In particular, the implementation of
`Child::wait` is completely unchanged.

Two Linux-specific helper methods are added: `CommandExt::create_pidfd`
and `ChildExt::pidfd`. These methods are intended to serve as a building
block for libraries to build higher-level abstractions - in particular,
waiting on a process with a timeout.

I've included a basic test, which verifies that pidfds are created iff
the `create_pidfd` method is used. This test is somewhat special - it
should always succeed on systems with the `clone3` system call
available, and always fail on systems without `clone3` available. I'm
not sure how to best ensure this programmatically.

This PR relies on the newer `clone3` system call to pass the `CLONE_PIDFD` flag,
rather than the older `clone` system call. `clone3` was added to Linux
in the same release as pidfds, so this shouldn't unnecessarily limit the
kernel versions that this code supports.

Unresolved questions:
* What should the name of the feature gate be for these newly added
  methods?
* Should the `pidfd` method distinguish between an error occurring
  and `create_pidfd` not being called?

											
										
										
											2020-09-15 23:35:08 -04:00
-												Take some of sys/vxworks/process/* from sys/unix instead.

											
										
										
											2020-10-07 20:38:25 +02:00
+								#[cfg(target_os = "vxworks")]
 								use libc::RTP_ID as pid_t;
 								#[cfg(not(target_os = "vxworks"))]
-												drop unused libc imports on L4Re

As a capability-based microkernel OS, L4Re only has incomplete support
for POSIX APIs, in particular it does not implement UIDs and GIDs.

											
										
										
											2021-05-31 15:00:11 +02:00
+								use libc::{c_int, pid_t};
-												Avoid fork/exec spawning on tvOS/watchOS, as those functions are marked as prohibited

											
										
										
											2023-06-04 09:46:18 -07:00
+								#[cfg(not(any(
 								    target_os = "vxworks",
 								    target_os = "l4re",
 								    target_os = "tvos",
 								    target_os = "watchos",
 								)))]
-												drop unused libc imports on L4Re

As a capability-based microkernel OS, L4Re only has incomplete support
for POSIX APIs, in particular it does not implement UIDs and GIDs.

											
										
										
											2021-05-31 15:00:11 +02:00
+								use libc::{gid_t, uid_t};
-												Separated fuchsia-specific process stuff into 'process_fuchsia.rs' and refactored out some now-duplicated code into a 'process_common.rs'

											
										
										
											2016-11-23 13:58:13 -08:00
-												Retry to spawn/fork up to 3 times when it failed because of an interruption

											
										
										
											2023-02-10 15:27:22 +01:00
+								cfg_if::cfg_if! {
 								    if #[cfg(all(target_os = "nto", target_env = "nto71"))] {
 								        use crate::thread;
 								        use libc::{c_char, posix_spawn_file_actions_t, posix_spawnattr_t};
-												Retry to fork/spawn with exponential backoff

											
										
										
											2023-03-18 18:45:51 +01:00
+								        use crate::time::Duration;
-												Only determine clock res once; give up before sleeping more than 1 second

											
										
										
											2023-06-02 17:52:14 +02:00
+								        use crate::sync::LazyLock;
-												Retry to fork/spawn with exponential backoff

											
										
										
											2023-03-18 18:45:51 +01:00
+								        // Get smallest amount of time we can sleep.
 								        // Return a common value if it cannot be determined.
 								        fn get_clock_resolution() -> Duration {
-												Only determine clock res once; give up before sleeping more than 1 second

											
										
										
											2023-06-02 17:52:14 +02:00
+								            static MIN_DELAY: LazyLock<Duration, fn() -> Duration> = LazyLock::new(|| {
 								                let mut mindelay = libc::timespec { tv_sec: 0, tv_nsec: 0 };
 								                if unsafe { libc::clock_getres(libc::CLOCK_MONOTONIC, &mut mindelay) } == 0
 								                {
 								                    Duration::from_nanos(mindelay.tv_nsec as u64)
 								                } else {
 								                    Duration::from_millis(1)
 								                }
 								            });
 								            *MIN_DELAY
-												Retry to fork/spawn with exponential backoff

											
										
										
											2023-03-18 18:45:51 +01:00
+								        }
 								        // Arbitrary minimum sleep duration for retrying fork/spawn
 								        const MIN_FORKSPAWN_SLEEP: Duration = Duration::from_nanos(1);
-												Only determine clock res once; give up before sleeping more than 1 second

											
										
										
											2023-06-02 17:52:14 +02:00
+								        // Maximum duration of sleeping before giving up and returning an error
 								        const MAX_FORKSPAWN_SLEEP: Duration = Duration::from_millis(1000);
-												Retry to spawn/fork up to 3 times when it failed because of an interruption

											
										
										
											2023-02-10 15:27:22 +01:00
+								    }
 								}
-												Separated fuchsia-specific process stuff into 'process_fuchsia.rs' and refactored out some now-duplicated code into a 'process_common.rs'

											
										
										
											2016-11-23 13:58:13 -08:00
+								////////////////////////////////////////////////////////////////////////////////
 								// Command
 								////////////////////////////////////////////////////////////////////////////////
 								impl Command {
 								    pub fn spawn(
 								        &mut self,
 								        default: Stdio,
 								        needs_stdin: bool,
 								    ) -> io::Result<(Process, StdioPipes)> {
-												process_unix: prefer i32::*_be_bytes over manually shifting bytes

											
										
										
											2020-07-12 16:47:15 +00:00
+								        const CLOEXEC_MSG_FOOTER: [u8; 4] = *b"NOEX";
-												Separated fuchsia-specific process stuff into 'process_fuchsia.rs' and refactored out some now-duplicated code into a 'process_common.rs'

											
										
										
											2016-11-23 13:58:13 -08:00
-												Capture environment at spawn

											
										
										
											2017-12-17 15:21:47 +00:00
+								        let envp = self.capture_env();
-												Separated fuchsia-specific process stuff into 'process_fuchsia.rs' and refactored out some now-duplicated code into a 'process_common.rs'

											
										
										
											2016-11-23 13:58:13 -08:00
+								        if self.saw_nul() {
-												Hide Repr details from io::Error, and rework `io::Error::new_const`.

											
										
										
											2021-08-08 01:04:33 -07:00
+								            return Err(io::const_io_error!(
-												Use io::Error::new_const everywhere to avoid allocations.

											
										
										
											2021-03-21 20:22:38 +01:00
+								                ErrorKind::InvalidInput,
-												Hide Repr details from io::Error, and rework `io::Error::new_const`.

											
										
										
											2021-08-08 01:04:33 -07:00
+								                "nul byte found in provided data",
-												Use io::Error::new_const everywhere to avoid allocations.

											
										
										
											2021-03-21 20:22:38 +01:00
+								            ));
-												Separated fuchsia-specific process stuff into 'process_fuchsia.rs' and refactored out some now-duplicated code into a 'process_common.rs'

											
										
										
											2016-11-23 13:58:13 -08:00
+								        }
 								        let (ours, theirs) = self.setup_io(default, needs_stdin)?;
-												Support posix_spawn() when possible.

											
										
										
											2018-01-25 18:13:45 -08:00
 								        if let Some(ret) = self.posix_spawn(&theirs, envp.as_ref())? {
 								            return Ok((ret, ours));
 								        }
-												open pidfd in child process and send to the parent via SOCK_SEQPACKET+CMSG

This is a 100% race-free way to obtain a child's pidfd while
avoiding `clone3`.

											
										
										
											2023-07-22 02:30:13 +02:00
 								        #[cfg(target_os = "linux")]
 								        let (input, output) = sys::net::Socket::new_pair(libc::AF_UNIX, libc::SOCK_SEQPACKET)?;
 								        #[cfg(not(target_os = "linux"))]
-												Separated fuchsia-specific process stuff into 'process_fuchsia.rs' and refactored out some now-duplicated code into a 'process_common.rs'

											
										
										
											2016-11-23 13:58:13 -08:00
+								        let (input, output) = sys::pipe::anon_pipe()?;
-												std: Synchronize access to global env during `exec`

This commit, after reverting #55359, applies a different fix for #46775
while also fixing #55775. The basic idea was to go back to pre-#55359
libstd, and then fix #46775 in a way that doesn't expose #55775.

The issue described in #46775 boils down to two problems:

* First, the global environment is reset during `exec`, but if the
  `exec` call fails then the global environment was a dangling pointer
  into free'd memory as the block of memory was deallocated when
  `Command` is dropped. This is fixed in this commit by installing a
  `Drop` stack object which ensures that the `environ` pointer is
  preserved on a failing `exec`.

* Second, the global environment was accessed in an unsynchronized
  fashion during `exec`. This was fixed by ensuring that the
  Rust-specific environment lock is acquired for these system-level
  operations.

Thanks to Alex Gaynor for pioneering the solution here!

Closes #55775

Co-authored-by: Alex Gaynor <alex.gaynor@gmail.com>

											
										
										
											2018-11-13 14:57:10 -08:00
+								        // Whatever happens after the fork is almost for sure going to touch or
 								        // look at the environment in one way or another (PATH in `execvp` or
 								        // accessing the `environ` pointer ourselves). Make sure no other thread
 								        // is accessing the environment when we do the fork itself.
 								        //
 								        // Note that as soon as we're done with the fork there's no need to hold
 								        // a lock any more because the parent won't do anything and the child is
-												explain mem::forget(env_lock) in fork/exec

											
										
										
											2022-12-12 09:49:42 +01:00
+								        // in its own process. Thus the parent drops the lock guard immediately.
 								        // The child calls `mem::forget` to leak the lock, which is crucial because
 								        // releasing a lock is not async-signal-safe.
-												Add Linux-specific pidfd process extensions

Background:

Over the last year, pidfd support was added to the Linux kernel. This
allows interacting with other processes. In particular, this allows
waiting on a child process with a timeout in a race-free way, bypassing
all of the awful signal-handler tricks that are usually required.

Pidfds can be obtained for a child process (as well as any other
process) via the `pidfd_open` syscall. Unfortunately, this requires
several conditions to hold in order to be race-free (i.e. the pid is not
reused).
Per `man pidfd_open`:

```
· the disposition of SIGCHLD has not been explicitly set to SIG_IGN
 (see sigaction(2));

· the SA_NOCLDWAIT flag was not specified while establishing a han‐
 dler for SIGCHLD or while setting the disposition of that signal to
 SIG_DFL (see sigaction(2)); and

· the zombie process was not reaped elsewhere in the program (e.g.,
 either by an asynchronously executed signal handler or by wait(2)
 or similar in another thread).

If any of these conditions does not hold, then the child process
(along with a PID file descriptor that refers to it) should instead
be created using clone(2) with the CLONE_PIDFD flag.
```

Sadly, these conditions are impossible to guarantee once any libraries
are used. For example, C code running in a different thread could call
`wait()`, which is impossible to detect from Rust code trying to open a
pidfd.

While pid reuse issues should (hopefully) be rare in practice, we can do
better. By passing the `CLONE_PIDFD` flag to `clone()` or `clone3()`, we
can obtain a pidfd for the child process in a guaranteed race-free
manner.

This PR:

This PR adds Linux-specific process extension methods to allow obtaining
pidfds for processes spawned via the standard `Command` API. Other than
being made available to user code, the standard library does not make
use of these pidfds in any way. In particular, the implementation of
`Child::wait` is completely unchanged.

Two Linux-specific helper methods are added: `CommandExt::create_pidfd`
and `ChildExt::pidfd`. These methods are intended to serve as a building
block for libraries to build higher-level abstractions - in particular,
waiting on a process with a timeout.

I've included a basic test, which verifies that pidfds are created iff
the `create_pidfd` method is used. This test is somewhat special - it
should always succeed on systems with the `clone3` system call
available, and always fail on systems without `clone3` available. I'm
not sure how to best ensure this programmatically.

This PR relies on the newer `clone3` system call to pass the `CLONE_PIDFD` flag,
rather than the older `clone` system call. `clone3` was added to Linux
in the same release as pidfds, so this shouldn't unnecessarily limit the
kernel versions that this code supports.

Unresolved questions:
* What should the name of the feature gate be for these newly added
  methods?
* Should the `pidfd` method distinguish between an error occurring
  and `create_pidfd` not being called?

											
										
										
											2020-09-15 23:35:08 -04:00
+								        let env_lock = sys::os::env_read_lock();
-												open pidfd in child process and send to the parent via SOCK_SEQPACKET+CMSG

This is a 100% race-free way to obtain a child's pidfd while
avoiding `clone3`.

											
										
										
											2023-07-22 02:30:13 +02:00
+								        let pid = unsafe { self.do_fork()? };
-												std: Synchronize access to global env during `exec`

This commit, after reverting #55359, applies a different fix for #46775
while also fixing #55775. The basic idea was to go back to pre-#55359
libstd, and then fix #46775 in a way that doesn't expose #55775.

The issue described in #46775 boils down to two problems:

* First, the global environment is reset during `exec`, but if the
  `exec` call fails then the global environment was a dangling pointer
  into free'd memory as the block of memory was deallocated when
  `Command` is dropped. This is fixed in this commit by installing a
  `Drop` stack object which ensures that the `environ` pointer is
  preserved on a failing `exec`.

* Second, the global environment was accessed in an unsynchronized
  fashion during `exec`. This was fixed by ensuring that the
  Rust-specific environment lock is acquired for these system-level
  operations.

Thanks to Alex Gaynor for pioneering the solution here!

Closes #55775

Co-authored-by: Alex Gaynor <alex.gaynor@gmail.com>

											
										
										
											2018-11-13 14:57:10 -08:00
-												Simplify Command::spawn (no semantic change)

This minimizes the size of an unsafe block, and allows outdenting some
complex code.

											
										
										
											2021-03-15 13:35:47 -07:00
+								        if pid == 0 {
-												panic/fork: Command: Do not unwind after fork() in child

Unwinding after fork() in the child is UB on some platforms, because
on those (including musl) malloc can be UB in the child of a
multithreaded program, and unwinding must box for the payload.

Even if it's safe, unwinding past fork() in the child causes whatever
traps the unwind to return twice.  This is very strange and clearly
not desirable.  With the default behaviour of the thread library, this
can even result in a panic in the child being transformed into zero
exit status (ie, success) as seen in the parent!

Fixes #79740.

Signed-off-by: Ian Jackson <ijackson@chiark.greenend.org.uk>

											
										
										
											2021-04-20 20:04:31 +01:00
+								            crate::panic::always_abort();
-												explain mem::forget(env_lock) in fork/exec

											
										
										
											2022-12-12 09:49:42 +01:00
+								            mem::forget(env_lock); // avoid non-async-signal-safe unlocking
-												Simplify Command::spawn (no semantic change)

This minimizes the size of an unsafe block, and allows outdenting some
complex code.

											
										
										
											2021-03-15 13:35:47 -07:00
+								            drop(input);
-												open pidfd in child process and send to the parent via SOCK_SEQPACKET+CMSG

This is a 100% race-free way to obtain a child's pidfd while
avoiding `clone3`.

											
										
										
											2023-07-22 02:30:13 +02:00
+								            #[cfg(target_os = "linux")]
 								            if self.get_create_pidfd() {
 								                self.send_pidfd(&output);
 								            }
-												Simplify Command::spawn (no semantic change)

This minimizes the size of an unsafe block, and allows outdenting some
complex code.

											
										
										
											2021-03-15 13:35:47 -07:00
+								            let Err(err) = unsafe { self.do_exec(theirs, envp.as_ref()) };
 								            let errno = err.raw_os_error().unwrap_or(libc::EINVAL) as u32;
 								            let errno = errno.to_be_bytes();
 								            let bytes = [
 								                errno[0],
 								                errno[1],
 								                errno[2],
 								                errno[3],
 								                CLOEXEC_MSG_FOOTER[0],
 								                CLOEXEC_MSG_FOOTER[1],
 								                CLOEXEC_MSG_FOOTER[2],
 								                CLOEXEC_MSG_FOOTER[3],
 								            ];
 								            // pipe I/O up to PIPE_BUF bytes should be atomic, and then
 								            // we want to be sure we *don't* run at_exit destructors as
 								            // we're being torn down regardless
 								            rtassert!(output.write(&bytes).is_ok());
 								            unsafe { libc::_exit(1) }
 								        }
-												Separated fuchsia-specific process stuff into 'process_fuchsia.rs' and refactored out some now-duplicated code into a 'process_common.rs'

											
										
										
											2016-11-23 13:58:13 -08:00
-												Simplify Command::spawn (no semantic change)

This minimizes the size of an unsafe block, and allows outdenting some
complex code.

											
										
										
											2021-03-15 13:35:47 -07:00
+								        drop(env_lock);
-												Separated fuchsia-specific process stuff into 'process_fuchsia.rs' and refactored out some now-duplicated code into a 'process_common.rs'

											
										
										
											2016-11-23 13:58:13 -08:00
+								        drop(output);
-												Simplify Command::spawn (no semantic change)

This minimizes the size of an unsafe block, and allows outdenting some
complex code.

											
										
										
											2021-03-15 13:35:47 -07:00
-												open pidfd in child process and send to the parent via SOCK_SEQPACKET+CMSG

This is a 100% race-free way to obtain a child's pidfd while
avoiding `clone3`.

											
										
										
											2023-07-22 02:30:13 +02:00
+								        #[cfg(target_os = "linux")]
 								        let pidfd = if self.get_create_pidfd() { self.recv_pidfd(&input) } else { -1 };
 								        #[cfg(not(target_os = "linux"))]
 								        let pidfd = -1;
-												Finishing clone3 clean up

											
										
										
											2024-01-24 15:36:57 +03:00
+								        // Safety: We obtained the pidfd (on Linux) using SOCK_SEQPACKET, so it's valid.
-												Update PidFd for the new I/O safety APIs.

											
										
										
											2021-08-03 07:31:59 -05:00
+								        let mut p = unsafe { Process::new(pid, pidfd) };
-												Separated fuchsia-specific process stuff into 'process_fuchsia.rs' and refactored out some now-duplicated code into a 'process_common.rs'

											
										
										
											2016-11-23 13:58:13 -08:00
+								        let mut bytes = [0; 8];
 								        // loop to handle EINTR
 								        loop {
 								            match input.read(&mut bytes) {
 								                Ok(0) => return Ok((p, ours)),
 								                Ok(8) => {
-												process_unix: prefer i32::*_be_bytes over manually shifting bytes

											
										
										
											2020-07-12 16:47:15 +00:00
+								                    let (errno, footer) = bytes.split_at(4);
-												Remove combine function

Comparing two array directly helps generate better assert message

											
										
										
											2020-07-15 08:14:55 +00:00
+								                    assert_eq!(
 								                        CLOEXEC_MSG_FOOTER, footer,
-												Separated fuchsia-specific process stuff into 'process_fuchsia.rs' and refactored out some now-duplicated code into a 'process_common.rs'

											
										
										
											2016-11-23 13:58:13 -08:00
+								                        "Validation on the CLOEXEC pipe failed: {:?}",
 								                        bytes
 								                    );
-												Remove combine function

Comparing two array directly helps generate better assert message

											
										
										
											2020-07-15 08:14:55 +00:00
+								                    let errno = i32::from_be_bytes(errno.try_into().unwrap());
-												Separated fuchsia-specific process stuff into 'process_fuchsia.rs' and refactored out some now-duplicated code into a 'process_common.rs'

											
										
										
											2016-11-23 13:58:13 -08:00
+								                    assert!(p.wait().is_ok(), "wait() should either return Ok or panic");
 								                    return Err(Error::from_raw_os_error(errno));
 								                }
-												Use std::io::Error::is_interrupted everywhere

											
										
										
											2023-09-02 19:50:33 -04:00
+								                Err(ref e) if e.is_interrupted() => {}
-												Separated fuchsia-specific process stuff into 'process_fuchsia.rs' and refactored out some now-duplicated code into a 'process_common.rs'

											
										
										
											2016-11-23 13:58:13 -08:00
+								                Err(e) => {
 								                    assert!(p.wait().is_ok(), "wait() should either return Ok or panic");
-												Use implicit capture syntax in format_args

This updates the standard library's documentation to use the new syntax. The
documentation is worthwhile to update as it should be more idiomatic
(particularly for features like this, which are nice for users to get acquainted
with). The general codebase is likely more hassle than benefit to update: it'll
hurt git blame, and generally updates can be done by folks updating the code if
(and when) that makes things more readable with the new format.

A few places in the compiler and library code are updated (mostly just due to
already having been done when this commit was first authored).

											
										
										
											2022-02-12 23:16:17 +04:00
+								                    panic!("the CLOEXEC pipe failed: {e:?}")
-												Separated fuchsia-specific process stuff into 'process_fuchsia.rs' and refactored out some now-duplicated code into a 'process_common.rs'

											
										
										
											2016-11-23 13:58:13 -08:00
+								                }
 								                Ok(..) => {
 								                    // pipe I/O up to PIPE_BUF bytes should be atomic
-												open pidfd in child process and send to the parent via SOCK_SEQPACKET+CMSG

This is a 100% race-free way to obtain a child's pidfd while
avoiding `clone3`.

											
										
										
											2023-07-22 02:30:13 +02:00
+								                    // similarly SOCK_SEQPACKET messages should arrive whole
-												Separated fuchsia-specific process stuff into 'process_fuchsia.rs' and refactored out some now-duplicated code into a 'process_common.rs'

											
										
										
											2016-11-23 13:58:13 -08:00
+								                    assert!(p.wait().is_ok(), "wait() should either return Ok or panic");
 								                    panic!("short read on the CLOEXEC pipe")
 								                }
 								            }
 								        }
 								    }
-												Implement blocking output

This allows decoupling `Command::spawn` and `Command::output`. This is
useful for targets which do support launching programs in blocking mode
but do not support multitasking (Eg: UEFI).

This was originally conceived when working on https://github.com/rust-lang/rust/pull/100316

Signed-off-by: Ayush Singh <ayushsingh1325@gmail.com>

											
										
										
											2022-12-08 18:22:33 +05:30
+								    pub fn output(&mut self) -> io::Result<(ExitStatus, Vec<u8>, Vec<u8>)> {
 								        // Spawn the child with `Stdio::MakePipe` as the default stdio; a spawn
 								        // failure is propagated to the caller by `?`.
 								        // NOTE(review): the meaning of the `false` argument is not visible in
 								        // this chunk -- confirm against `spawn`'s signature.
 								        let (proc, pipes) = self.spawn(Stdio::MakePipe, false)?;
 								        // Hand the process and its pipes to the shared helper and return its
 								        // result unchanged (exit status plus two byte buffers, presumably the
 								        // captured stdout and stderr).
 								        crate::sys_common::process::wait_with_output(proc, pipes)
 								    }
-												Actually save all the files

											
										
										
											2023-06-04 10:13:16 -07:00
+								    // WatchOS and TVOS headers mark the `fork`/`exec*` functions with
 								    // `__WATCHOS_PROHIBITED __TVOS_PROHIBITED`, and indicate that the
 								    // `posix_spawn*` functions should be used instead. It isn't entirely clear
 								    // what `PROHIBITED` means here (e.g. if calls to these functions are
 								    // allowed to exist in dead code), but it sounds bad, so we go out of our
 								    // way to avoid that altogether.
-												Avoid fork/exec spawning on tvOS/watchOS, as those functions are marked as prohibited

											
										
										
											2023-06-04 09:46:18 -07:00
+								    #[cfg(any(target_os = "tvos", target_os = "watchos"))]
 								    const ERR_APPLE_TV_WATCH_NO_FORK_EXEC: Error = io::const_io_error!(
 								        ErrorKind::Unsupported,
 								        "`fork`+`exec`-based process spawning is not supported on this target",
 								    );
 								    #[cfg(any(target_os = "tvos", target_os = "watchos"))]
-												open pidfd in child process and send to the parent via SOCK_SEQPACKET+CMSG

This is a 100% race-free way to obtain a child's pidfd while
avoiding `clone3`.

											
										
										
											2023-07-22 02:30:13 +02:00
+								    unsafe fn do_fork(&mut self) -> Result<pid_t, io::Error> {
-												Avoid fork/exec spawning on tvOS/watchOS, as those functions are marked as prohibited

											
										
										
											2023-06-04 09:46:18 -07:00
+								        return Err(Self::ERR_APPLE_TV_WATCH_NO_FORK_EXEC);
 								    }
-												Add PidFd type and seal traits

Improve docs

Split do_fork into two

Make do_fork unsafe

Add target attribute to create_pidfd field in Command

Add method to get create_pidfd value

											
										
										
											2021-02-06 14:15:49 +01:00
+								    // Attempts to fork the process. If successful, returns Ok(0)
 								    // in the child, and Ok(child_pid) in the parent.
-												Avoid fork/exec spawning on tvOS/watchOS, as those functions are marked as prohibited

											
										
										
											2023-06-04 09:46:18 -07:00
+								    #[cfg(not(any(
 								        target_os = "watchos",
 								        target_os = "tvos",
 								        all(target_os = "nto", target_env = "nto71"),
 								    )))]
-												open pidfd in child process and send to the parent via SOCK_SEQPACKET+CMSG

This is a 100% race-free way to obtain a child's pidfd while
avoiding `clone3`.

											
										
										
											2023-07-22 02:30:13 +02:00
+								    unsafe fn do_fork(&mut self) -> Result<pid_t, io::Error> {
 								        cvt(libc::fork())
-												Add PidFd type and seal traits

Improve docs

Split do_fork into two

Make do_fork unsafe

Add target attribute to create_pidfd field in Command

Add method to get create_pidfd value

											
										
										
											2021-02-06 14:15:49 +01:00
+								    }
-												Add Linux-specific pidfd process extensions

Background:

Over the last year, pidfd support was added to the Linux kernel. This
allows interacting with other processes. In particular, this allows
waiting on a child process with a timeout in a race-free way, bypassing
all of the awful signal-handler tricks that are usually required.

Pidfds can be obtained for a child process (as well as any other
process) via the `pidfd_open` syscall. Unfortunately, this requires
several conditions to hold in order to be race-free (i.e. the pid is not
reused).
Per `man pidfd_open`:

```
· the disposition of SIGCHLD has not been explicitly set to SIG_IGN
 (see sigaction(2));

· the SA_NOCLDWAIT flag was not specified while establishing a han‐
 dler for SIGCHLD or while setting the disposition of that signal to
 SIG_DFL (see sigaction(2)); and

· the zombie process was not reaped elsewhere in the program (e.g.,
 either by an asynchronously executed signal handler or by wait(2)
 or similar in another thread).

If any of these conditions does not hold, then the child process
(along with a PID file descriptor that refers to it) should instead
be created using clone(2) with the CLONE_PIDFD flag.
```

Sadly, these conditions are impossible to guarantee once any libraries
are used. For example, C code running in a different thread could call
`wait()`, which is impossible to detect from Rust code trying to open a
pidfd.

While pid reuse issues should (hopefully) be rare in practice, we can do
better. By passing the `CLONE_PIDFD` flag to `clone()` or `clone3()`, we
can obtain a pidfd for the child process in a guaranteed race-free
manner.

This PR:

This PR adds Linux-specific process extension methods to allow obtaining
pidfds for processes spawned via the standard `Command` API. Other than
being made available to user code, the standard library does not make
use of these pidfds in any way. In particular, the implementation of
`Child::wait` is completely unchanged.

Two Linux-specific helper methods are added: `CommandExt::create_pidfd`
and `ChildExt::pidfd`. These methods are intended to serve as a building
block for libraries to build higher-level abstractions - in particular,
waiting on a process with a timeout.

I've included a basic test, which verifies that pidfds are created iff
the `create_pidfd` method is used. This test is somewhat special - it
should always succeed on systems with the `clone3` system call
available, and always fail on systems without `clone3` available. I'm
not sure how to best ensure this programmatically.

This PR relies on the newer `clone3` system call to pass the `CLONE_PIDFD` flag,
rather than the older `clone` system call. `clone3` was added to Linux
in the same release as pidfds, so this shouldn't unnecessarily limit the
kernel versions that this code supports.

Unresolved questions:
* What should the name of the feature gate be for these newly added
  methods?
* Should the `pidfd` method distinguish between an error occurring
  and `create_pidfd` not being called?

											
										
										
											2020-09-15 23:35:08 -04:00
-												Retry to spawn/fork up to 3 times when it failed because of an interruption

											
										
										
											2023-02-10 15:27:22 +01:00
+								    // On QNX Neutrino, fork can fail with EBADF in case "another thread might have opened
 								    // or closed a file descriptor while the fork() was occurring".
 								    // Documentation says "... or try calling fork() again". This is what we do here.
 								    // See also https://www.qnx.com/developers/docs/7.1/#com.qnx.doc.neutrino.lib_ref/topic/f/fork.html
 								    #[cfg(all(target_os = "nto", target_env = "nto71"))]
-												open pidfd in child process and send to the parent via SOCK_SEQPACKET+CMSG

This is a 100% race-free way to obtain a child's pidfd while
avoiding `clone3`.

											
										
										
											2023-07-22 02:30:13 +02:00
+								    unsafe fn do_fork(&mut self) -> Result<pid_t, io::Error> {
-												Retry to spawn/fork up to 3 times when it failed because of an interruption

											
										
										
											2023-02-10 15:27:22 +01:00
+								        use crate::sys::os::errno;
-												Retry to fork/spawn with exponential backoff

											
										
										
											2023-03-18 18:45:51 +01:00
+								        let mut delay = MIN_FORKSPAWN_SLEEP;
-												Retry to spawn/fork up to 3 times when it failed because of an interruption

											
										
										
											2023-02-10 15:27:22 +01:00
+								        loop {
 								            let r = libc::fork();
-												Retry to fork/spawn with exponential backoff

											
										
										
											2023-03-18 18:45:51 +01:00
+								            if r == -1 as libc::pid_t && errno() as libc::c_int == libc::EBADF {
-												Only determine clock res once; give up before sleeping more than 1 second

											
										
										
											2023-06-02 17:52:14 +02:00
+								                if delay < get_clock_resolution() {
-												Retry to fork/spawn with exponential backoff

											
										
										
											2023-03-18 18:45:51 +01:00
+								                    // We cannot sleep this short (it would be longer).
 								                    // Yield instead.
 								                    thread::yield_now();
-												Only determine clock res once; give up before sleeping more than 1 second

											
										
										
											2023-06-02 17:52:14 +02:00
+								                } else if delay < MAX_FORKSPAWN_SLEEP {
-												Retry to fork/spawn with exponential backoff

											
										
										
											2023-03-18 18:45:51 +01:00
+								                    thread::sleep(delay);
-												Only determine clock res once; give up before sleeping more than 1 second

											
										
										
											2023-06-02 17:52:14 +02:00
+								                } else {
 								                    return Err(io::const_io_error!(
 								                        ErrorKind::WouldBlock,
 								                        "forking returned EBADF too often",
 								                    ));
-												Retry to fork/spawn with exponential backoff

											
										
										
											2023-03-18 18:45:51 +01:00
+								                }
 								                delay *= 2;
 								                continue;
-												Retry to spawn/fork up to 3 times when it failed because of an interruption

											
										
										
											2023-02-10 15:27:22 +01:00
+								            } else {
-												open pidfd in child process and send to the parent via SOCK_SEQPACKET+CMSG

This is a 100% race-free way to obtain a child's pidfd while
avoiding `clone3`.

											
										
										
											2023-07-22 02:30:13 +02:00
+								                return cvt(r);
-												Add Linux-specific pidfd process extensions

Background:

Over the last year, pidfd support was added to the Linux kernel. This
allows interacting with other processes. In particular, this allows
waiting on a child process with a timeout in a race-free way, bypassing
all of the awful signal-handler tricks that are usually required.

Pidfds can be obtained for a child process (as well as any other
process) via the `pidfd_open` syscall. Unfortunately, this requires
several conditions to hold in order to be race-free (i.e. the pid is not
reused).
Per `man pidfd_open`:

```
· the disposition of SIGCHLD has not been explicitly set to SIG_IGN
 (see sigaction(2));

· the SA_NOCLDWAIT flag was not specified while establishing a han‐
 dler for SIGCHLD or while setting the disposition of that signal to
 SIG_DFL (see sigaction(2)); and

· the zombie process was not reaped elsewhere in the program (e.g.,
 either by an asynchronously executed signal handler or by wait(2)
 or similar in another thread).

If any of these conditions does not hold, then the child process
(along with a PID file descriptor that refers to it) should instead
be created using clone(2) with the CLONE_PIDFD flag.
```

Sadly, these conditions are impossible to guarantee once any libraries
are used. For example, C code running in a different thread could call
`wait()`, which is impossible to detect from Rust code trying to open a
pidfd.

While pid reuse issues should (hopefully) be rare in practice, we can do
better. By passing the `CLONE_PIDFD` flag to `clone()` or `clone3()`, we
can obtain a pidfd for the child process in a guaranteed race-free
manner.

This PR:

This PR adds Linux-specific process extension methods to allow obtaining
pidfds for processes spawned via the standard `Command` API. Other than
being made available to user code, the standard library does not make
use of these pidfds in any way. In particular, the implementation of
`Child::wait` is completely unchanged.

Two Linux-specific helper methods are added: `CommandExt::create_pidfd`
and `ChildExt::pidfd`. These methods are intended to serve as a building
block for libraries to build higher-level abstractions - in particular,
waiting on a process with a timeout.

I've included a basic test, which verifies that pidfds are created iff
the `create_pidfd` method is used. This test is somewhat special - it
should always succeed on systems with the `clone3` system call
available, and always fail on systems without `clone3` available. I'm
not sure how to best ensure this programmatically.

This PR relies on the newer `clone3` system call to pass the `CLONE_PIDFD` flag,
rather than the older `clone` system call. `clone3` was added to Linux
in the same release as pidfds, so this shouldn't unnecessarily limit the
kernel versions that this code supports.

Unresolved questions:
* What should the name of the feature gate be for these newly added
  methods?
* Should the `pidfd` method distinguish between an error occurring
  and `create_pidfd` not being called?

											
										
										
											2020-09-15 23:35:08 -04:00
+								            }
 								        }
-												Add PidFd type and seal traits

Improve docs

Split do_fork into two

Make do_fork unsafe

Add target attribute to create_pidfd field in Command

Add method to get create_pidfd value

											
										
										
											2021-02-06 14:15:49 +01:00
+								    }
-												Add Linux-specific pidfd process extensions

Background:

Over the last year, pidfd support was added to the Linux kernel. This
allows interacting with other processes. In particular, this allows
waiting on a child process with a timeout in a race-free way, bypassing
all of the awful signal-handler tricks that are usually required.

Pidfds can be obtained for a child process (as well as any other
process) via the `pidfd_open` syscall. Unfortunately, this requires
several conditions to hold in order to be race-free (i.e. the pid is not
reused).
Per `man pidfd_open`:

```
· the disposition of SIGCHLD has not been explicitly set to SIG_IGN
 (see sigaction(2));

· the SA_NOCLDWAIT flag was not specified while establishing a han‐
 dler for SIGCHLD or while setting the disposition of that signal to
 SIG_DFL (see sigaction(2)); and

· the zombie process was not reaped elsewhere in the program (e.g.,
 either by an asynchronously executed signal handler or by wait(2)
 or similar in another thread).

If any of these conditions does not hold, then the child process
(along with a PID file descriptor that refers to it) should instead
be created using clone(2) with the CLONE_PIDFD flag.
```

Sadly, these conditions are impossible to guarantee once any libraries
are used. For example, C code running in a different thread could call
`wait()`, which is impossible to detect from Rust code trying to open a
pidfd.

While pid reuse issues should (hopefully) be rare in practice, we can do
better. By passing the `CLONE_PIDFD` flag to `clone()` or `clone3()`, we
can obtain a pidfd for the child process in a guaranteed race-free
manner.

This PR:

This PR adds Linux-specific process extension methods to allow obtaining
pidfds for processes spawned via the standard `Command` API. Other than
being made available to user code, the standard library does not make
use of these pidfds in any way. In particular, the implementation of
`Child::wait` is completely unchanged.

Two Linux-specific helper methods are added: `CommandExt::create_pidfd`
and `ChildExt::pidfd`. These methods are intended to serve as a building
block for libraries to build higher-level abstractions - in particular,
waiting on a process with a timeout.

I've included a basic test, which verifies that pidfds are created iff
the `create_pidfd` method is used. This test is somewhat special - it
should always succeed on systems with the `clone3` system call
available, and always fail on systems without `clone3` available. I'm
not sure how to best ensure this programmatically.

This PR relies on the newer `clone3` system call to pass the `CLONE_PIDFD` flag,
rather than the older `clone` system call. `clone3` was added to Linux
in the same release as pidfds, so this shouldn't unnecessarily limit the
kernel versions that this code supports.

Unresolved questions:
* What should the name of the feature gate be for these newly added
  methods?
* Should the `pidfd` method distinguish between an error occurring
  and `create_pidfd` not being called?

											
										
										
											2020-09-15 23:35:08 -04:00
-												Separated fuchsia-specific process stuff into 'process_fuchsia.rs' and refactored out some now-duplicated code into a 'process_common.rs'

											
										
										
											2016-11-23 13:58:13 -08:00
+								    pub fn exec(&mut self, default: Stdio) -> io::Error {
-												Capture environment at spawn

											
										
										
											2017-12-17 15:21:47 +00:00
+								        let envp = self.capture_env();
-												Separated fuchsia-specific process stuff into 'process_fuchsia.rs' and refactored out some now-duplicated code into a 'process_common.rs'

											
										
										
											2016-11-23 13:58:13 -08:00
+								        if self.saw_nul() {
-												Hide Repr details from io::Error, and rework `io::Error::new_const`.

											
										
										
											2021-08-08 01:04:33 -07:00
+								            return io::const_io_error!(ErrorKind::InvalidInput, "nul byte found in provided data",);
-												Separated fuchsia-specific process stuff into 'process_fuchsia.rs' and refactored out some now-duplicated code into a 'process_common.rs'

											
										
										
											2016-11-23 13:58:13 -08:00
+								        }
 								        match self.setup_io(default, true) {
-												std: Synchronize access to global env during `exec`

This commit, after reverting #55359, applies a different fix for #46775
while also fixing #55775. The basic idea was to go back to pre-#55359
libstd, and then fix #46775 in a way that doesn't expose #55775.

The issue described in #46775 boils down to two problems:

* First, the global environment is reset during `exec`, but if the
  `exec` call fails then the global environment was a dangling pointer
  into free'd memory as the block of memory was deallocated when
  `Command` is dropped. This is fixed in this commit by installing a
  `Drop` stack object which ensures that the `environ` pointer is
  preserved on a failing `exec`.

* Second, the global environment was accessed in an unsynchronized
  fashion during `exec`. This was fixed by ensuring that the
  Rust-specific environment lock is acquired for these system-level
  operations.

Thanks to Alex Gaynor for pioneering the solution here!

Closes #55775

Co-authored-by: Alex Gaynor <alex.gaynor@gmail.com>

											
										
										
											2018-11-13 14:57:10 -08:00
+								            Ok((_, theirs)) => {
 								                unsafe {
 								                    // Similar to when forking, we want to ensure that access to
 								                    // the environment is synchronized, so make sure to grab the
 								                    // environment lock before we try to exec.
-												Revert "Revert "use RWlock when accessing os::env #81850""

This reverts commit acdca316c3d42299d31c1b47eb792006ffdfc29c.

											
										
										
											2021-03-14 19:10:34 +01:00
+								                    let _lock = sys::os::env_read_lock();
-												std: Synchronize access to global env during `exec`

This commit, after reverting #55359, applies a different fix for #46775
while also fixing #55775. The basic idea was to go back to pre-#55359
libstd, and then fix #46775 in a way that doesn't expose #55775.

The issue described in #46775 boils down to two problems:

* First, the global environment is reset during `exec`, but if the
  `exec` call fails then the global environment was a dangling pointer
  into free'd memory as the block of memory was deallocated when
  `Command` is dropped. This is fixed in this commit by installing a
  `Drop` stack object which ensures that the `environ` pointer is
  preserved on a failing `exec`.

* Second, the global environment was accessed in an unsynchronized
  fashion during `exec`. This was fixed by ensuring that the
  Rust-specific environment lock is acquired for these system-level
  operations.

Thanks to Alex Gaynor for pioneering the solution here!

Closes #55775

Co-authored-by: Alex Gaynor <alex.gaynor@gmail.com>

											
										
										
											2018-11-13 14:57:10 -08:00
-												use exhaustive_patterns to be able to use `?`

											
										
										
											2019-05-06 15:40:34 +02:00
+								                    let Err(e) = self.do_exec(theirs, envp.as_ref());
 								                    e
-												std: Synchronize access to global env during `exec`

This commit, after reverting #55359, applies a different fix for #46775
while also fixing #55775. The basic idea was to go back to pre-#55359
libstd, and then fix #46775 in a way that doesn't expose #55775.

The issue described in #46775 boils down to two problems:

* First, the global environment is reset during `exec`, but if the
  `exec` call fails then the global environment was a dangling pointer
  into free'd memory as the block of memory was deallocated when
  `Command` is dropped. This is fixed in this commit by installing a
  `Drop` stack object which ensures that the `environ` pointer is
  preserved on a failing `exec`.

* Second, the global environment was accessed in an unsynchronized
  fashion during `exec`. This was fixed by ensuring that the
  Rust-specific environment lock is acquired for these system-level
  operations.

Thanks to Alex Gaynor for pioneering the solution here!

Closes #55775

Co-authored-by: Alex Gaynor <alex.gaynor@gmail.com>

											
										
										
											2018-11-13 14:57:10 -08:00
+								                }
 								            }
-												Separated fuchsia-specific process stuff into 'process_fuchsia.rs' and refactored out some now-duplicated code into a 'process_common.rs'

											
										
										
											2016-11-23 13:58:13 -08:00
+								            Err(e) => e,
 								        }
 								    }
 								    // And at this point we've reached a special time in the life of the
 								    // child. The child must now be considered hamstrung and unable to
 								    // do anything other than syscalls really. Consider the following
 								    // scenario:
 								    //
 								    //      1. Thread A of process 1 grabs the malloc() mutex
 								    //      2. Thread B of process 1 forks(), creating thread C
 								    //      3. Thread C of process 2 then attempts to malloc()
 								    //      4. The memory of process 2 is the same as the memory of
 								    //         process 1, so the mutex is locked.
 								    //
 								    // This situation looks a lot like deadlock, right? It turns out
 								    // that this is what pthread_atfork() takes care of, which is
 								    // presumably implemented across platforms. The first thing that
 								    // threads do *before* forking is to do things like grab the malloc
 								    // mutex, and then after the fork they unlock it.
 								    //
 								    // Despite this information, libnative's spawn has been witnessed to
-												Update usages of 'OSX' (and other old names) to 'macOS'.

As of last year with version 'Sierra', the Mac operating system is now
called 'macOS'.

											
										
										
											2017-03-12 14:13:35 -04:00
+								    // deadlock on both macOS and FreeBSD. I'm not entirely sure why, but
-												Separated fuchsia-specific process stuff into 'process_fuchsia.rs' and refactored out some now-duplicated code into a 'process_common.rs'

											
										
										
											2016-11-23 13:58:13 -08:00
+								    // all collected backtraces point at malloc/free traffic in the
 								    // child spawned process.
 								    //
 								    // For this reason, the block of code below should contain 0
 								    // invocations of either malloc or free (or their related friends).
 								    //
 								    // As an example of not having malloc/free traffic, we don't close
 								    // this file descriptor by dropping the FileDesc (which contains an
 								    // allocation). Instead we just close it manually. This will never
 								    // have the drop glue anyway because this code never returns (the
 								    // child will either exec() or invoke libc::exit)
-												Avoid fork/exec spawning on tvOS/watchOS, as those functions are marked as prohibited

											
										
										
											2023-06-04 09:46:18 -07:00
+								    #[cfg(not(any(target_os = "tvos", target_os = "watchos")))]
-												Capture environment at spawn

											
										
										
											2017-12-17 15:21:47 +00:00
+								    unsafe fn do_exec(
 								        &mut self,
 								        stdio: ChildPipes,
-												Revert "Fixes #46775 -- don't mutate the process's environment in Command::exec"

This reverts commit 36fe3b605a7a7143a14565272140ba1b43c1b041.

											
										
										
											2018-11-13 14:50:50 -08:00
+								        maybe_envp: Option<&CStringArray>,
-												use exhaustive_patterns to be able to use `?`

											
										
										
											2019-05-06 15:40:34 +02:00
+								    ) -> Result<!, io::Error> {
-												libstd => 2018

											
										
										
											2019-02-11 04:23:21 +09:00
+								        use crate::sys::{self, cvt_r};
-												Separated fuchsia-specific process stuff into 'process_fuchsia.rs' and refactored out some now-duplicated code into a 'process_common.rs'

											
										
										
											2016-11-23 13:58:13 -08:00
 								        if let Some(fd) = stdio.stdin.fd() {
-												convert custom try macro to `?`

resolves #60580

											
										
										
											2019-05-06 14:54:27 +02:00
+								            cvt_r(|| libc::dup2(fd, libc::STDIN_FILENO))?;
-												Separated fuchsia-specific process stuff into 'process_fuchsia.rs' and refactored out some now-duplicated code into a 'process_common.rs'

											
										
										
											2016-11-23 13:58:13 -08:00
+								        }
 								        if let Some(fd) = stdio.stdout.fd() {
-												convert custom try macro to `?`

resolves #60580

											
										
										
											2019-05-06 14:54:27 +02:00
+								            cvt_r(|| libc::dup2(fd, libc::STDOUT_FILENO))?;
-												Separated fuchsia-specific process stuff into 'process_fuchsia.rs' and refactored out some now-duplicated code into a 'process_common.rs'

											
										
										
											2016-11-23 13:58:13 -08:00
+								        }
 								        if let Some(fd) = stdio.stderr.fd() {
-												convert custom try macro to `?`

resolves #60580

											
										
										
											2019-05-06 14:54:27 +02:00
+								            cvt_r(|| libc::dup2(fd, libc::STDERR_FILENO))?;
-												Separated fuchsia-specific process stuff into 'process_fuchsia.rs' and refactored out some now-duplicated code into a 'process_common.rs'

											
										
										
											2016-11-23 13:58:13 -08:00
+								        }
-												remove any from cfgs
											
										
										
											2019-08-19 20:02:50 +00:00
+								        #[cfg(not(target_os = "l4re"))]
-												cfg fix 2
											
										
										
											2019-08-19 20:01:02 +00:00
+								        {
-												Add setgroups to std::os::unix::process::CommandExt

											
										
										
											2020-06-15 21:39:34 -07:00
+								            if let Some(_g) = self.get_groups() {
 								                //FIXME: Redox kernel does not support setgroups yet
 								                #[cfg(not(target_os = "redox"))]
 								                cvt(libc::setgroups(_g.len().try_into().unwrap(), _g.as_ptr()))?;
 								            }
-												Match c_char definitions and enable signal reset for L4Re

*   Match definition of c_char in os/raw.rs with the libc definition

    Due to historic reasons, os/raw.rs redefines types for c_char from
    libc, but these didn't match. Now they do :).

*   Enable signal reset on exec for L4Re

    L4Re has full signal emulation and hence it needs to reset the
    signal set of the child with sigemptyset. However, gid and uid
    should *not* be set.

											
										
										
											2017-08-17 13:23:00 +02:00
+								            if let Some(u) = self.get_gid() {
-												convert custom try macro to `?`

resolves #60580

											
										
										
											2019-05-06 14:54:27 +02:00
+								                cvt(libc::setgid(u as gid_t))?;
-												Match c_char definitions and enable signal reset for L4Re

*   Match definition of c_char in os/raw.rs with the libc definition

    Due to historic reasons, os/raw.rs redefines types for c_char from
    libc, but these didn't match. Now they do :).

*   Enable signal reset on exec for L4Re

    L4Re has full signal emulation and hence it needs to reset the
    signal set of the child with sigemptyset. However, gid and uid
    should *not* be set.

											
										
										
											2017-08-17 13:23:00 +02:00
+								            }
 								            if let Some(u) = self.get_uid() {
-												fix cfg
											
										
										
											2019-08-19 19:58:35 +00:00
+								                // When dropping privileges from root, the `setgroups` call
-												Add setgroups to std::os::unix::process::CommandExt

											
										
										
											2020-06-15 21:39:34 -07:00
+								                // will remove any extraneous groups. We only drop groups
-												change std::process to drop supplementary groups based on CAP_SETGID

											
										
										
											2022-04-12 07:46:07 -07:00
+								                // if we have CAP_SETGID and we weren't given an explicit
-												Add setgroups to std::os::unix::process::CommandExt

											
										
										
											2020-06-15 21:39:34 -07:00
+								                // set of groups. If we don't call this, then even though our
 								                // uid has dropped, we may still have groups that enable us to
 								                // do super-user things.
-												redox: convert to target_family unix

											
										
										
											2019-04-07 08:39:54 -06:00
+								                //FIXME: Redox kernel does not support setgroups yet
-												fix cfg
											
										
										
											2019-08-19 19:58:35 +00:00
+								                #[cfg(not(target_os = "redox"))]
-												change std::process to drop supplementary groups based on CAP_SETGID

											
										
										
											2022-04-12 07:46:07 -07:00
+								                if self.get_groups().is_none() {
 								                    let res = cvt(libc::setgroups(0, crate::ptr::null()));
 								                    if let Err(e) = res {
 								                        // Here we ignore the case of not having CAP_SETGID.
 								                        // An alternative would be to require CAP_SETGID (in
 								                        // addition to CAP_SETUID) for setting the UID.
 								                        if e.raw_os_error() != Some(libc::EPERM) {
 								                            return Err(e.into());
 								                        }
 								                    }
-												Add setgroups to std::os::unix::process::CommandExt

											
										
										
											2020-06-15 21:39:34 -07:00
+								                }
-												convert custom try macro to `?`

resolves #60580

											
										
										
											2019-05-06 14:54:27 +02:00
+								                cvt(libc::setuid(u as uid_t))?;
-												Match c_char definitions and enable signal reset for L4Re

*   Match definition of c_char in os/raw.rs with the libc definition

    Due to historic reasons, os/raw.rs redefines types for c_char from
    libc, but these didn't match. Now they do :).

*   Enable signal reset on exec for L4Re

    L4Re has full signal emulation and hence it needs to reset the
    signal set of the child with sigemptyset. However, gid and uid
    should *not* be set.

											
										
										
											2017-08-17 13:23:00 +02:00
+								            }
-												Separated fuchsia-specific process stuff into 'process_fuchsia.rs' and refactored out some now-duplicated code into a 'process_common.rs'

											
										
										
											2016-11-23 13:58:13 -08:00
+								        }
 								        if let Some(ref cwd) = *self.get_cwd() {
-												convert custom try macro to `?`

resolves #60580

											
										
										
											2019-05-06 14:54:27 +02:00
+								            cvt(libc::chdir(cwd.as_ptr()))?;
-												Separated fuchsia-specific process stuff into 'process_fuchsia.rs' and refactored out some now-duplicated code into a 'process_common.rs'

											
										
										
											2016-11-23 13:58:13 -08:00
+								        }
-												Add a `process_group` method to UNIX `CommandExt`

											
										
										
											2022-02-03 09:40:45 +00:00
+								        if let Some(pgroup) = self.get_pgroup() {
 								            cvt(libc::setpgid(0, pgroup))?;
 								        }
-												Remove nacl from libstd

											
										
										
											2017-10-05 05:01:41 +02:00
+								        // emscripten has no signal support.
-												remove any from cfgs
											
										
										
											2019-08-19 20:02:50 +00:00
+								        #[cfg(not(target_os = "emscripten"))]
-												Update the libc submodule

Brings in a few fixes for wasm/asmjs

											
										
										
											2017-07-17 09:24:05 -07:00
+								        {
-												Change process spawning to inherit the parent's signal mask by default

Previously, the signal mask is always reset when a child process is
started. This breaks tools like `nohup` which expect `SIGHUP` to be
blocked.

With this change, the default behavior changes to inherit the signal mask.

This also changes the signal disposition for `SIGPIPE` to only be
changed if the `#[unix_sigpipe]` attribute isn't set.

											
										
										
											2022-09-22 22:48:14 -07:00
+								            // Inherit the signal mask from the parent rather than resetting it (i.e. do not call
 								            // pthread_sigmask).
-												Change `SIGPIPE` ui from `#[unix_sigpipe = "..."]` to `-Zon-broken-pipe=...`

In the stabilization attempt of `#[unix_sigpipe = "sig_dfl"]`, a concern
was raised related to using a language attribute for the feature: Long
term, we want `fn lang_start()` to be definable by any crate, not just
libstd. Having a special language attribute in that case becomes
awkward.

So as a first step towards the next stabilization attempt, this
PR changes the `#[unix_sigpipe = "..."]` attribute to a compiler flag
`-Zon-broken-pipe=...` to remove that concern, since now the language
is not "contaminated" by this feature.

Another point was also raised, namely that the ui should not leak
**how** it does things, but rather what the **end effect** is. The new
flag uses the proposed naming. This is of course something that can be
iterated on further before stabilization.

											
										
										
											2024-04-28 18:02:21 +02:00
+								            // If -Zon-broken-pipe is used, don't reset SIGPIPE to SIG_DFL.
 								            // If -Zon-broken-pipe is not used, reset SIGPIPE to SIG_DFL for backward compatibility.
-												Change process spawning to inherit the parent's signal mask by default

Previously, the signal mask is always reset when a child process is
started. This breaks tools like `nohup` which expect `SIGHUP` to be
blocked.

With this change, the default behavior changes to inherit the signal mask.

This also changes the signal disposition for `SIGPIPE` to only be
changed if the `#[unix_sigpipe]` attribute isn't set.

											
										
										
											2022-09-22 22:48:14 -07:00
+								            //
-												Change `SIGPIPE` ui from `#[unix_sigpipe = "..."]` to `-Zon-broken-pipe=...`

In the stabilization attempt of `#[unix_sigpipe = "sig_dfl"]`, a concern
was raised related to using a language attribute for the feature: Long
term, we want `fn lang_start()` to be definable by any crate, not just
libstd. Having a special language attribute in that case becomes
awkward.

So as a first step towards the next stabilization attempt, this
PR changes the `#[unix_sigpipe = "..."]` attribute to a compiler flag
`-Zon-broken-pipe=...` to remove that concern, since now the language
is not "contaminated" by this feature.

Another point was also raised, namely that the ui should not leak
**how** it does things, but rather what the **end effect** is. The new
flag uses the proposed naming. This is of course something that can be
iterated on further before stabilization.

											
										
										
											2024-04-28 18:02:21 +02:00
+								            // -Zon-broken-pipe is an opportunity to change the default here.
 								            if !crate::sys::pal::on_broken_pipe_flag_used() {
-												Change process spawning to inherit the parent's signal mask by default

Previously, the signal mask is always reset when a child process is
started. This breaks tools like `nohup` which expect `SIGHUP` to be
blocked.

With this change, the default behavior changes to inherit the signal mask.

This also changes the signal disposition for `SIGPIPE` to only be
changed if the `#[unix_sigpipe]` attribute isn't set.

											
										
										
											2022-09-22 22:48:14 -07:00
+								                #[cfg(target_os = "android")] // see issue #88585
 								                {
 								                    let mut action: libc::sigaction = mem::zeroed();
 								                    action.sa_sigaction = libc::SIG_DFL;
 								                    cvt(libc::sigaction(libc::SIGPIPE, &action, crate::ptr::null_mut()))?;
 								                }
 								                #[cfg(not(target_os = "android"))]
 								                {
 								                    let ret = sys::signal(libc::SIGPIPE, libc::SIG_DFL);
 								                    if ret == libc::SIG_ERR {
 								                        return Err(io::Error::last_os_error());
 								                    }
-												Call `libc::sigaction()` only on Android

											
										
										
											2021-10-01 21:22:18 +02:00
+								                }
-												added support for GNU/Hurd

											
										
										
											2023-09-19 12:41:30 +02:00
+								                #[cfg(target_os = "hurd")]
 								                {
 								                    let ret = sys::signal(libc::SIGLOST, libc::SIG_DFL);
 								                    if ret == libc::SIG_ERR {
 								                        return Err(io::Error::last_os_error());
 								                    }
 								                }
-												Separated fuchsia-specific process stuff into 'process_fuchsia.rs' and refactored out some now-duplicated code into a 'process_common.rs'

											
										
										
											2016-11-23 13:58:13 -08:00
+								            }
 								        }
 								        for callback in self.get_closures().iter_mut() {
-												convert custom try macro to `?`

resolves #60580

											
										
										
											2019-05-06 14:54:27 +02:00
+								            callback()?;
-												Separated fuchsia-specific process stuff into 'process_fuchsia.rs' and refactored out some now-duplicated code into a 'process_common.rs'

											
										
										
											2016-11-23 13:58:13 -08:00
+								        }
-												std: Synchronize access to global env during `exec`

This commit, after reverting #55359, applies a different fix for #46775
while also fixing #55775. The basic idea was to go back to pre-#55359
libstd, and then fix #46775 in a way that doesn't expose #55775.

The issue described in #46775 boils down to two problems:

* First, the global environment is reset during `exec`, but if the
  `exec` call fails then the global environment was a dangling pointer
  into free'd memory as the block of memory was deallocated when
  `Command` is dropped. This is fixed in this commit by installing a
  `Drop` stack object which ensures that the `environ` pointer is
  preserved on a failing `exec`.

* Second, the global environment was accessed in an unsynchronized
  fashion during `exec`. This was fixed by ensuring that the
  Rust-specific environment lock is acquired for these system-level
  operations.

Thanks to Alex Gaynor for pioneering the solution here!

Closes #55775

Co-authored-by: Alex Gaynor <alex.gaynor@gmail.com>

											
										
										
											2018-11-13 14:57:10 -08:00
+								        // Although we're performing an exec here we may also return with an
 								        // error from this function (without actually exec'ing) in which case we
 								        // want to be sure to restore the global environment back to what it
 								        // once was, ensuring that our temporary override, when free'd, doesn't
 								        // corrupt our process's environment.
 								        let mut _reset = None;
 								        if let Some(envp) = maybe_envp {
 								            struct Reset(*const *const libc::c_char);
 								            impl Drop for Reset {
 								                fn drop(&mut self) {
 								                    unsafe {
 								                        *sys::os::environ() = self.0;
 								                    }
 								                }
 								            }
 								            _reset = Some(Reset(*sys::os::environ()));
 								            *sys::os::environ() = envp.as_ptr();
 								        }
-												Add accessors to Command.

											
										
										
											2020-09-21 11:32:06 -07:00
+								        libc::execvp(self.get_program_cstr().as_ptr(), self.get_argv().as_ptr());
-												use exhaustive_patterns to be able to use `?`

											
										
										
											2019-05-06 15:40:34 +02:00
+								        Err(io::Error::last_os_error())
-												Separated fuchsia-specific process stuff into 'process_fuchsia.rs' and refactored out some now-duplicated code into a 'process_common.rs'

											
										
										
											2016-11-23 13:58:13 -08:00
+								    }
-												Support posix_spawn() when possible.

											
										
										
											2018-01-25 18:13:45 -08:00
-												Avoid fork/exec spawning on tvOS/watchOS, as those functions are marked as prohibited

											
										
										
											2023-06-04 09:46:18 -07:00
+								    #[cfg(any(target_os = "tvos", target_os = "watchos"))]
 								    // tvOS/watchOS variant of `do_exec`: it never attempts an exec and
 								    // unconditionally returns `ERR_APPLE_TV_WATCH_NO_FORK_EXEC`.
 								    //
 								    // Both parameters are unused here (hence the leading underscores);
 								    // the function body only constructs the error value.
 								    unsafe fn do_exec(
 								        &mut self,
 								        _stdio: ChildPipes,
 								        _maybe_envp: Option<&CStringArray>,
 								    ) -> Result<!, io::Error> {
 								        return Err(Self::ERR_APPLE_TV_WATCH_NO_FORK_EXEC);
 								    }
-												Support posix_spawn() for Linux glibc 2.24+.

The relevant support was added in https://sourceware.org/bugzilla/show_bug.cgi?id=10354#c12

											
										
										
											2018-03-02 13:02:38 -08:00
+								    #[cfg(not(any(
 								        target_os = "freebsd",
-												Add PidFd type and seal traits

Improve docs

Split do_fork into two

Make do_fork unsafe

Add target attribute to create_pidfd field in Command

Add method to get create_pidfd value

											
										
										
											2021-02-06 14:15:49 +01:00
+								        all(target_os = "linux", target_env = "gnu"),
 								        all(target_os = "linux", target_env = "musl"),
-												Add QNX Neutrino support to libstd

Co-authored-by: gh-tr <troach@qnx.com>

											
										
										
											2023-01-10 10:44:05 +01:00
+								        target_os = "nto",
-												Fix posix_spawn not being used on iOS and visionOS

`man posix_spawn` documents it to be able to return `ENOENT`, and there
should be nothing preventing this. Tested in the iOS simulator and on
Mac Catalyst.

											
										
										
											2024-04-28 22:34:51 +02:00
+								        target_vendor = "apple",
-												Support posix_spawn() for Linux glibc 2.24+.

The relevant support was added in https://sourceware.org/bugzilla/show_bug.cgi?id=10354#c12

											
										
										
											2018-03-02 13:02:38 -08:00
+								    )))]
-												Use _

											
										
										
											2018-03-02 08:50:37 -08:00
+								    fn posix_spawn(
 								        &mut self,
 								        _: &ChildPipes,
 								        _: Option<&CStringArray>,
-												Support posix_spawn() when possible.

											
										
										
											2018-01-25 18:13:45 -08:00
+								    ) -> io::Result<Option<Process>> {
 								        Ok(None)
 								    }
-												Add comment explaining when posix_spawn() can be supported.

											
										
										
											2018-03-01 09:18:16 -08:00
+								    // Only support platforms for which posix_spawn() can return ENOENT
 								    // directly.
-												Support posix_spawn() for Linux glibc 2.24+.

The relevant support was added in https://sourceware.org/bugzilla/show_bug.cgi?id=10354#c12

											
										
										
											2018-03-02 13:02:38 -08:00
+								    #[cfg(any(
 								        target_os = "freebsd",
-												Add PidFd type and seal traits

Improve docs

Split do_fork into two

Make do_fork unsafe

Add target attribute to create_pidfd field in Command

Add method to get create_pidfd value

											
										
										
											2021-02-06 14:15:49 +01:00
+								        all(target_os = "linux", target_env = "gnu"),
 								        all(target_os = "linux", target_env = "musl"),
-												Add QNX Neutrino support to libstd

Co-authored-by: gh-tr <troach@qnx.com>

											
										
										
											2023-01-10 10:44:05 +01:00
+								        target_os = "nto",
-												Fix posix_spawn not being used on iOS and visionOS

`man posix_spawn` documents it to be able to return `ENOENT`, and there
should be nothing preventing this. Tested in the iOS simulator and on
Mac Catalyst.

											
										
										
											2024-04-28 22:34:51 +02:00
+								        target_vendor = "apple",
-												Support posix_spawn() for Linux glibc 2.24+.

The relevant support was added in https://sourceware.org/bugzilla/show_bug.cgi?id=10354#c12

											
										
										
											2018-03-02 13:02:38 -08:00
+								    ))]
-												Support posix_spawn() when possible.

											
										
										
											2018-01-25 18:13:45 -08:00
+								    fn posix_spawn(
 								        &mut self,
 								        stdio: &ChildPipes,
 								        envp: Option<&CStringArray>,
 								    ) -> io::Result<Option<Process>> {
-												Avoid mem::uninitialized() in std::sys::unix

For `libc` types that will be initialized in FFI calls, we can just use
`MaybeUninit` and then pass around raw pointers.

For `sun_path_offset()`, which really wants `offset_of`, all callers
have a real `sockaddr_un` available, so we can use that reference.

											
										
										
											2019-06-26 15:03:15 -07:00
+								        use crate::mem::MaybeUninit;
-												visionOS: Fix unused import warning

The import is used once in this file, inside `posix_spawn`, so let's move the import into that function instead, to reduce the number of `cfg`s that need to be kept in sync.

											
										
										
											2024-04-10 14:59:11 +02:00
+								        use crate::sys::weak::weak;
-												Change `SIGPIPE` ui from `#[unix_sigpipe = "..."]` to `-Zon-broken-pipe=...`

In the stabilization attempt of `#[unix_sigpipe = "sig_dfl"]`, a concern
was raised related to using a language attribute for the feature: Long
term, we want `fn lang_start()` to be definable by any crate, not just
libstd. Having a special language attribute in that case becomes
awkward.

So as a first step towards the next stabilization attempt, this
PR changes the `#[unix_sigpipe = "..."]` attribute to a compiler flag
`-Zon-broken-pipe=...` to remove that concern, since now the language
is not "contaminated" by this feature.

Another point was also raised, namely that the ui should not leak
**how** it does things, but rather what the **end effect** is. The new
flag uses the proposed naming. This is of course something that can be
iterated on further before stabilization.

											
										
										
											2024-04-28 18:02:21 +02:00
+								        use crate::sys::{self, cvt_nz, on_broken_pipe_flag_used};
-												Support posix_spawn() when possible.

											
										
										
											2018-01-25 18:13:45 -08:00
-												Use posix_spawn_file_actions_addchdir_np when possible

This is a non-POSIX extension implemented in Solaris and in glibc 2.29.
With this we can still use `posix_spawn()` when `Command::current_dir()`
has been set, otherwise we fallback to `fork(); chdir(); exec()`.

											
										
										
											2019-02-13 12:20:23 -08:00
+								        if self.get_gid().is_some()
-												Support posix_spawn() when possible.

											
										
										
											2018-01-25 18:13:45 -08:00
+								            || self.get_uid().is_some()
-												Use posix_spawn() on unix if program is a path

Previously `Command::spawn` would fall back to the non-posix_spawn based
implementation if the `PATH` environment variable was possibly changed.
On systems with a modern (g)libc `posix_spawn()` can be significantly
faster. If program is a path itself the `PATH` environment variable is
not used for the lookup and it should be safe to use the
`posix_spawnp()` method. [1]

We found this, because we have a cli application that effectively runs a
lot of subprocesses. It would sometimes noticeably hang while printing
output. Profiling showed that the process was spending the majority of
time in the kernel's `copy_page_range` function while spawning
subprocesses. During this time the process is completely blocked from
running, explaining why users were reporting the cli app hanging.

Through this we discovered that `std::process::Command` has a fast and
slow path for process execution. The fast path is backed by
`posix_spawnp()` and the slow path by fork/exec syscalls being called
explicitly. Using fork for process creation is supposed to be fast, but
it slows down as your process uses more memory.  It's not because the
kernel copies the actual memory from the parent, but it does need to
copy the references to it (see `copy_page_range` above!).  We ended up
using the slow path, because the command spawn implementation falls
back to the slow path if it suspects the PATH environment variable was
changed.

Here is a smallish program demonstrating the slowdown before this code
change:

```
use std::process::Command;
use std::time::Instant;

fn main() {
    let mut args = std::env::args().skip(1);
    if let Some(size) = args.next() {
        // Allocate some memory
        let _xs: Vec<_> = std::iter::repeat(0)
            .take(size.parse().expect("valid number"))
            .collect();

        let mut command = Command::new("/bin/sh");
        command
            .arg("-c")
            .arg("echo hello");

        if args.next().is_some() {
            println!("Overriding PATH");
            command.env("PATH", std::env::var("PATH").expect("PATH env var"));
        }

        let now = Instant::now();
        let child = command
            .spawn()
            .expect("failed to execute process");

        println!("Spawn took: {:?}", now.elapsed());

        let output = child.wait_with_output().expect("failed to wait on process");
        println!("Output: {:?}", output);
    } else {
        eprintln!("Usage: prog [size]");
        std::process::exit(1);
    }
    ()
}
```

Running it and passing different amounts of elements to use to allocate
memory shows that the time taken for `spawn()` can differ quite
significantly. In the latter case the `posix_spawnp()` implementation is 30x
faster:

```
$ cargo run --release 10000000
...
Spawn took: 324.275µs
hello
$ cargo run --release 10000000 changepath
...
Overriding PATH
Spawn took: 2.346809ms
hello
$ cargo run --release 100000000
...
Spawn took: 387.842µs
hello
$ cargo run --release 100000000 changepath
...
Overriding PATH
Spawn took: 13.434677ms
hello
```

[1]: https://github.com/bminor/glibc/blob/5f72f9800b250410cad3abfeeb09469ef12b2438/posix/execvpe.c#L81

											
										
										
											2020-10-02 07:44:32 -07:00
+								            || (self.env_saw_path() && !self.program_is_path())
-												Fix clippy::len_zero warnings

											
										
										
											2019-07-18 14:22:22 +02:00
+								            || !self.get_closures().is_empty()
-												Add setgroups to std::os::unix::process::CommandExt

											
										
										
											2020-06-15 21:39:34 -07:00
+								            || self.get_groups().is_some()
-												Add PidFd type and seal traits

Improve docs

Split do_fork into two

Make do_fork unsafe

Add target attribute to create_pidfd field in Command

Add method to get create_pidfd value

											
										
										
											2021-02-06 14:15:49 +01:00
+								            || self.get_create_pidfd()
-												Fix clippy::len_zero warnings

											
										
										
											2019-07-18 14:22:22 +02:00
+								        {
-												Support posix_spawn() when possible.

											
										
										
											2018-01-25 18:13:45 -08:00
+								            return Ok(None);
 								        }
-												Support posix_spawn() for Linux glibc 2.24+.

The relevant support was added in https://sourceware.org/bugzilla/show_bug.cgi?id=10354#c12

											
										
										
											2018-03-02 13:02:38 -08:00
+								        // Only glibc 2.24+ posix_spawn() supports returning ENOENT directly.
 								        #[cfg(all(target_os = "linux", target_env = "gnu"))]
 								        {
 								            if let Some(version) = sys::os::glibc_version() {
 								                if version < (2, 24) {
 								                    return Ok(None);
 								                }
 								            } else {
 								                return Ok(None);
 								            }
 								        }
-												Retry to spawn/fork up to 3 times when it failed because of an interruption

											
										
										
											2023-02-10 15:27:22 +01:00
+								        // On QNX Neutrino, posix_spawnp can fail with EBADF in case "another thread might have opened
 								        // or closed a file descriptor while the posix_spawn() was occurring".
 								        // Documentation says "... or try calling posix_spawn() again". This is what we do here.
 								        // See also http://www.qnx.com/developers/docs/7.1/#com.qnx.doc.neutrino.lib_ref/topic/p/posix_spawn.html
 								        #[cfg(all(target_os = "nto", target_env = "nto71"))]
 								        unsafe fn retrying_libc_posix_spawnp(
 								            pid: *mut pid_t,
 								            file: *const c_char,
 								            file_actions: *const posix_spawn_file_actions_t,
 								            attrp: *const posix_spawnattr_t,
 								            argv: *const *mut c_char,
 								            envp: *const *mut c_char,
-												Only determine clock res once; give up before sleeping more than 1 second

											
										
										
											2023-06-02 17:52:14 +02:00
+								        ) -> io::Result<i32> {
-												Retry to fork/spawn with exponential backoff

											
										
										
											2023-03-18 18:45:51 +01:00
+								            let mut delay = MIN_FORKSPAWN_SLEEP;
-												Retry to spawn/fork up to 3 times when it failed because of an interruption

											
										
										
											2023-02-10 15:27:22 +01:00
+								            loop {
 								                match libc::posix_spawnp(pid, file, file_actions, attrp, argv, envp) {
-												Retry to fork/spawn with exponential backoff

											
										
										
											2023-03-18 18:45:51 +01:00
+								                    libc::EBADF => {
-												Only determine clock res once; give up before sleeping more than 1 second

											
										
										
											2023-06-02 17:52:14 +02:00
+								                        if delay < get_clock_resolution() {
-												Retry to fork/spawn with exponential backoff

											
										
										
											2023-03-18 18:45:51 +01:00
+								                            // We cannot sleep this short (it would be longer).
 								                            // Yield instead.
 								                            thread::yield_now();
-												Only determine clock res once; give up before sleeping more than 1 second

											
										
										
											2023-06-02 17:52:14 +02:00
+								                        } else if delay < MAX_FORKSPAWN_SLEEP {
-												Retry to fork/spawn with exponential backoff

											
										
										
											2023-03-18 18:45:51 +01:00
+								                            thread::sleep(delay);
-												Only determine clock res once; give up before sleeping more than 1 second

											
										
										
											2023-06-02 17:52:14 +02:00
+								                        } else {
 								                            return Err(io::const_io_error!(
 								                                ErrorKind::WouldBlock,
 								                                "posix_spawnp returned EBADF too often",
 								                            ));
-												Retry to fork/spawn with exponential backoff

											
										
										
											2023-03-18 18:45:51 +01:00
+								                        }
 								                        delay *= 2;
-												Retry to spawn/fork up to 3 times when it failed because of an interruption

											
										
										
											2023-02-10 15:27:22 +01:00
+								                        continue;
 								                    }
 								                    r => {
-												Only determine clock res once; give up before sleeping more than 1 second

											
										
										
											2023-06-02 17:52:14 +02:00
+								                        return Ok(r);
-												Retry to spawn/fork up to 3 times when it failed because of an interruption

											
										
										
											2023-02-10 15:27:22 +01:00
+								                    }
 								                }
 								            }
 								        }
-												Use posix_spawn on musl targets

The posix_spawn had been available in a form suitable for use in a
Command implementation since musl 0.9.12. Use it in a preference to a
fork when possible, to benefit from CLONE_VM|CLONE_VFORK used there.

											
										
										
											2020-10-01 00:00:00 +00:00
+								        // Solaris, glibc 2.29+, and musl 1.24+ can set a new working directory,
 								        // and maybe others will gain this non-POSIX function too. We'll check
 								        // for this weak symbol as soon as it's needed, so we can return early
 								        // otherwise to do a manual chdir before exec.
-												Use posix_spawn_file_actions_addchdir_np when possible

This is a non-POSIX extension implemented in Solaris and in glibc 2.29.
With this we can still use `posix_spawn()` when `Command::current_dir()`
has been set; otherwise we fall back to `fork(); chdir(); exec()`.

											
										
										
											2019-02-13 12:20:23 -08:00
+								        weak! {
 								            fn posix_spawn_file_actions_addchdir_np(
 								                *mut libc::posix_spawn_file_actions_t,
 								                *const libc::c_char
 								            ) -> libc::c_int
 								        }
 								        let addchdir = match self.get_cwd() {
-												Don't use posix_spawn_file_actions_addchdir_np on macOS.

											
										
										
											2020-12-30 14:56:51 -08:00
+								            Some(cwd) => {
-												Fix posix_spawn not being used on iOS and visionOS

`man posix_spawn` documents it to be able to return `ENOENT`, and there
should be nothing preventing this. Tested in the iOS simulator and on
Mac Catalyst.

											
										
										
											2024-04-28 22:34:51 +02:00
+								                if cfg!(target_vendor = "apple") {
-												Don't use posix_spawn_file_actions_addchdir_np on macOS.

											
										
										
											2020-12-30 14:56:51 -08:00
+								                    // There is a bug in macOS where a relative executable
 								                    // path like "../myprogram" will cause `posix_spawn` to
 								                    // successfully launch the program, but erroneously return
 								                    // ENOENT when used with posix_spawn_file_actions_addchdir_np
 								                    // which was introduced in macOS 10.15.
-												Use posix_spawn for absolute paths on macOS

Currently, on macOS, Rust never uses the fast posix_spawn path if a
directory change is requested due to a bug in Apple's libc. However, the
bug is only triggered if the program is a relative path.

This PR makes it so that the fast path continues to work if the program
is an absolute path or a lone filename.

This was an alternative proposed in
https://github.com/rust-lang/rust/pull/80537#issue-776674009, and it
makes a measurable performance difference in some of my code that spawns
thousands of processes.

											
										
										
											2022-08-19 18:24:21 -07:00
+								                    if self.get_program_kind() == ProgramKind::Relative {
 								                        return Ok(None);
 								                    }
-												Don't use posix_spawn_file_actions_addchdir_np on macOS.

											
										
										
											2020-12-30 14:56:51 -08:00
+								                }
 								                match posix_spawn_file_actions_addchdir_np.get() {
 								                    Some(f) => Some((f, cwd)),
 								                    None => return Ok(None),
 								                }
 								            }
-												Use posix_spawn_file_actions_addchdir_np when possible

This is a non-POSIX extension implemented in Solaris and in glibc 2.29.
With this we can still use `posix_spawn()` when `Command::current_dir()`
has been set; otherwise we fall back to `fork(); chdir(); exec()`.

											
										
										
											2019-02-13 12:20:23 -08:00
+								            None => None,
 								        };
-												Add a `process_group` method to UNIX `CommandExt`

											
										
										
											2022-02-03 09:40:45 +00:00
+								        let pgroup = self.get_pgroup();
-												Update PidFd for the new I/O safety APIs.

											
										
										
											2021-08-03 07:31:59 -05:00
+								        // Safety: -1 indicates we don't have a pidfd.
 								        let mut p = unsafe { Process::new(0, -1) };
-												Support posix_spawn() when possible.

											
										
										
											2018-01-25 18:13:45 -08:00
-												Check for errors returned from posix_spawn*_init functions

The posix_spawnattr_init & posix_spawn_file_actions_init might fail,
but their return code is not checked.

Check for non-zero return code and destroy only successfully initialized
objects.

											
										
										
											2020-10-08 00:00:00 +00:00
+								        struct PosixSpawnFileActions<'a>(&'a mut MaybeUninit<libc::posix_spawn_file_actions_t>);
-												Support posix_spawn() when possible.

											
										
										
											2018-01-25 18:13:45 -08:00
-												Check for errors returned from posix_spawn*_init functions

The posix_spawnattr_init & posix_spawn_file_actions_init might fail,
but their return code is not checked.

Check for non-zero return code and destroy only successfully initialized
objects.

											
										
										
											2020-10-08 00:00:00 +00:00
+								        impl Drop for PosixSpawnFileActions<'_> {
-												Support posix_spawn() when possible.

											
										
										
											2018-01-25 18:13:45 -08:00
+								            fn drop(&mut self) {
 								                unsafe {
-												Avoid mem::uninitialized() in std::sys::unix

For `libc` types that will be initialized in FFI calls, we can just use
`MaybeUninit` and then pass around raw pointers.

For `sun_path_offset()`, which really wants `offset_of`, all callers
have a real `sockaddr_un` available, so we can use that reference.

											
										
										
											2019-06-26 15:03:15 -07:00
+								                    libc::posix_spawn_file_actions_destroy(self.0.as_mut_ptr());
-												Support posix_spawn() when possible.

											
										
										
											2018-01-25 18:13:45 -08:00
+								                }
 								            }
 								        }
-												Check for errors returned from posix_spawn*_init functions

The posix_spawnattr_init & posix_spawn_file_actions_init might fail,
but their return code is not checked.

Check for non-zero return code and destroy only successfully initialized
objects.

											
										
										
											2020-10-08 00:00:00 +00:00
+								        struct PosixSpawnattr<'a>(&'a mut MaybeUninit<libc::posix_spawnattr_t>);
-												Support posix_spawn() when possible.

											
										
										
											2018-01-25 18:13:45 -08:00
-												Check for errors returned from posix_spawn*_init functions

The posix_spawnattr_init & posix_spawn_file_actions_init might fail,
but their return code is not checked.

Check for non-zero return code and destroy only successfully initialized
objects.

											
										
										
											2020-10-08 00:00:00 +00:00
+								        impl Drop for PosixSpawnattr<'_> {
-												Support posix_spawn() when possible.

											
										
										
											2018-01-25 18:13:45 -08:00
+								            fn drop(&mut self) {
 								                unsafe {
-												Avoid mem::uninitialized() in std::sys::unix

For `libc` types that will be initialized in FFI calls, we can just use
`MaybeUninit` and then pass around raw pointers.

For `sun_path_offset()`, which really wants `offset_of`, all callers
have a real `sockaddr_un` available, so we can use that reference.

											
										
										
											2019-06-26 15:03:15 -07:00
+								                    libc::posix_spawnattr_destroy(self.0.as_mut_ptr());
-												Support posix_spawn() when possible.

											
										
										
											2018-01-25 18:13:45 -08:00
+								                }
 								            }
 								        }
 								        unsafe {
-												Check for errors returned from posix_spawn*_init functions

The posix_spawnattr_init & posix_spawn_file_actions_init might fail,
but their return code is not checked.

Check for non-zero return code and destroy only successfully initialized
objects.

											
										
										
											2020-10-08 00:00:00 +00:00
+								            let mut attrs = MaybeUninit::uninit();
 								            cvt_nz(libc::posix_spawnattr_init(attrs.as_mut_ptr()))?;
 								            let attrs = PosixSpawnattr(&mut attrs);
-												Support posix_spawn() when possible.

											
										
										
											2018-01-25 18:13:45 -08:00
-												Add a `process_group` method to UNIX `CommandExt`

											
										
										
											2022-02-03 09:40:45 +00:00
+								            let mut flags = 0;
-												Check for errors returned from posix_spawn*_init functions

The posix_spawnattr_init & posix_spawn_file_actions_init might fail,
but their return code is not checked.

Check for non-zero return code and destroy only successfully initialized
objects.

											
										
										
											2020-10-08 00:00:00 +00:00
+								            let mut file_actions = MaybeUninit::uninit();
 								            cvt_nz(libc::posix_spawn_file_actions_init(file_actions.as_mut_ptr()))?;
 								            let file_actions = PosixSpawnFileActions(&mut file_actions);
-												Support posix_spawn() when possible.

											
										
										
											2018-01-25 18:13:45 -08:00
 								            if let Some(fd) = stdio.stdin.fd() {
-												Check for non-zero return value from posix_spawn functions

The cvt function compares the argument with -1 and when equal returns a new
io::Error constructed from errno. It is used together with posix_spawn_* functions.
This is incorrect. Those functions do not set errno. Instead they return
non-zero error code directly.

Check for non-zero return code and use it to construct a new io::Error.

											
										
										
											2020-10-08 00:00:00 +00:00
+								                cvt_nz(libc::posix_spawn_file_actions_adddup2(
-												Avoid mem::uninitialized() in std::sys::unix

For `libc` types that will be initialized in FFI calls, we can just use
`MaybeUninit` and then pass around raw pointers.

For `sun_path_offset()`, which really wants `offset_of`, all callers
have a real `sockaddr_un` available, so we can use that reference.

											
										
										
											2019-06-26 15:03:15 -07:00
+								                    file_actions.0.as_mut_ptr(),
-												Support posix_spawn() when possible.

											
										
										
											2018-01-25 18:13:45 -08:00
+								                    fd,
 								                    libc::STDIN_FILENO,
 								                ))?;
 								            }
 								            if let Some(fd) = stdio.stdout.fd() {
-												Check for non-zero return value from posix_spawn functions

The cvt function compares the argument with -1 and when equal returns a new
io::Error constructed from errno. It is used together with posix_spawn_* functions.
This is incorrect. Those functions do not set errno. Instead they return
non-zero error code directly.

Check for non-zero return code and use it to construct a new io::Error.

											
										
										
											2020-10-08 00:00:00 +00:00
+								                cvt_nz(libc::posix_spawn_file_actions_adddup2(
-												Avoid mem::uninitialized() in std::sys::unix

For `libc` types that will be initialized in FFI calls, we can just use
`MaybeUninit` and then pass around raw pointers.

For `sun_path_offset()`, which really wants `offset_of`, all callers
have a real `sockaddr_un` available, so we can use that reference.

											
										
										
											2019-06-26 15:03:15 -07:00
+								                    file_actions.0.as_mut_ptr(),
-												Support posix_spawn() when possible.

											
										
										
											2018-01-25 18:13:45 -08:00
+								                    fd,
 								                    libc::STDOUT_FILENO,
 								                ))?;
 								            }
 								            if let Some(fd) = stdio.stderr.fd() {
-												Check for non-zero return value from posix_spawn functions

The cvt function compares the argument with -1 and when equal returns a new
io::Error constructed from errno. It is used together with posix_spawn_* functions.
This is incorrect. Those functions do not set errno. Instead they return
non-zero error code directly.

Check for non-zero return code and use it to construct a new io::Error.

											
										
										
											2020-10-08 00:00:00 +00:00
+								                cvt_nz(libc::posix_spawn_file_actions_adddup2(
-												Avoid mem::uninitialized() in std::sys::unix

For `libc` types that will be initialized in FFI calls, we can just use
`MaybeUninit` and then pass around raw pointers.

For `sun_path_offset()`, which really wants `offset_of`, all callers
have a real `sockaddr_un` available, so we can use that reference.

											
										
										
											2019-06-26 15:03:15 -07:00
+								                    file_actions.0.as_mut_ptr(),
-												Support posix_spawn() when possible.

											
										
										
											2018-01-25 18:13:45 -08:00
+								                    fd,
 								                    libc::STDERR_FILENO,
 								                ))?;
 								            }
-												Use posix_spawn_file_actions_addchdir_np when possible

This is a non-POSIX extension implemented in Solaris and in glibc 2.29.
With this we can still use `posix_spawn()` when `Command::current_dir()`
has been set; otherwise we fall back to `fork(); chdir(); exec()`.

											
										
										
											2019-02-13 12:20:23 -08:00
+								            if let Some((f, cwd)) = addchdir {
-												Check for non-zero return value from posix_spawn functions

The cvt function compares the argument with -1 and when equal returns a new
io::Error constructed from errno. It is used together with posix_spawn_* functions.
This is incorrect. Those functions do not set errno. Instead they return
non-zero error code directly.

Check for non-zero return code and use it to construct a new io::Error.

											
										
										
											2020-10-08 00:00:00 +00:00
+								                cvt_nz(f(file_actions.0.as_mut_ptr(), cwd.as_ptr()))?;
-												Use posix_spawn_file_actions_addchdir_np when possible

This is a non-POSIX extension implemented in Solaris and in glibc 2.29.
With this we can still use `posix_spawn()` when `Command::current_dir()`
has been set; otherwise we fall back to `fork(); chdir(); exec()`.

											
										
										
											2019-02-13 12:20:23 -08:00
+								            }
-												Support posix_spawn() when possible.

											
										
										
											2018-01-25 18:13:45 -08:00
-												Add a `process_group` method to UNIX `CommandExt`

											
										
										
											2022-02-03 09:40:45 +00:00
+								            if let Some(pgroup) = pgroup {
 								                flags |= libc::POSIX_SPAWN_SETPGROUP;
 								                cvt_nz(libc::posix_spawnattr_setpgroup(attrs.0.as_mut_ptr(), pgroup))?;
 								            }
-												Change process spawning to inherit the parent's signal mask by default

Previously, the signal mask is always reset when a child process is
started. This breaks tools like `nohup` which expect `SIGHUP` to be
blocked.

With this change, the default behavior changes to inherit the signal mask.

This also changes the signal disposition for `SIGPIPE` to only be
changed if the `#[unix_sigpipe]` attribute isn't set.

											
										
										
											2022-09-22 22:48:14 -07:00
+								            // Inherit the signal mask from this process rather than resetting it (i.e. do not call
 								            // posix_spawnattr_setsigmask).
-												Change `SIGPIPE` ui from `#[unix_sigpipe = "..."]` to `-Zon-broken-pipe=...`

In the stabilization attempt of `#[unix_sigpipe = "sig_dfl"]`, a concern
was raised related to using a language attribute for the feature: Long
term, we want `fn lang_start()` to be definable by any crate, not just
libstd. Having a special language attribute in that case becomes
awkward.

So as a first step towards the next stabilization attempt, this
PR changes the `#[unix_sigpipe = "..."]` attribute to a compiler flag
`-Zon-broken-pipe=...` to remove that concern, since now the language
is not "contaminated" by this feature.

Another point was also raised, namely that the ui should not leak
**how** it does things, but rather what the **end effect** is. The new
flag uses the proposed naming. This is of course something that can be
iterated on further before stabilization.

											
										
										
											2024-04-28 18:02:21 +02:00
+								            // If -Zon-broken-pipe is used, don't reset SIGPIPE to SIG_DFL.
 								            // If -Zon-broken-pipe is not used, reset SIGPIPE to SIG_DFL for backward compatibility.
-												Change process spawning to inherit the parent's signal mask by default

Previously, the signal mask is always reset when a child process is
started. This breaks tools like `nohup` which expect `SIGHUP` to be
blocked.

With this change, the default behavior changes to inherit the signal mask.

This also changes the signal disposition for `SIGPIPE` to only be
changed if the `#[unix_sigpipe]` attribute isn't set.

											
										
										
											2022-09-22 22:48:14 -07:00
+								            //
-												Change `SIGPIPE` ui from `#[unix_sigpipe = "..."]` to `-Zon-broken-pipe=...`

In the stabilization attempt of `#[unix_sigpipe = "sig_dfl"]`, a concern
was raised related to using a language attribute for the feature: Long
term, we want `fn lang_start()` to be definable by any crate, not just
libstd. Having a special language attribute in that case becomes
awkward.

So as a first step towards the next stabilization attempt, this
PR changes the `#[unix_sigpipe = "..."]` attribute to a compiler flag
`-Zon-broken-pipe=...` to remove that concern, since now the language
is not "contaminated" by this feature.

Another point was also raised, namely that the ui should not leak
**how** it does things, but rather what the **end effect** is. The new
flag uses the proposed naming. This is of course something that can be
iterated on further before stabilization.

											
										
										
											2024-04-28 18:02:21 +02:00
+								            // -Zon-broken-pipe is an opportunity to change the default here.
 								            if !on_broken_pipe_flag_used() {
-												Change process spawning to inherit the parent's signal mask by default

Previously, the signal mask is always reset when a child process is
started. This breaks tools like `nohup` which expect `SIGHUP` to be
blocked.

With this change, the default behavior changes to inherit the signal mask.

This also changes the signal disposition for `SIGPIPE` to only be
changed if the `#[unix_sigpipe]` attribute isn't set.

											
										
										
											2022-09-22 22:48:14 -07:00
+								                let mut default_set = MaybeUninit::<libc::sigset_t>::uninit();
 								                cvt(sigemptyset(default_set.as_mut_ptr()))?;
 								                cvt(sigaddset(default_set.as_mut_ptr(), libc::SIGPIPE))?;
-												added support for GNU/Hurd

											
										
										
											2023-09-19 12:41:30 +02:00
+								                #[cfg(target_os = "hurd")]
 								                {
 								                    cvt(sigaddset(default_set.as_mut_ptr(), libc::SIGLOST))?;
 								                }
-												Change process spawning to inherit the parent's signal mask by default

Previously, the signal mask is always reset when a child process is
started. This breaks tools like `nohup` which expect `SIGHUP` to be
blocked.

With this change, the default behavior changes to inherit the signal mask.

This also changes the signal disposition for `SIGPIPE` to only be
changed if the `#[unix_sigpipe]` attribute isn't set.

											
										
										
											2022-09-22 22:48:14 -07:00
+								                cvt_nz(libc::posix_spawnattr_setsigdefault(
 								                    attrs.0.as_mut_ptr(),
 								                    default_set.as_ptr(),
 								                ))?;
 								                flags |= libc::POSIX_SPAWN_SETSIGDEF;
 								            }
-												Support posix_spawn() when possible.

											
										
										
											2018-01-25 18:13:45 -08:00
-												Check for non-zero return value from posix_spawn functions

The cvt function compares the argument with -1 and when equal returns a new
io::Error constructed from errno. It is used together with posix_spawn_* functions.
This is incorrect. Those functions do not set errno. Instead they return
non-zero error code directly.

Check for non-zero return code and use it to construct a new io::Error.

											
										
										
											2020-10-08 00:00:00 +00:00
+								            cvt_nz(libc::posix_spawnattr_setflags(attrs.0.as_mut_ptr(), flags as _))?;
-												Support posix_spawn() when possible.

											
										
										
											2018-01-25 18:13:45 -08:00
-												std: Synchronize access to global env during `exec`

This commit, after reverting #55359, applies a different fix for #46775
while also fixing #55775. The basic idea was to go back to pre-#55359
libstd, and then fix #46775 in a way that doesn't expose #55775.

The issue described in #46775 boils down to two problems:

* First, the global environment is reset during `exec`, but if the
  `exec` call fails then the global environment was a dangling pointer
  into free'd memory as the block of memory was deallocated when
  `Command` is dropped. This is fixed in this commit by installing a
  `Drop` stack object which ensures that the `environ` pointer is
  preserved on a failing `exec`.

* Second, the global environment was accessed in an unsynchronized
  fashion during `exec`. This was fixed by ensuring that the
  Rust-specific environment lock is acquired for these system-level
  operations.

Thanks to Alex Gaynor for pioneering the solution here!

Closes #55775

Co-authored-by: Alex Gaynor <alex.gaynor@gmail.com>

											
										
										
											2018-11-13 14:57:10 -08:00
+								            // Make sure we synchronize access to the global `environ` resource
-												Revert "Revert "use RWlock when accessing os::env #81850""

This reverts commit acdca316c3d42299d31c1b47eb792006ffdfc29c.

											
										
										
											2021-03-14 19:10:34 +01:00
+								            let _env_lock = sys::os::env_read_lock();
-												Prefer unwrap_or_else to unwrap_or in case of function calls/allocations

											
										
										
											2018-10-12 16:16:00 +02:00
+								            let envp = envp.map(|c| c.as_ptr()).unwrap_or_else(|| *sys::os::environ() as *const _);
-												Retry to spawn/fork up to 3 times when it failed because of an interruption

											
										
										
											2023-02-10 15:27:22 +01:00
 								            #[cfg(not(target_os = "nto"))]
 								            let spawn_fn = libc::posix_spawnp;
 								            #[cfg(target_os = "nto")]
 								            let spawn_fn = retrying_libc_posix_spawnp;
-												Only determine clock res once; give up before sleeping more than 1 second

											
										
										
											2023-06-02 17:52:14 +02:00
 								            let spawn_res = spawn_fn(
-												Support posix_spawn() when possible.

											
										
										
											2018-01-25 18:13:45 -08:00
+								                &mut p.pid,
-												Add accessors to Command.

											
										
										
											2020-09-21 11:32:06 -07:00
+								                self.get_program_cstr().as_ptr(),
-												Avoid mem::uninitialized() in std::sys::unix

For `libc` types that will be initialized in FFI calls, we can just use
`MaybeUninit` and then pass around raw pointers.

For `sun_path_offset()`, which really wants `offset_of`, all callers
have a real `sockaddr_un` available, so we can use that reference.

											
										
										
											2019-06-26 15:03:15 -07:00
+								                file_actions.0.as_ptr(),
 								                attrs.0.as_ptr(),
-												Support posix_spawn() when possible.

											
										
										
											2018-01-25 18:13:45 -08:00
+								                self.get_argv().as_ptr() as *const _,
 								                envp as *const _,
-												Only determine clock res once; give up before sleeping more than 1 second

											
										
										
											2023-06-02 17:52:14 +02:00
+								            );
 								            #[cfg(target_os = "nto")]
 								            let spawn_res = spawn_res?;
 								            cvt_nz(spawn_res)?;
-												Check for non-zero return value from posix_spawn functions

The cvt function compares the argument with -1 and when equal returns a new
io::Error constructed from errno. It is used together with the posix_spawn_* functions.
This is incorrect. Those functions do not set errno. Instead they return
non-zero error code directly.

Check for non-zero return code and use it to construct a new io::Error.

											
										
										
											2020-10-08 00:00:00 +00:00
+								            Ok(Some(p))
-												Support posix_spawn() when possible.

											
										
										
											2018-01-25 18:13:45 -08:00
+								        }
 								    }
-												open pidfd in child process and send to the parent via SOCK_SEQPACKET+CMSG

This is a 100% race-free way to obtain a child's pidfd while
avoiding `clone3`.

											
										
										
											2023-07-22 02:30:13 +02:00
 								    #[cfg(target_os = "linux")]
 								    fn send_pidfd(&self, sock: &crate::sys::net::Socket) {
 								        use crate::io::IoSlice;
 								        use crate::os::fd::RawFd;
 								        use crate::sys::cvt_r;
 								        use libc::{CMSG_DATA, CMSG_FIRSTHDR, CMSG_LEN, CMSG_SPACE, SCM_RIGHTS, SOL_SOCKET};
 								        unsafe {
 								            let child_pid = libc::getpid();
 								            // pidfd_open sets CLOEXEC by default
 								            let pidfd = libc::syscall(libc::SYS_pidfd_open, child_pid, 0);
 								            let fds: [c_int; 1] = [pidfd as RawFd];
 								            const SCM_MSG_LEN: usize = mem::size_of::<[c_int; 1]>();
 								            #[repr(C)]
 								            union Cmsg {
 								                buf: [u8; unsafe { CMSG_SPACE(SCM_MSG_LEN as u32) as usize }],
 								                _align: libc::cmsghdr,
 								            }
 								            let mut cmsg: Cmsg = mem::zeroed();
 								            // 0-length message to send through the socket so we can pass along the fd
 								            let mut iov = [IoSlice::new(b"")];
 								            let mut msg: libc::msghdr = mem::zeroed();
-												library: use `addr_of!`

											
										
										
											2024-02-24 16:02:17 +03:00
+								            msg.msg_iov = core::ptr::addr_of_mut!(iov) as *mut _;
-												open pidfd in child process and send to the parent via SOCK_SEQPACKET+CMSG

This is a 100% race-free way to obtain a child's pidfd while
avoiding `clone3`.

											
										
										
											2023-07-22 02:30:13 +02:00
+								            msg.msg_iovlen = 1;
 								            // only attach cmsg if we successfully acquired the pidfd
 								            if pidfd >= 0 {
-												Don't set cmsg fields in msghdr if we have no cmsg to send

											
										
										
											2023-11-19 15:19:47 +01:00
+								                msg.msg_controllen = mem::size_of_val(&cmsg.buf) as _;
-												library: use `addr_of!`

											
										
										
											2024-02-24 16:02:17 +03:00
+								                msg.msg_control = core::ptr::addr_of_mut!(cmsg.buf) as *mut _;
-												Don't set cmsg fields in msghdr if we have no cmsg to send

											
										
										
											2023-11-19 15:19:47 +01:00
-												library: use `addr_of!`

											
										
										
											2024-02-24 16:02:17 +03:00
+								                let hdr = CMSG_FIRSTHDR(core::ptr::addr_of_mut!(msg) as *mut _);
-												open pidfd in child process and send to the parent via SOCK_SEQPACKET+CMSG

This is a 100% race-free way to obtain a child's pidfd while
avoiding `clone3`.

											
										
										
											2023-07-22 02:30:13 +02:00
+								                (*hdr).cmsg_level = SOL_SOCKET;
 								                (*hdr).cmsg_type = SCM_RIGHTS;
 								                (*hdr).cmsg_len = CMSG_LEN(SCM_MSG_LEN as _) as _;
 								                let data = CMSG_DATA(hdr);
 								                crate::ptr::copy_nonoverlapping(
 								                    fds.as_ptr().cast::<u8>(),
 								                    data as *mut _,
 								                    SCM_MSG_LEN,
 								                );
 								            }
 								            // we send the 0-length message even if we failed to acquire the pidfd
 								            // so we get a consistent SEQPACKET order
 								            match cvt_r(|| libc::sendmsg(sock.as_raw(), &msg, 0)) {
 								                Ok(0) => {}
-												Don't set cmsg fields in msghdr if we have no cmsg to send

											
										
										
											2023-11-19 15:19:47 +01:00
+								                other => rtabort!("failed to communicate with parent process. {:?}", other),
-												open pidfd in child process and send to the parent via SOCK_SEQPACKET+CMSG

This is a 100% race-free way to obtain a child's pidfd while
avoiding `clone3`.

											
										
										
											2023-07-22 02:30:13 +02:00
+								            }
 								        }
 								    }
 								    #[cfg(target_os = "linux")]
 								    fn recv_pidfd(&self, sock: &crate::sys::net::Socket) -> pid_t {
 								        use crate::io::IoSliceMut;
 								        use crate::sys::cvt_r;
 								        use libc::{CMSG_DATA, CMSG_FIRSTHDR, CMSG_LEN, CMSG_SPACE, SCM_RIGHTS, SOL_SOCKET};
 								        unsafe {
 								            const SCM_MSG_LEN: usize = mem::size_of::<[c_int; 1]>();
 								            #[repr(C)]
 								            union Cmsg {
 								                _buf: [u8; unsafe { CMSG_SPACE(SCM_MSG_LEN as u32) as usize }],
 								                _align: libc::cmsghdr,
 								            }
 								            let mut cmsg: Cmsg = mem::zeroed();
 								            // 0-length read to get the fd
 								            let mut iov = [IoSliceMut::new(&mut [])];
 								            let mut msg: libc::msghdr = mem::zeroed();
-												library: use `addr_of!`

											
										
										
											2024-02-24 16:02:17 +03:00
+								            msg.msg_iov = core::ptr::addr_of_mut!(iov) as *mut _;
-												open pidfd in child process and send to the parent via SOCK_SEQPACKET+CMSG

This is a 100% race-free way to obtain a child's pidfd while
avoiding `clone3`.

											
										
										
											2023-07-22 02:30:13 +02:00
+								            msg.msg_iovlen = 1;
 								            msg.msg_controllen = mem::size_of::<Cmsg>() as _;
-												library: use `addr_of!`

											
										
										
											2024-02-24 16:02:17 +03:00
+								            msg.msg_control = core::ptr::addr_of_mut!(cmsg) as *mut _;
-												open pidfd in child process and send to the parent via SOCK_SEQPACKET+CMSG

This is a 100% race-free way to obtain a child's pidfd while
avoiding `clone3`.

											
										
										
											2023-07-22 02:30:13 +02:00
-												set CLOEXEC on pidfd received from child process

											
										
										
											2023-11-16 01:35:51 +01:00
+								            match cvt_r(|| libc::recvmsg(sock.as_raw(), &mut msg, libc::MSG_CMSG_CLOEXEC)) {
-												open pidfd in child process and send to the parent via SOCK_SEQPACKET+CMSG

This is a 100% race-free way to obtain a child's pidfd while
avoiding `clone3`.

											
										
										
											2023-07-22 02:30:13 +02:00
+								                Err(_) => return -1,
 								                Ok(_) => {}
 								            }
-												library: use `addr_of!`

											
										
										
											2024-02-24 16:02:17 +03:00
+								            let hdr = CMSG_FIRSTHDR(core::ptr::addr_of_mut!(msg) as *mut _);
-												open pidfd in child process and send to the parent via SOCK_SEQPACKET+CMSG

This is a 100% race-free way to obtain a child's pidfd while
avoiding `clone3`.

											
										
										
											2023-07-22 02:30:13 +02:00
+								            if hdr.is_null()
 								                || (*hdr).cmsg_level != SOL_SOCKET
 								                || (*hdr).cmsg_type != SCM_RIGHTS
 								                || (*hdr).cmsg_len != CMSG_LEN(SCM_MSG_LEN as _) as _
 								            {
 								                return -1;
 								            }
 								            let data = CMSG_DATA(hdr);
 								            let mut fds = [-1 as c_int];
 								            crate::ptr::copy_nonoverlapping(
 								                data as *const _,
 								                fds.as_mut_ptr().cast::<u8>(),
 								                SCM_MSG_LEN,
 								            );
 								            fds[0]
 								        }
 								    }
-												Separated fuchsia-specific process stuff into 'process_fuchsia.rs' and refactored out some now-duplicated code into a 'process_common.rs'

											
										
										
											2016-11-23 13:58:13 -08:00
+								}
 								////////////////////////////////////////////////////////////////////////////////
 								// Processes
 								////////////////////////////////////////////////////////////////////////////////
-												libs: doc comments

											
										
										
											2019-02-09 22:16:58 +00:00
+								/// The unique ID of the process (this should never be negative).
-												Separated fuchsia-specific process stuff into 'process_fuchsia.rs' and refactored out some now-duplicated code into a 'process_common.rs'

											
										
										
											2016-11-23 13:58:13 -08:00
+								pub struct Process {
 								    pid: pid_t,
 								    status: Option<ExitStatus>,
-												Add Linux-specific pidfd process extensions

Background:

Over the last year, pidfd support was added to the Linux kernel. This
allows interacting with other processes. In particular, this allows
waiting on a child process with a timeout in a race-free way, bypassing
all of the awful signal-handler tricks that are usually required.

Pidfds can be obtained for a child process (as well as any other
process) via the `pidfd_open` syscall. Unfortunately, this requires
several conditions to hold in order to be race-free (i.e. the pid is not
reused).
Per `man pidfd_open`:

```
· the disposition of SIGCHLD has not been explicitly set to SIG_IGN
 (see sigaction(2));

· the SA_NOCLDWAIT flag was not specified while establishing a han‐
 dler for SIGCHLD or while setting the disposition of that signal to
 SIG_DFL (see sigaction(2)); and

· the zombie process was not reaped elsewhere in the program (e.g.,
 either by an asynchronously executed signal handler or by wait(2)
 or similar in another thread).

If any of these conditions does not hold, then the child process
(along with a PID file descriptor that refers to it) should instead
be created using clone(2) with the CLONE_PIDFD flag.
```

Sadly, these conditions are impossible to guarantee once any libraries
are used. For example, C code running in a different thread could call
`wait()`, which is impossible to detect from Rust code trying to open a
pidfd.

While pid reuse issues should (hopefully) be rare in practice, we can do
better. By passing the `CLONE_PIDFD` flag to `clone()` or `clone3()`, we
can obtain a pidfd for the child process in a guaranteed race-free
manner.

This PR:

This PR adds Linux-specific process extension methods to allow obtaining
pidfds for processes spawned via the standard `Command` API. Other than
being made available to user code, the standard library does not make
use of these pidfds in any way. In particular, the implementation of
`Child::wait` is completely unchanged.

Two Linux-specific helper methods are added: `CommandExt::create_pidfd`
and `ChildExt::pidfd`. These methods are intended to serve as a building
block for libraries to build higher-level abstractions - in particular,
waiting on a process with a timeout.

I've included a basic test, which verifies that pidfds are created iff
the `create_pidfd` method is used. This test is somewhat special - it
should always succeed on systems with the `clone3` system call
available, and always fail on systems without `clone3` available. I'm
not sure how to best ensure this programmatically.

This PR relies on the newer `clone3` system call to pass `CLONE_PIDFD`,
rather than the older `clone` system call. `clone3` was added to Linux
in the same release as pidfds, so this shouldn't unnecessarily limit the
kernel versions that this code supports.

Unresolved questions:
* What should the name of the feature gate be for these newly added
  methods?
* Should the `pidfd` method distinguish between an error occurring
  and `create_pidfd` not being called?

											
										
										
											2020-09-15 23:35:08 -04:00
+								    // On Linux, stores the pidfd created for this child.
-												Add PidFd type and seal traits

Improve docs

Split do_fork into two

Make do_fork unsafe

Add target attribute to create_pidfd field in Command

Add method to get create_pidfd value

											
										
										
											2021-02-06 14:15:49 +01:00
+								    // This is None if the user did not request pidfd creation,
-												Add Linux-specific pidfd process extensions

Background:

Over the last year, pidfd support was added to the Linux kernel. This
allows interacting with other processes. In particular, this allows
waiting on a child process with a timeout in a race-free way, bypassing
all of the awful signal-handler tricks that are usually required.

Pidfds can be obtained for a child process (as well as any other
process) via the `pidfd_open` syscall. Unfortunately, this requires
several conditions to hold in order to be race-free (i.e. the pid is not
reused).
Per `man pidfd_open`:

```
· the disposition of SIGCHLD has not been explicitly set to SIG_IGN
 (see sigaction(2));

· the SA_NOCLDWAIT flag was not specified while establishing a han‐
 dler for SIGCHLD or while setting the disposition of that signal to
 SIG_DFL (see sigaction(2)); and

· the zombie process was not reaped elsewhere in the program (e.g.,
 either by an asynchronously executed signal handler or by wait(2)
 or similar in another thread).

If any of these conditions does not hold, then the child process
(along with a PID file descriptor that refers to it) should instead
be created using clone(2) with the CLONE_PIDFD flag.
```

Sadly, these conditions are impossible to guarantee once any libraries
are used. For example, C code running in a different thread could call
`wait()`, which is impossible to detect from Rust code trying to open a
pidfd.

While pid reuse issues should (hopefully) be rare in practice, we can do
better. By passing the `CLONE_PIDFD` flag to `clone()` or `clone3()`, we
can obtain a pidfd for the child process in a guaranteed race-free
manner.

This PR:

This PR adds Linux-specific process extension methods to allow obtaining
pidfds for processes spawned via the standard `Command` API. Other than
being made available to user code, the standard library does not make
use of these pidfds in any way. In particular, the implementation of
`Child::wait` is completely unchanged.

Two Linux-specific helper methods are added: `CommandExt::create_pidfd`
and `ChildExt::pidfd`. These methods are intended to serve as a building
block for libraries to build higher-level abstractions - in particular,
waiting on a process with a timeout.

I've included a basic test, which verifies that pidfds are created iff
the `create_pidfd` method is used. This test is somewhat special - it
should always succeed on systems with the `clone3` system call
available, and always fail on systems without `clone3` available. I'm
not sure how to best ensure this programmatically.

This PR relies on the newer `clone3` system call to pass `CLONE_PIDFD`,
rather than the older `clone` system call. `clone3` was added to Linux
in the same release as pidfds, so this shouldn't unnecessarily limit the
kernel versions that this code supports.

Unresolved questions:
* What should the name of the feature gate be for these newly added
  methods?
* Should the `pidfd` method distinguish between an error occurring
  and `create_pidfd` not being called?

											
										
										
											2020-09-15 23:35:08 -04:00
+								    // or if the pidfd could not be created for some reason
-												update comment, we're currently using a different syscall

											
										
										
											2023-11-16 01:38:59 +01:00
+								    // (e.g. the `pidfd_open` syscall was not available).
-												Add Linux-specific pidfd process extensions

Background:

Over the last year, pidfd support was added to the Linux kernel. This
allows interacting with other processes. In particular, this allows
waiting on a child process with a timeout in a race-free way, bypassing
all of the awful signal-handler tricks that are usually required.

Pidfds can be obtained for a child process (as well as any other
process) via the `pidfd_open` syscall. Unfortunately, this requires
several conditions to hold in order to be race-free (i.e. the pid is not
reused).
Per `man pidfd_open`:

```
· the disposition of SIGCHLD has not been explicitly set to SIG_IGN
 (see sigaction(2));

· the SA_NOCLDWAIT flag was not specified while establishing a han‐
 dler for SIGCHLD or while setting the disposition of that signal to
 SIG_DFL (see sigaction(2)); and

· the zombie process was not reaped elsewhere in the program (e.g.,
 either by an asynchronously executed signal handler or by wait(2)
 or similar in another thread).

If any of these conditions does not hold, then the child process
(along with a PID file descriptor that refers to it) should instead
be created using clone(2) with the CLONE_PIDFD flag.
```

Sadly, these conditions are impossible to guarantee once any libraries
are used. For example, C code running in a different thread could call
`wait()`, which is impossible to detect from Rust code trying to open a
pidfd.

While pid reuse issues should (hopefully) be rare in practice, we can do
better. By passing the `CLONE_PIDFD` flag to `clone()` or `clone3()`, we
can obtain a pidfd for the child process in a guaranteed race-free
manner.

This PR:

This PR adds Linux-specific process extension methods to allow obtaining
pidfds for processes spawned via the standard `Command` API. Other than
being made available to user code, the standard library does not make
use of these pidfds in any way. In particular, the implementation of
`Child::wait` is completely unchanged.

Two Linux-specific helper methods are added: `CommandExt::create_pidfd`
and `ChildExt::pidfd`. These methods are intended to serve as a building
block for libraries to build higher-level abstractions - in particular,
waiting on a process with a timeout.

I've included a basic test, which verifies that pidfds are created iff
the `create_pidfd` method is used. This test is somewhat special - it
should always succeed on systems with the `clone3` system call
available, and always fail on systems without `clone3` available. I'm
not sure how to best ensure this programmatically.

This PR relies on the newer `clone3` system call to pass `CLONE_PIDFD`,
rather than the older `clone` system call. `clone3` was added to Linux
in the same release as pidfds, so this shouldn't unnecessarily limit the
kernel versions that this code supports.

Unresolved questions:
* What should the name of the feature gate be for these newly added
  methods?
* Should the `pidfd` method distinguish between an error occurring
  and `create_pidfd` not being called?

											
										
										
											2020-09-15 23:35:08 -04:00
+								    #[cfg(target_os = "linux")]
-												Add PidFd type and seal traits

Improve docs

Split do_fork into two

Make do_fork unsafe

Add target attribute to create_pidfd field in Command

Add method to get create_pidfd value

											
										
										
											2021-02-06 14:15:49 +01:00
+								    pidfd: Option<PidFd>,
-												Separated fuchsia-specific process stuff into 'process_fuchsia.rs' and refactored out some now-duplicated code into a 'process_common.rs'

											
										
										
											2016-11-23 13:58:13 -08:00
+								}
 								impl Process {
-												Add PidFd type and seal traits

Improve docs

Split do_fork into two

Make do_fork unsafe

Add target attribute to create_pidfd field in Command

Add method to get create_pidfd value

											
										
										
											2021-02-06 14:15:49 +01:00
+								    #[cfg(target_os = "linux")]
-												Update PidFd for the new I/O safety APIs.

											
										
										
											2021-08-03 07:31:59 -05:00
+								    unsafe fn new(pid: pid_t, pidfd: pid_t) -> Self {
-												Fix an unused import warning.

											
										
										
											2021-08-04 07:58:06 -05:00
+								        use crate::os::unix::io::FromRawFd;
-												Add PidFd type and seal traits

Improve docs

Split do_fork into two

Make do_fork unsafe

Add target attribute to create_pidfd field in Command

Add method to get create_pidfd value

											
										
										
											2021-02-06 14:15:49 +01:00
+								        use crate::sys_common::FromInner;
-												Update PidFd for the new I/O safety APIs.

											
										
										
											2021-08-03 07:31:59 -05:00
+								        // Safety: If `pidfd` is nonnegative, we assume it's valid and otherwise unowned.
-												Remove unnecessary unsafe block in `process_unix`

											
										
										
											2021-08-24 10:07:16 +02:00
+								        let pidfd = (pidfd >= 0).then(|| PidFd::from_inner(sys::fd::FileDesc::from_raw_fd(pidfd)));
-												Add PidFd type and seal traits

Improve docs

Split do_fork into two

Make do_fork unsafe

Add target attribute to create_pidfd field in Command

Add method to get create_pidfd value

											
										
										
											2021-02-06 14:15:49 +01:00
+								        Process { pid, status: None, pidfd }
 								    }
 								    #[cfg(not(target_os = "linux"))]
-												Update PidFd for the new I/O safety APIs.

											
										
										
											2021-08-03 07:31:59 -05:00
+								    unsafe fn new(pid: pid_t, _pidfd: pid_t) -> Self {
-												Add PidFd type and seal traits

Improve docs

Split do_fork into two

Make do_fork unsafe

Add target attribute to create_pidfd field in Command

Add method to get create_pidfd value

											
										
										
											2021-02-06 14:15:49 +01:00
+								        Process { pid, status: None }
 								    }
-												Separated fuchsia-specific process stuff into 'process_fuchsia.rs' and refactored out some now-duplicated code into a 'process_common.rs'

											
										
										
											2016-11-23 13:58:13 -08:00
+								    pub fn id(&self) -> u32 {
 								        self.pid as u32
 								    }
 								    pub fn kill(&mut self) -> io::Result<()> {
 								        // If we've already waited on this process then the pid can be recycled
 								        // and used for another process, and we probably shouldn't be killing
-												Return `Ok` on kill if process has already exited

											
										
										
											2023-06-13 20:32:31 +01:00
+								        // random processes, so return Ok because the process has exited already.
-												Separated fuchsia-specific process stuff into 'process_fuchsia.rs' and refactored out some now-duplicated code into a 'process_common.rs'

											
										
										
											2016-11-23 13:58:13 -08:00
+								        if self.status.is_some() {
-												if available use a Child's pidfd for kill/wait

											
										
										
											2023-11-16 01:41:02 +01:00
+								            return Ok(());
 								        }
 								        #[cfg(target_os = "linux")]
 								        if let Some(pid_fd) = self.pidfd.as_ref() {
 								            // pidfd_send_signal predates pidfd_open. so if we were able to get an fd then sending signals will work too
-												Add PidFd::{kill, wait, try_wait}

											
										
										
											2024-04-18 01:51:06 +02:00
+								            return pid_fd.kill();
-												Separated fuchsia-specific process stuff into 'process_fuchsia.rs' and refactored out some now-duplicated code into a 'process_common.rs'

											
										
										
											2016-11-23 13:58:13 -08:00
+								        }
-												if available use a Child's pidfd for kill/wait

											
										
										
											2023-11-16 01:41:02 +01:00
+								        cvt(unsafe { libc::kill(self.pid, libc::SIGKILL) }).map(drop)
-												Separated fuchsia-specific process stuff into 'process_fuchsia.rs' and refactored out some now-duplicated code into a 'process_common.rs'

											
										
										
											2016-11-23 13:58:13 -08:00
+								    }
-												std: Add a nonblocking `Child::try_wait` method

This commit adds a new method to the `Child` type in the `std::process` module
called `try_wait`. This method is the same as `wait` except that it will not
block the calling thread and instead only attempt to collect the exit status. On
Unix this means that we call `waitpid` with the `WNOHANG` flag and on Windows it
just means that we pass a 0 timeout to `WaitForSingleObject`.

Currently it's possible to build this method out of tree, but it's unfortunately
tricky to do so. Specifically on Unix you essentially lose ownership of the pid
for the process once a call to `waitpid` has succeeded. Although `Child` tracks
this state internally to be resilient to multiple calls to `wait` or a `kill`
after a successful wait, if the child is waited on externally then the state
inside of `Child` is not updated. This means that external implementations of
this method must be extra careful to essentially not use a `Child`'s methods
after a call to `waitpid` has succeeded (even in a nonblocking fashion).

By adding this functionality to the standard library it should help canonicalize
these external implementations and ensure they can continue to robustly reuse
the `Child` type from the standard library without worrying about pid ownership.

											
										
										
											2017-01-05 22:47:09 -08:00
-												Separated fuchsia-specific process stuff into 'process_fuchsia.rs' and refactored out some now-duplicated code into a 'process_common.rs'

											
										
										
											2016-11-23 13:58:13 -08:00
+								    pub fn wait(&mut self) -> io::Result<ExitStatus> {
-												libstd => 2018

											
										
										
											2019-02-11 04:23:21 +09:00
+								        use crate::sys::cvt_r;
-												Separated fuchsia-specific process stuff into 'process_fuchsia.rs' and refactored out some now-duplicated code into a 'process_common.rs'

											
										
										
											2016-11-23 13:58:13 -08:00
+								        if let Some(status) = self.status {
 								            return Ok(status);
 								        }
-												if available use a Child's pidfd for kill/wait

											
										
										
											2023-11-16 01:41:02 +01:00
+								        #[cfg(target_os = "linux")]
 								        if let Some(pid_fd) = self.pidfd.as_ref() {
-												Add PidFd::{kill, wait, try_wait}

											
										
										
											2024-04-18 01:51:06 +02:00
+								            let status = pid_fd.wait()?;
-												if available use a Child's pidfd for kill/wait

											
										
										
											2023-11-16 01:41:02 +01:00
+								            self.status = Some(status);
 								            return Ok(status);
 								        }
-												Separated fuchsia-specific process stuff into 'process_fuchsia.rs' and refactored out some now-duplicated code into a 'process_common.rs'

											
										
										
											2016-11-23 13:58:13 -08:00
+								        let mut status = 0 as c_int;
 								        cvt_r(|| unsafe { libc::waitpid(self.pid, &mut status, 0) })?;
 								        self.status = Some(ExitStatus::new(status));
 								        Ok(ExitStatus::new(status))
 								    }
-												std: Add a nonblocking `Child::try_wait` method

This commit adds a new method to the `Child` type in the `std::process` module
called `try_wait`. This method is the same as `wait` except that it will not
block the calling thread and instead only attempt to collect the exit status. On
Unix this means that we call `waitpid` with the `WNOHANG` flag and on Windows it
just means that we pass a 0 timeout to `WaitForSingleObject`.

Currently it's possible to build this method out of tree, but it's unfortunately
tricky to do so. Specifically on Unix you essentially lose ownership of the pid
for the process once a call to `waitpid` has succeeded. Although `Child` tracks
this state internally to be resilient to multiple calls to `wait` or a `kill`
after a successful wait, if the child is waited on externally then the state
inside of `Child` is not updated. This means that external implementations of
this method must be extra careful to essentially not use a `Child`'s methods
after a call to `waitpid` has succeeded (even in a nonblocking fashion).

By adding this functionality to the standard library it should help canonicalize
these external implementations and ensure they can continue to robustly reuse
the `Child` type from the standard library without worrying about pid ownership.

											
										
										
											2017-01-05 22:47:09 -08:00
-												make Child::try_wait return io::Result<Option<ExitStatus>>

This is much nicer for callers who want to short-circuit real I/O errors
with `?`, because they can write this

    if let Some(status) = foo.try_wait()? {
        ...
    } else {
        ...
    }

instead of this

    match foo.try_wait() {
        Ok(status) => {
            ...
        }
        Err(err) if err.kind() == io::ErrorKind::WouldBlock => {
            ...
        }
        Err(err) => return Err(err),
    }

The original design of `try_wait` was patterned after the `Read` and
`Write` traits, which support both blocking and non-blocking
implementations in a single API. But since `try_wait` is never blocking,
it makes sense to optimize for the non-blocking case.

Tracking issue: https://github.com/rust-lang/rust/issues/38903

											
										
										
											2017-02-03 17:39:41 -05:00
+								    pub fn try_wait(&mut self) -> io::Result<Option<ExitStatus>> {
-												std: Add a nonblocking `Child::try_wait` method

This commit adds a new method to the `Child` type in the `std::process` module
called `try_wait`. This method is the same as `wait` except that it will not
block the calling thread and instead only attempt to collect the exit status. On
Unix this means that we call `waitpid` with the `WNOHANG` flag and on Windows it
just means that we pass a 0 timeout to `WaitForSingleObject`.

Currently it's possible to build this method out of tree, but it's unfortunately
tricky to do so. Specifically on Unix you essentially lose ownership of the pid
for the process once a call to `waitpid` has succeeded. Although `Child` tracks
this state internally to be resilient to multiple calls to `wait` or a `kill`
after a successful wait, if the child is waited on externally then the state
inside of `Child` is not updated. This means that external implementations of
this method must be extra careful to essentially not use a `Child`'s methods
after a call to `waitpid` has succeeded (even in a nonblocking fashion).

By adding this functionality to the standard library it should help canonicalize
these external implementations and ensure they can continue to robustly reuse
the `Child` type from the standard library without worrying about pid ownership.

											
										
										
											2017-01-05 22:47:09 -08:00
+								        if let Some(status) = self.status {
-												make Child::try_wait return io::Result<Option<ExitStatus>>

This is much nicer for callers who want to short-circuit real I/O errors
with `?`, because they can write this

    if let Some(status) = foo.try_wait()? {
        ...
    } else {
        ...
    }

instead of this

    match foo.try_wait() {
        Ok(status) => {
            ...
        }
        Err(err) if err.kind() == io::ErrorKind::WouldBlock => {
            ...
        }
        Err(err) => return Err(err),
    }

The original design of `try_wait` was patterned after the `Read` and
`Write` traits, which support both blocking and non-blocking
implementations in a single API. But since `try_wait` is never blocking,
it makes sense to optimize for the non-blocking case.

Tracking issue: https://github.com/rust-lang/rust/issues/38903

											
										
										
											2017-02-03 17:39:41 -05:00
+								            return Ok(Some(status));
-												std: Add a nonblocking `Child::try_wait` method

This commit adds a new method to the `Child` type in the `std::process` module
called `try_wait`. This method is the same as `wait` except that it will not
block the calling thread and instead only attempt to collect the exit status. On
Unix this means that we call `waitpid` with the `WNOHANG` flag and on Windows it
just means that we pass a 0 timeout to `WaitForSingleObject`.

Currently it's possible to build this method out of tree, but it's unfortunately
tricky to do so. Specifically on Unix you essentially lose ownership of the pid
for the process once a call to `waitpid` has succeeded. Although `Child` tracks
this state internally to be resilient to multiple calls to `wait` or a `kill`
after a successful wait, if the child is waited on externally then the state
inside of `Child` is not updated. This means that external implementations of
this method must be extra careful to essentially not use a `Child`'s methods
after a call to `waitpid` has succeeded (even in a nonblocking fashion).

By adding this functionality to the standard library it should help canonicalize
these external implementations and ensure they can continue to robustly reuse
the `Child` type from the standard library without worrying about pid ownership.

											
										
										
											2017-01-05 22:47:09 -08:00
+								        }
-												if available use a Child's pidfd for kill/wait

											
										
										
											2023-11-16 01:41:02 +01:00
+								        #[cfg(target_os = "linux")]
 								        if let Some(pid_fd) = self.pidfd.as_ref() {
-												Add PidFd::{kill, wait, try_wait}

											
										
										
											2024-04-18 01:51:06 +02:00
+								            let status = pid_fd.try_wait()?;
 								            if let Some(status) = status {
 								                self.status = Some(status)
-												if available use a Child's pidfd for kill/wait

											
										
										
											2023-11-16 01:41:02 +01:00
+								            }
-												Add PidFd::{kill, wait, try_wait}

											
										
										
											2024-04-18 01:51:06 +02:00
+								            return Ok(status);
-												if available use a Child's pidfd for kill/wait

											
										
										
											2023-11-16 01:41:02 +01:00
+								        }
-												std: Add a nonblocking `Child::try_wait` method

This commit adds a new method to the `Child` type in the `std::process` module
called `try_wait`. This method is the same as `wait` except that it will not
block the calling thread and instead only attempt to collect the exit status. On
Unix this means that we call `waitpid` with the `WNOHANG` flag and on Windows it
just means that we pass a 0 timeout to `WaitForSingleObject`.

Currently it's possible to build this method out of tree, but it's unfortunately
tricky to do so. Specifically on Unix you essentially lose ownership of the pid
for the process once a call to `waitpid` has succeeded. Although `Child` tracks
this state internally to be resilient to multiple calls to `wait` or a `kill`
after a successful wait, if the child is waited on externally then the state
inside of `Child` is not updated. This means that external implementations of
this method must be extra careful to essentially not use a `Child`'s methods
after a call to `waitpid` has succeeded (even in a nonblocking fashion).

By adding this functionality to the standard library it should help canonicalize
these external implementations and ensure they can continue to robustly reuse
the `Child` type from the standard library without worrying about pid ownership.

											
										
										
											2017-01-05 22:47:09 -08:00
+								        let mut status = 0 as c_int;
 								        let pid = cvt(unsafe { libc::waitpid(self.pid, &mut status, libc::WNOHANG) })?;
 								        if pid == 0 {
-												make Child::try_wait return io::Result<Option<ExitStatus>>

This is much nicer for callers who want to short-circuit real I/O errors
with `?`, because they can write this

    if let Some(status) = foo.try_wait()? {
        ...
    } else {
        ...
    }

instead of this

    match foo.try_wait() {
        Ok(status) => {
            ...
        }
        Err(err) if err.kind() == io::ErrorKind::WouldBlock => {
            ...
        }
        Err(err) => return Err(err),
    }

The original design of `try_wait` was patterned after the `Read` and
`Write` traits, which support both blocking and non-blocking
implementations in a single API. But since `try_wait` is never blocking,
it makes sense to optimize for the non-blocking case.

Tracking issue: https://github.com/rust-lang/rust/issues/38903

											
										
										
											2017-02-03 17:39:41 -05:00
+								            Ok(None)
-												std: Add a nonblocking `Child::try_wait` method

This commit adds a new method to the `Child` type in the `std::process` module
called `try_wait`. This method is the same as `wait` except that it will not
block the calling thread and instead only attempt to collect the exit status. On
Unix this means that we call `waitpid` with the `WNOHANG` flag and on Windows it
just means that we pass a 0 timeout to `WaitForSingleObject`.

Currently it's possible to build this method out of tree, but it's unfortunately
tricky to do so. Specifically on Unix you essentially lose ownership of the pid
for the process once a call to `waitpid` has succeeded. Although `Child` tracks
this state internally to be resilient to multiple calls to `wait` or a `kill`
after a successful wait, if the child is waited on externally then the state
inside of `Child` is not updated. This means that external implementations of
this method must be extra careful to essentially not use a `Child`'s methods
after a call to `waitpid` has succeeded (even in a nonblocking fashion).

By adding this functionality to the standard library it should help canonicalize
these external implementations and ensure they can continue to robustly reuse
the `Child` type from the standard library without worrying about pid ownership.

											
										
										
											2017-01-05 22:47:09 -08:00
+								        } else {
 								            self.status = Some(ExitStatus::new(status));
-												make Child::try_wait return io::Result<Option<ExitStatus>>

This is much nicer for callers who want to short-circuit real I/O errors
with `?`, because they can write this

    if let Some(status) = foo.try_wait()? {
        ...
    } else {
        ...
    }

instead of this

    match foo.try_wait() {
        Ok(status) => {
            ...
        }
        Err(err) if err.kind() == io::ErrorKind::WouldBlock => {
            ...
        }
        Err(err) => return Err(err),
    }

The original design of `try_wait` was patterned after the `Read` and
`Write` traits, which support both blocking and non-blocking
implementations in a single API. But since `try_wait` is never blocking,
it makes sense to optimize for the non-blocking case.

Tracking issue: https://github.com/rust-lang/rust/issues/38903

											
										
										
											2017-02-03 17:39:41 -05:00
+								            Ok(Some(ExitStatus::new(status)))
-												std: Add a nonblocking `Child::try_wait` method

This commit adds a new method to the `Child` type in the `std::process` module
called `try_wait`. This method is the same as `wait` except that it will not
block the calling thread and instead only attempt to collect the exit status. On
Unix this means that we call `waitpid` with the `WNOHANG` flag and on Windows it
just means that we pass a 0 timeout to `WaitForSingleObject`.

Currently it's possible to build this method out of tree, but it's unfortunately
tricky to do so. Specifically on Unix you essentially lose ownership of the pid
for the process once a call to `waitpid` has succeeded. Although `Child` tracks
this state internally to be resilient to multiple calls to `wait` or a `kill`
after a successful wait, if the child is waited on externally then the state
inside of `Child` is not updated. This means that external implementations of
this method must be extra careful to essentially not use a `Child`'s methods
after a call to `waitpid` has succeeded (even in a nonblocking fashion).

By adding this functionality to the standard library it should help canonicalize
these external implementations and ensure they can continue to robustly reuse
the `Child` type from the standard library without worrying about pid ownership.

											
										
										
											2017-01-05 22:47:09 -08:00
+								        }
 								    }
-												Separated fuchsia-specific process stuff into 'process_fuchsia.rs' and refactored out some now-duplicated code into a 'process_common.rs'

											
										
										
											2016-11-23 13:58:13 -08:00
+								}
-												Fix ExitStatus on Fuchsia

Fuchsia exit codes don't follow the convention of libc::WEXITSTATUS et
al, and they are 64 bits instead of 32 bits. This gives Fuchsia its own
representation of ExitStatus.

Additionally, the zircon syscall structs were out of date, causing us to
see bogus return codes.

											
										
										
											2019-09-24 21:34:44 -07:00
 								/// Unix exit statuses
-												unix::ExitStatus: Add comment saying that it's a wait status

With cross-reference.

Signed-off-by: Ian Jackson <ijackson@chiark.greenend.org.uk>

											
										
										
											2021-11-08 17:38:01 +00:00
+								//
 								// This is not actually an "exit status" in Unix terminology.  Rather, it is a "wait status".
 								// See the discussion in comments and doc comments for `std::process::ExitStatus`.
-												impl Default for ExitStatus

											
										
										
											2023-01-03 20:47:07 +00:00
+								#[derive(PartialEq, Eq, Clone, Copy, Default)]
-												Fix ExitStatus on Fuchsia

Fuchsia exit codes don't follow the convention of libc::WEXITSTATUS et
al, and they are 64 bits instead of 32 bits. This gives Fuchsia its own
representation of ExitStatus.

Additionally, the zircon syscall structs were out of date, causing us to
see bogus return codes.

											
										
										
											2019-09-24 21:34:44 -07:00
+								pub struct ExitStatus(c_int);
-												Manual Debug for Unix ExitCode ExitStatus ExitStatusError

These structs have misleading names.  An ExitStatus[Error] is actually
a Unix wait status; an ExitCode is actually an exit status.

The Display impls are fixed, but the Debug impls are still misleading,
as reported in #74832.

Fix this by pretending that these internal structs are called
`unix_exit_status` and `unix_wait_status` as applicable.  (We can't
actually rename the structs because of the way that the cross-platform
machinery works: the names are cross-platform.)

Signed-off-by: Ian Jackson <ijackson@chiark.greenend.org.uk>

											
										
										
											2021-08-24 18:56:24 +01:00
+								impl fmt::Debug for ExitStatus {
 								    // Debug output is labelled `unix_wait_status` rather than with the struct's own
 								    // name, and shows only the wrapped raw value.
 								    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
 								        f.debug_tuple("unix_wait_status").field(&self.0).finish()
 								    }
 								}
-												Fix ExitStatus on Fuchsia

Fuchsia exit codes don't follow the convention of libc::WEXITSTATUS et
al, and they are 64 bits instead of 32 bits. This gives Fuchsia its own
representation of ExitStatus.

Additionally, the zircon syscall structs were out of date, causing us to
see bogus return codes.

											
										
										
											2019-09-24 21:34:44 -07:00
+								impl ExitStatus {
 								    pub fn new(status: c_int) -> ExitStatus {
 								        ExitStatus(status)
 								    }
-												if available use a Child's pidfd for kill/wait

											
										
										
											2023-11-16 01:41:02 +01:00
+								    #[cfg(target_os = "linux")]
 								    pub fn from_waitid_siginfo(siginfo: libc::siginfo_t) -> ExitStatus {
 								        // Rebuilds a raw wait-status integer from the `si_code` / `si_status` pair and
 								        // wraps it once at the end.
 								        // NOTE(review): assumes `siginfo` was filled in by `waitid`, so that reading
 								        // `si_status` is meaningful — confirm at the call sites.
 								        let raw = unsafe { siginfo.si_status() };
 								        let wait_status = match siginfo.si_code {
 								            // Exit code goes into the second byte.
 								            libc::CLD_EXITED => (raw & 0xff) << 8,
 								            // The value is used as-is.
 								            libc::CLD_KILLED => raw,
 								            // Same as killed, with bit 0x80 set.
 								            libc::CLD_DUMPED => raw | 0x80,
 								            libc::CLD_CONTINUED => 0xffff,
 								            // Value in the second byte, low byte fixed to 0x7f.
 								            libc::CLD_STOPPED | libc::CLD_TRAPPED => ((raw & 0xff) << 8) | 0x7f,
 								            _ => unreachable!("waitid() should only return the above codes"),
 								        };
 								        ExitStatus(wait_status)
 								    }
-												Fix ExitStatus on Fuchsia

Fuchsia exit codes don't follow the convention of libc::WEXITSTATUS et
al, and they are 64 bits instead of 32 bits. This gives Fuchsia its own
representation of ExitStatus.

Additionally, the zircon syscall structs were out of date, causing us to
see bogus return codes.

											
										
										
											2019-09-24 21:34:44 -07:00
+								    fn exited(&self) -> bool {
-												Update libc to 0.2.79

This also fixes issues with inconsistent `unsafe` on functions.

											
										
										
											2020-09-30 21:30:07 -07:00
+								        libc::WIFEXITED(self.0)
-												Fix ExitStatus on Fuchsia

Fuchsia exit codes don't follow the convention of libc::WEXITSTATUS et
al, and they are 64 bits instead of 32 bits. This gives Fuchsia its own
representation of ExitStatus.

Additionally, the zircon syscall structs were out of date, causing us to
see bogus return codes.

											
										
										
											2019-09-24 21:34:44 -07:00
+								    }
-												Provide ExitStatusError

Closes #73125

This is in pursuance of
  Issue #73127 Consider adding #[must_use] to std::process::ExitStatus

In
  MR #81452 Add #[must_use] to [...] process::ExitStatus
we concluded that the existing arrangements are too awkward
so adding that #[must_use] is blocked on improving the ergonomics.

I wrote a mini-RFC-style discussion of the approach in
  https://github.com/rust-lang/rust/issues/73125#issuecomment-771092741

Signed-off-by: Ian Jackson <ijackson@chiark.greenend.org.uk>

											
										
										
											2021-03-03 12:17:16 +00:00
+								    pub fn exit_ok(&self) -> Result<(), ExitStatusError> {
-												Remove various double spaces in source comments.

											
										
										
											2023-01-14 16:33:11 +01:00
+								        // This assumes that WIFEXITED(status) && WEXITSTATUS==0 corresponds to status==0. This is
-												Add `ExitStatusError` for `vxworks`

											
										
										
											2021-05-20 01:34:06 +02:00
+								        // true on all actual versions of Unix, is widely assumed, and is specified in SuS
-												Remove various double spaces in source comments.

											
										
										
											2023-01-14 16:33:11 +01:00
+								        // https://pubs.opengroup.org/onlinepubs/9699919799/functions/wait.html. If it is not
-												Provide ExitStatusError

Closes #73125

This is in pursuance of
  Issue #73127 Consider adding #[must_use] to std::process::ExitStatus

In
  MR #81452 Add #[must_use] to [...] process::ExitStatus
we concluded that the existing arrangements are too awkward
so adding that #[must_use] is blocked on improving the ergonomics.

I wrote a mini-RFC-style discussion of the approach in
  https://github.com/rust-lang/rust/issues/73125#issuecomment-771092741

Signed-off-by: Ian Jackson <ijackson@chiark.greenend.org.uk>

											
										
										
											2021-03-03 12:17:16 +00:00
+								        // true for a platform pretending to be Unix, the tests (our doctests, and also
-												Spelling library/

* advance
* aligned
* borrowed
* calculate
* debugable
* debuggable
* declarations
* desugaring
* documentation
* enclave
* ignorable
* initialized
* iterator
* kaboom
* monomorphization
* nonexistent
* optimizer
* panicking
* process
* reentrant
* rustonomicon
* the
* uninitialized

Signed-off-by: Josh Soref <2119212+jsoref@users.noreply.github.com>

											
										
										
											2023-04-11 00:49:38 -04:00
+								        // process_unix/tests.rs) will spot it. `ExitStatusError::code` assumes this too.
-												Remove `raw_os_nonzero` feature.

											
										
										
											2024-01-24 03:19:51 +01:00
+								        match NonZero::try_from(self.0) {
-												Provide ExitStatusError

Closes #73125

This is in pursuance of
  Issue #73127 Consider adding #[must_use] to std::process::ExitStatus

In
  MR #81452 Add #[must_use] to [...] process::ExitStatus
we concluded that the existing arrangements are too awkward
so adding that #[must_use] is blocked on improving the ergonomics.

I wrote a mini-RFC-style discussion of the approach in
  https://github.com/rust-lang/rust/issues/73125#issuecomment-771092741

Signed-off-by: Ian Jackson <ijackson@chiark.greenend.org.uk>

											
										
										
											2021-03-03 12:17:16 +00:00
+								            /* was nonzero */ Ok(failure) => Err(ExitStatusError(failure)),
 								            /* was zero, couldn't convert */ Err(_) => Ok(()),
 								        }
-												Fix ExitStatus on Fuchsia

Fuchsia exit codes don't follow the convention of libc::WEXITSTATUS et
al, and they are 64 bits instead of 32 bits. This gives Fuchsia its own
representation of ExitStatus.

Additionally, the zircon syscall structs were out of date, causing us to
see bogus return codes.

											
										
										
											2019-09-24 21:34:44 -07:00
+								    }
 								    pub fn code(&self) -> Option<i32> {
-												feat: Add use of bool::then in sys/unix/process

Remove else { None } in favor of using bool::then()

											
										
										
											2022-03-17 19:12:09 -04:00
+								        self.exited().then(|| libc::WEXITSTATUS(self.0))
-												Fix ExitStatus on Fuchsia

Fuchsia exit codes don't follow the convention of libc::WEXITSTATUS et
al, and they are 64 bits instead of 32 bits. This gives Fuchsia its own
representation of ExitStatus.

Additionally, the zircon syscall structs were out of date, causing us to
see bogus return codes.

											
										
										
											2019-09-24 21:34:44 -07:00
+								    }
 								    pub fn signal(&self) -> Option<i32> {
-												feat: Add use of bool::then in sys/unix/process

Remove else { None } in favor of using bool::then()

											
										
										
											2022-03-17 19:12:09 -04:00
+								        libc::WIFSIGNALED(self.0).then(|| libc::WTERMSIG(self.0))
-												Fix ExitStatus on Fuchsia

Fuchsia exit codes don't follow the convention of libc::WEXITSTATUS et
al, and they are 64 bits instead of 32 bits. This gives Fuchsia its own
representation of ExitStatus.

Additionally, the zircon syscall structs were out of date, causing us to
see bogus return codes.

											
										
										
											2019-09-24 21:34:44 -07:00
+								    }
-												unix ExitStatus: Provide .into_raw()

Signed-off-by: Ian Jackson <ijackson@chiark.greenend.org.uk>

											
										
										
											2020-12-12 21:41:55 +00:00
-												unix ExitStatus: Provide .core_dumped

This is essential for proper reporting of child process status on Unix.

Signed-off-by: Ian Jackson <ijackson@chiark.greenend.org.uk>

											
										
										
											2020-12-12 21:44:13 +00:00
+								    pub fn core_dumped(&self) -> bool {
 								        // The core-dump flag is only consulted when the status reports termination
 								        // by a signal; otherwise this is `false`.
 								        libc::WIFSIGNALED(self.0) && libc::WCOREDUMP(self.0)
 								    }
-												unix ExitStatus: Provide .stopped_signal()

Necessary to handle WIFSTOPPED.

Signed-off-by: Ian Jackson <ijackson@chiark.greenend.org.uk>

											
										
										
											2020-12-12 21:47:47 +00:00
+								    pub fn stopped_signal(&self) -> Option<i32> {
-												feat: Add use of bool::then in sys/unix/process

Remove else { None } in favor of using bool::then()

											
										
										
											2022-03-17 19:12:09 -04:00
+								        libc::WIFSTOPPED(self.0).then(|| libc::WSTOPSIG(self.0))
-												unix ExitStatus: Provide .stopped_signal()

Necessary to handle WIFSTOPPED.

Signed-off-by: Ian Jackson <ijackson@chiark.greenend.org.uk>

											
										
										
											2020-12-12 21:47:47 +00:00
+								    }
-												unix ExitStatus: Provide .continued()

Signed-off-by: Ian Jackson <ijackson@chiark.greenend.org.uk>

											
										
										
											2020-12-12 21:52:17 +00:00
+								    pub fn continued(&self) -> bool {
 								        // Reports whether the raw status satisfies `WIFCONTINUED`.
 								        libc::WIFCONTINUED(self.0)
 								    }
-												unix ExitStatus: Provide .into_raw()

Signed-off-by: Ian Jackson <ijackson@chiark.greenend.org.uk>

											
										
										
											2020-12-12 21:41:55 +00:00
+								    pub fn into_raw(&self) -> c_int {
 								        // Returns the wrapped raw value unchanged. Takes `&self` despite the `into_`
 								        // prefix; the field is a plain `c_int`, so it is simply copied out.
 								        self.0
 								    }
-												Fix ExitStatus on Fuchsia

Fuchsia exit codes don't follow the convention of libc::WEXITSTATUS et
al, and they are 64 bits instead of 32 bits. This gives Fuchsia its own
representation of ExitStatus.

Additionally, the zircon syscall structs were out of date, causing us to
see bogus return codes.

											
										
										
											2019-09-24 21:34:44 -07:00
+								}
-												Added docs for `From<c_int>` for `ExitStatus`

											
										
										
											2020-07-13 13:47:18 +02:00
+								/// Converts a raw `c_int` to a type-safe `ExitStatus` by wrapping it without copying.
-												Fix ExitStatus on Fuchsia

Fuchsia exit codes don't follow the convention of libc::WEXITSTATUS et
al, and they are 64 bits instead of 32 bits. This gives Fuchsia its own
representation of ExitStatus.

Additionally, the zircon syscall structs were out of date, causing us to
see bogus return codes.

											
										
										
											2019-09-24 21:34:44 -07:00
+								impl From<c_int> for ExitStatus {
 								    // Stores the raw value as-is; no validation or reinterpretation is performed.
 								    fn from(a: c_int) -> ExitStatus {
 								        ExitStatus(a)
 								    }
 								}
-												std: `<ExitStatus as Display>::fmt` name the signal it died from

											
										
										
											2022-04-08 13:39:24 -07:00
+								/// Convert a signal number to a readable, searchable name.
-												std: show signal number along with name

											
										
										
											2022-06-01 11:20:11 -07:00
+								///
 								/// This string should be displayed right after the signal number.
 								/// If a signal is unrecognized, it returns the empty string, so that
 								/// you just get the number like "0". If it is recognized, you'll get
 								/// something like "9 (SIGKILL)".
 								fn signal_string(signal: i32) -> &'static str {
 								    match signal {
 								        libc::SIGHUP => " (SIGHUP)",
 								        libc::SIGINT => " (SIGINT)",
 								        libc::SIGQUIT => " (SIGQUIT)",
 								        libc::SIGILL => " (SIGILL)",
 								        libc::SIGTRAP => " (SIGTRAP)",
 								        libc::SIGABRT => " (SIGABRT)",
-												fix: get the l4re target working again

											
										
										
											2023-06-13 20:20:17 +00:00
+								        #[cfg(not(target_os = "l4re"))]
-												std: show signal number along with name

											
										
										
											2022-06-01 11:20:11 -07:00
+								        libc::SIGBUS => " (SIGBUS)",
 								        libc::SIGFPE => " (SIGFPE)",
 								        libc::SIGKILL => " (SIGKILL)",
-												fix: get the l4re target working again

											
										
										
											2023-06-13 20:20:17 +00:00
+								        #[cfg(not(target_os = "l4re"))]
-												std: show signal number along with name

											
										
										
											2022-06-01 11:20:11 -07:00
+								        libc::SIGUSR1 => " (SIGUSR1)",
 								        libc::SIGSEGV => " (SIGSEGV)",
-												fix: get the l4re target working again

											
										
										
											2023-06-13 20:20:17 +00:00
+								        #[cfg(not(target_os = "l4re"))]
-												std: show signal number along with name

											
										
										
											2022-06-01 11:20:11 -07:00
+								        libc::SIGUSR2 => " (SIGUSR2)",
 								        libc::SIGPIPE => " (SIGPIPE)",
 								        libc::SIGALRM => " (SIGALRM)",
 								        libc::SIGTERM => " (SIGTERM)",
-												fix: get the l4re target working again

											
										
										
											2023-06-13 20:20:17 +00:00
+								        #[cfg(not(target_os = "l4re"))]
-												std: show signal number along with name

											
										
										
											2022-06-01 11:20:11 -07:00
+								        libc::SIGCHLD => " (SIGCHLD)",
-												fix: get the l4re target working again

											
										
										
											2023-06-13 20:20:17 +00:00
+								        #[cfg(not(target_os = "l4re"))]
-												std: show signal number along with name

											
										
										
											2022-06-01 11:20:11 -07:00
+								        libc::SIGCONT => " (SIGCONT)",
-												fix: get the l4re target working again

											
										
										
											2023-06-13 20:20:17 +00:00
+								        #[cfg(not(target_os = "l4re"))]
-												std: show signal number along with name

											
										
										
											2022-06-01 11:20:11 -07:00
+								        libc::SIGSTOP => " (SIGSTOP)",
-												fix: get the l4re target working again

											
										
										
											2023-06-13 20:20:17 +00:00
+								        #[cfg(not(target_os = "l4re"))]
-												std: show signal number along with name

											
										
										
											2022-06-01 11:20:11 -07:00
+								        libc::SIGTSTP => " (SIGTSTP)",
-												fix: get the l4re target working again

											
										
										
											2023-06-13 20:20:17 +00:00
+								        #[cfg(not(target_os = "l4re"))]
-												std: show signal number along with name

											
										
										
											2022-06-01 11:20:11 -07:00
+								        libc::SIGTTIN => " (SIGTTIN)",
-												fix: get the l4re target working again

											
										
										
											2023-06-13 20:20:17 +00:00
+								        #[cfg(not(target_os = "l4re"))]
-												std: show signal number along with name

											
										
										
											2022-06-01 11:20:11 -07:00
+								        libc::SIGTTOU => " (SIGTTOU)",
-												fix: get the l4re target working again

											
										
										
											2023-06-13 20:20:17 +00:00
+								        #[cfg(not(target_os = "l4re"))]
-												std: show signal number along with name

											
										
										
											2022-06-01 11:20:11 -07:00
+								        libc::SIGURG => " (SIGURG)",
-												fix: get the l4re target working again

											
										
										
											2023-06-13 20:20:17 +00:00
+								        #[cfg(not(target_os = "l4re"))]
-												std: show signal number along with name

											
										
										
											2022-06-01 11:20:11 -07:00
+								        libc::SIGXCPU => " (SIGXCPU)",
-												fix: get the l4re target working again

											
										
										
											2023-06-13 20:20:17 +00:00
+								        #[cfg(not(target_os = "l4re"))]
-												std: show signal number along with name

											
										
										
											2022-06-01 11:20:11 -07:00
+								        libc::SIGXFSZ => " (SIGXFSZ)",
-												fix: get the l4re target working again

											
										
										
											2023-06-13 20:20:17 +00:00
+								        #[cfg(not(target_os = "l4re"))]
-												std: show signal number along with name

											
										
										
											2022-06-01 11:20:11 -07:00
+								        libc::SIGVTALRM => " (SIGVTALRM)",
-												fix: get the l4re target working again

											
										
										
											2023-06-13 20:20:17 +00:00
+								        #[cfg(not(target_os = "l4re"))]
-												std: show signal number along with name

											
										
										
											2022-06-01 11:20:11 -07:00
+								        libc::SIGPROF => " (SIGPROF)",
-												fix: get the l4re target working again

											
										
										
											2023-06-13 20:20:17 +00:00
+								        #[cfg(not(target_os = "l4re"))]
-												std: show signal number along with name

											
										
										
											2022-06-01 11:20:11 -07:00
+								        libc::SIGWINCH => " (SIGWINCH)",
-												fix: get the l4re target working again

											
										
										
											2023-06-13 20:20:17 +00:00
+								        #[cfg(not(any(target_os = "haiku", target_os = "l4re")))]
-												std: show signal number along with name

											
										
										
											2022-06-01 11:20:11 -07:00
+								        libc::SIGIO => " (SIGIO)",
-												signal update string representation for haiku.

											
										
										
											2023-01-18 23:06:59 +00:00
+								        #[cfg(target_os = "haiku")]
 								        libc::SIGPOLL => " (SIGPOLL)",
-												fix: get the l4re target working again

											
										
										
											2023-06-13 20:20:17 +00:00
+								        #[cfg(not(target_os = "l4re"))]
-												std: show signal number along with name

											
										
										
											2022-06-01 11:20:11 -07:00
+								        libc::SIGSYS => " (SIGSYS)",
-												Fix MIPS-specific signal bug

											
										
										
											2022-06-02 15:18:16 -07:00
+								        // For information on Linux signals, run `man 7 signal`
 								        #[cfg(all(
 								            target_os = "linux",
 								            any(
 								                target_arch = "x86_64",
 								                target_arch = "x86",
 								                target_arch = "arm",
 								                target_arch = "aarch64"
 								            )
 								        ))]
-												std: show signal number along with name

											
										
										
											2022-06-01 11:20:11 -07:00
+								        libc::SIGSTKFLT => " (SIGSTKFLT)",
-												Add QNX Neutrino support to libstd

Co-authored-by: gh-tr <troach@qnx.com>

											
										
										
											2023-01-10 10:44:05 +01:00
+								        #[cfg(any(target_os = "linux", target_os = "nto"))]
-												std: show signal number along with name

											
										
										
											2022-06-01 11:20:11 -07:00
+								        libc::SIGPWR => " (SIGPWR)",
-												std: `<ExitStatus as Display>::fmt` name the signal it died from

											
										
										
											2022-04-08 13:39:24 -07:00
+								        #[cfg(any(
 								            target_os = "freebsd",
 								            target_os = "netbsd",
 								            target_os = "openbsd",
-												Add QNX Neutrino support to libstd

Co-authored-by: gh-tr <troach@qnx.com>

											
										
										
											2023-01-10 10:44:05 +01:00
+								            target_os = "dragonfly",
 								            target_os = "nto",
-												Fix SIGEMT and SIGINFO parsing on watchOS and visionOS

											
										
										
											2024-04-28 17:37:04 +02:00
+								            target_vendor = "apple",
-												std: `<ExitStatus as Display>::fmt` name the signal it died from

											
										
										
											2022-04-08 13:39:24 -07:00
+								        ))]
-												std: show signal number along with name

											
										
										
											2022-06-01 11:20:11 -07:00
+								        libc::SIGEMT => " (SIGEMT)",
-												std: `<ExitStatus as Display>::fmt` name the signal it died from

											
										
										
											2022-04-08 13:39:24 -07:00
+								        #[cfg(any(
 								            target_os = "freebsd",
 								            target_os = "netbsd",
 								            target_os = "openbsd",
-												Fix SIGEMT and SIGINFO parsing on watchOS and visionOS

											
										
										
											2024-04-28 17:37:04 +02:00
+								            target_os = "dragonfly",
 								            target_vendor = "apple",
-												std: `<ExitStatus as Display>::fmt` name the signal it died from

											
										
										
											2022-04-08 13:39:24 -07:00
+								        ))]
-												std: show signal number along with name

											
										
										
											2022-06-01 11:20:11 -07:00
+								        libc::SIGINFO => " (SIGINFO)",
-												added support for GNU/Hurd

											
										
										
											2023-09-19 12:41:30 +02:00
+								        #[cfg(target_os = "hurd")]
 								        libc::SIGLOST => " (SIGLOST)",
-												std::unix::process adding few specific freebsd signals to be able to id.

											
										
										
											2024-06-08 08:31:35 +01:00
+								        #[cfg(target_os = "freebsd")]
 								        libc::SIGTHR => " (SIGTHR)",
 								        #[cfg(target_os = "freebsd")]
 								        libc::SIGLIBRT => " (SIGLIBRT)",
-												std: show signal number along with name

											
										
										
											2022-06-01 11:20:11 -07:00
+								        _ => "",
 								    }
-												std: `<ExitStatus as Display>::fmt` name the signal it died from

											
										
										
											2022-04-08 13:39:24 -07:00
+								}
-												Fix ExitStatus on Fuchsia

Fuchsia exit codes don't follow the convention of libc::WEXITSTATUS et
al, and they are 64 bits instead of 32 bits. This gives Fuchsia its own
representation of ExitStatus.

Additionally, the zircon syscall structs were out of date, causing us to
see bogus return codes.

											
										
										
											2019-09-24 21:34:44 -07:00
+								impl fmt::Display for ExitStatus {
 								    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
 								        if let Some(code) = self.code() {
-												Use implicit capture syntax in format_args

This updates the standard library's documentation to use the new syntax. The
documentation is worthwhile to update as it should be more idiomatic
(particularly for features like this, which are nice for users to get acquainted
with). The general codebase is likely more hassle than benefit to update: it'll
hurt git blame, and generally updates can be done by folks updating the code if
(and when) that makes things more readable with the new format.

A few places in the compiler and library code are updated (mostly just due to
already having been done when this commit was first authored).

											
										
										
											2022-02-12 23:16:17 +04:00
+								            write!(f, "exit status: {code}")
-												process::unix: Handle other wait statuses in ExitStatus as Display

Currently, on Nightly, this panics:

```
use std::process::ExitStatus;
use std::os::unix::process::ExitStatusExt;

fn main() {
    let st = ExitStatus::from_raw(0x007f);
    println!("st = {}", st);
}
```

This is because the impl of Display assumes that if .code() is None,
.signal() must be Some.  That was a false assumption, although it was
true with buggy code before
  5b1316f78152a9c066b357ea9addf803d48e114a
  unix ExitStatus: Do not treat WIFSTOPPED as WIFSIGNALED

This is not likely to have affected many people in practice, because
`Command` will never produce such a wait status (`ExitStatus`).

Signed-off-by: Ian Jackson <ijackson@chiark.greenend.org.uk>

											
										
										
											2021-02-22 14:30:03 +00:00
+								        } else if let Some(signal) = self.signal() {
-												std: show signal number along with name

											
										
										
											2022-06-01 11:20:11 -07:00
+								            let signal_string = signal_string(signal);
-												process::unix: Handle other wait statuses in ExitStatus as Display

Currently, on Nightly, this panics:

```
use std::process::ExitStatus;
use std::os::unix::process::ExitStatusExt;

fn main() {
    let st = ExitStatus::from_raw(0x007f);
    println!("st = {}", st);
}
```

This is because the impl of Display assumes that if .code() is None,
.signal() must be Some.  That was a false assumption, although it was
true with buggy code before
  5b1316f78152a9c066b357ea9addf803d48e114a
  unix ExitStatus: Do not treat WIFSTOPPED as WIFSIGNALED

This is not likely to have affected many people in practice, because
`Command` will never produce such a wait status (`ExitStatus`).

Signed-off-by: Ian Jackson <ijackson@chiark.greenend.org.uk>

											
										
										
											2021-02-22 14:30:03 +00:00
+								            if self.core_dumped() {
-												std: show signal number along with name

											
										
										
											2022-06-01 11:20:11 -07:00
+								                write!(f, "signal: {signal}{signal_string} (core dumped)")
-												process::unix: Handle other wait statuses in ExitStatus as Display

Currently, on Nightly, this panics:

```
use std::process::ExitStatus;
use std::os::unix::process::ExitStatusExt;

fn main() {
    let st = ExitStatus::from_raw(0x007f);
    println!("st = {}", st);
}
```

This is because the impl of Display assumes that if .code() is None,
.signal() must be Some.  That was a false assumption, although it was
true with buggy code before
  5b1316f78152a9c066b357ea9addf803d48e114a
  unix ExitStatus: Do not treat WIFSTOPPED as WIFSIGNALED

This is not likely to have affected many people in practice, because
`Command` will never produce such a wait status (`ExitStatus`).

Signed-off-by: Ian Jackson <ijackson@chiark.greenend.org.uk>

											
										
										
											2021-02-22 14:30:03 +00:00
+								            } else {
-												std: show signal number along with name

											
										
										
											2022-06-01 11:20:11 -07:00
+								                write!(f, "signal: {signal}{signal_string}")
-												process::unix: Handle other wait statuses in ExitStatus as Display

Currently, on Nightly, this panics:

```
use std::process::ExitStatus;
use std::os::unix::process::ExitStatusExt;

fn main() {
    let st = ExitStatus::from_raw(0x007f);
    println!("st = {}", st);
}
```

This is because the impl of Display assumes that if .code() is None,
.signal() must be Some.  That was a false assumption, although it was
true with buggy code before
  5b1316f78152a9c066b357ea9addf803d48e114a
  unix ExitStatus: Do not treat WIFSTOPPED as WIFSIGNALED

This is not likely to have affected many people in practice, because
`Command` will never produce such a wait status (`ExitStatus`).

Signed-off-by: Ian Jackson <ijackson@chiark.greenend.org.uk>

											
										
										
											2021-02-22 14:30:03 +00:00
+								            }
 								        } else if let Some(signal) = self.stopped_signal() {
-												std: show signal number along with name

											
										
										
											2022-06-01 11:20:11 -07:00
+								            let signal_string = signal_string(signal);
 								            write!(f, "stopped (not terminated) by signal: {signal}{signal_string}")
-												process::unix: Handle other wait statuses in ExitStatus as Display

Currently, on Nightly, this panics:

```
use std::process::ExitStatus;
use std::os::unix::process::ExitStatusExt;

fn main() {
    let st = ExitStatus::from_raw(0x007f);
    println!("st = {}", st);
}
```

This is because the impl of Display assumes that if .code() is None,
.signal() must be Some.  That was a false assumption, although it was
true with buggy code before
  5b1316f78152a9c066b357ea9addf803d48e114a
  unix ExitStatus: Do not treat WIFSTOPPED as WIFSIGNALED

This is not likely to have affected many people in practice, because
`Command` will never produce such a wait status (`ExitStatus`).

Signed-off-by: Ian Jackson <ijackson@chiark.greenend.org.uk>

											
										
										
											2021-02-22 14:30:03 +00:00
+								        } else if self.continued() {
 								            write!(f, "continued (WIFCONTINUED)")
-												Fix ExitStatus on Fuchsia

Fuchsia exit codes don't follow the convention of libc::WEXITSTATUS et
al, and they are 64 bits instead of 32 bits. This gives Fuchsia its own
representation of ExitStatus.

Additionally, the zircon syscall structs were out of date, causing us to
see bogus return codes.

											
										
										
											2019-09-24 21:34:44 -07:00
+								        } else {
-												process::unix: Handle other wait statuses in ExitStatus as Display

Currently, on Nightly, this panics:

```
use std::process::ExitStatus;
use std::os::unix::process::ExitStatusExt;

fn main() {
    let st = ExitStatus::from_raw(0x007f);
    println!("st = {}", st);
}
```

This is because the impl of Display assumes that if .code() is None,
.signal() must be Some.  That was a false assumption, although it was
true with buggy code before
  5b1316f78152a9c066b357ea9addf803d48e114a
  unix ExitStatus: Do not treat WIFSTOPPED as WIFSIGNALED

This is not likely to have affected many people in practice, because
`Command` will never produce such a wait status (`ExitStatus`).

Signed-off-by: Ian Jackson <ijackson@chiark.greenend.org.uk>

											
										
										
											2021-02-22 14:30:03 +00:00
+								            write!(f, "unrecognised wait status: {} {:#x}", self.0, self.0)
-												Fix ExitStatus on Fuchsia

Fuchsia exit codes don't follow the convention of libc::WEXITSTATUS et
al, and they are 64 bits instead of 32 bits. This gives Fuchsia its own
representation of ExitStatus.

Additionally, the zircon syscall structs were out of date, causing us to
see bogus return codes.

											
										
										
											2019-09-24 21:34:44 -07:00
+								        }
 								    }
 								}
-												process::unix: Test wait status formatting

Signed-off-by: Ian Jackson <ijackson@chiark.greenend.org.uk>

											
										
										
											2021-02-22 14:58:52 +00:00
-												Manual Debug for Unix ExitCode ExitStatus ExitStatusError

These structs have misleading names.  An ExitStatus[Error] is actually
a Unix wait status; an ExitCode is actually an exit status.

The Display impls are fixed, but the Debug impls are still misleading,
as reported in #74832.

Fix this by pretending that these internal structs are called
`unix_exit_status` and `unix_wait_status` as applicable.  (We can't
actually rename the structs because of the way that the cross-platform
machinery works: the names are cross-platform.)

Signed-off-by: Ian Jackson <ijackson@chiark.greenend.org.uk>

											
										
										
											2021-08-24 18:56:24 +01:00
+								#[derive(PartialEq, Eq, Clone, Copy)]
-												Remove `raw_os_nonzero` feature.

											
										
										
											2024-01-24 03:19:51 +01:00
 								/// Newtype over a nonzero `c_int`. Its `Debug` output labels the wrapped
 								/// value `unix_wait_status`.
+								pub struct ExitStatusError(NonZero<c_int>);
-												Provide ExitStatusError

Closes #73125

This is in pursuance of
  Issue #73127 Consider adding #[must_use] to std::process::ExitStatus

In
  MR #81452 Add #[must_use] to [...] process::ExitStatus
we concluded that the existing arrangements are too awkward
so adding that #[must_use] is blocked on improving the ergonomics.

I wrote a mini-RFC-style discussion of the approach in
  https://github.com/rust-lang/rust/issues/73125#issuecomment-771092741

Signed-off-by: Ian Jackson <ijackson@chiark.greenend.org.uk>

											
										
										
											2021-03-03 12:17:16 +00:00
 								impl Into<ExitStatus> for ExitStatusError {
 								    fn into(self) -> ExitStatus {
 								        ExitStatus(self.0.into())
 								    }
 								}
-												Manual Debug for Unix ExitCode ExitStatus ExitStatusError

These structs have misleading names.  An ExitStatus[Error] is actually
a Unix wait status; an ExitCode is actually an exit status.

The Display impls are fixed, but the Debug impls are still misleading,
as reported in #74832.

Fix this by pretending that these internal structs are called
`unix_exit_status` and `unix_wait_status` as applicable.  (We can't
actually rename the structs because of the way that the cross-platform
machinery works: the names are cross-platform.)

Signed-off-by: Ian Jackson <ijackson@chiark.greenend.org.uk>

											
										
										
											2021-08-24 18:56:24 +01:00
+								impl fmt::Debug for ExitStatusError {
 								    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
 								        f.debug_tuple("unix_wait_status").field(&self.0).finish()
 								    }
 								}
-												Provide ExitStatusError

Closes #73125

This is in pursuance of
  Issue #73127 Consider adding #[must_use] to std::process::ExitStatus

In
  MR #81452 Add #[must_use] to [...] process::ExitStatus
we concluded that the existing arrangements are too awkward
so adding that #[must_use] is blocked on improving the ergonomics.

I wrote a mini-RFC-style discussion of the approach in
  https://github.com/rust-lang/rust/issues/73125#issuecomment-771092741

Signed-off-by: Ian Jackson <ijackson@chiark.greenend.org.uk>

											
										
										
											2021-03-03 12:17:16 +00:00
+								impl ExitStatusError {
-												Use generic `NonZero` internally.

											
										
										
											2024-01-29 23:59:09 +01:00
+								    pub fn code(self) -> Option<NonZero<i32>> {
-												Provide ExitStatusError

Closes #73125

This is in pursuance of
  Issue #73127 Consider adding #[must_use] to std::process::ExitStatus

In
  MR #81452 Add #[must_use] to [...] process::ExitStatus
we concluded that the existing arrangements in are too awkward
so adding that #[must_use] is blocked on improving the ergonomics.

I wrote a mini-RFC-style discusion of the approach in
  https://github.com/rust-lang/rust/issues/73125#issuecomment-771092741

Signed-off-by: Ian Jackson <ijackson@chiark.greenend.org.uk>

											
										
										
											2021-03-03 12:17:16 +00:00
+								        ExitStatus(self.0.into()).code().map(|st| st.try_into().unwrap())
 								    }
 								}
-												Add Linux-specific pidfd process extensions

Background:

Over the last year, pidfd support was added to the Linux kernel. This
allows interacting with other processes. In particular, this allows
waiting on a child process with a timeout in a race-free way, bypassing
all of the awful signal-handler tricks that are usually required.

Pidfds can be obtained for a child process (as well as any other
process) via the `pidfd_open` syscall. Unfortunately, this requires
several conditions to hold in order to be race-free (i.e. the pid is not
reused).
Per `man pidfd_open`:

```
· the disposition of SIGCHLD has not been explicitly set to SIG_IGN
 (see sigaction(2));

· the SA_NOCLDWAIT flag was not specified while establishing a han‐
 dler for SIGCHLD or while setting the disposition of that signal to
 SIG_DFL (see sigaction(2)); and

· the zombie process was not reaped elsewhere in the program (e.g.,
 either by an asynchronously executed signal handler or by wait(2)
 or similar in another thread).

If any of these conditions does not hold, then the child process
(along with a PID file descriptor that refers to it) should instead
be created using clone(2) with the CLONE_PIDFD flag.
```

Sadly, these conditions are impossible to guarantee once any libraries
are used. For example, C code runnng in a different thread could call
`wait()`, which is impossible to detect from Rust code trying to open a
pidfd.

While pid reuse issues should (hopefully) be rare in practice, we can do
better. By passing the `CLONE_PIDFD` flag to `clone()` or `clone3()`, we
can obtain a pidfd for the child process in a guaranteed race-free
manner.

This PR:

This PR adds Linux-specific process extension methods to allow obtaining
pidfds for processes spawned via the standard `Command` API. Other than
being made available to user code, the standard library does not make
use of these pidfds in any way. In particular, the implementation of
`Child::wait` is completely unchanged.

Two Linux-specific helper methods are added: `CommandExt::create_pidfd`
and `ChildExt::pidfd`. These methods are intended to serve as a building
block for libraries to build higher-level abstractions - in particular,
waiting on a process with a timeout.

I've included a basic test, which verifies that pidfds are created iff
the `create_pidfd` method is used. This test is somewhat special - it
should always succeed on systems with the `clone3` system call
available, and always fail on systems without `clone3` available. I'm
not sure how to best ensure this programatically.

This PR relies on the newer `clone3` system call to pass the `CLONE_FD`,
rather than the older `clone` system call. `clone3` was added to Linux
in the same release as pidfds, so this shouldn't unnecessarily limit the
kernel versions that this code supports.

Unresolved questions:
* What should the name of the feature gate be for these newly added
  methods?
* Should the `pidfd` method distinguish between an error occurring
  and `create_pidfd` not being called?

											
										
										
											2020-09-15 23:35:08 -04:00
+								#[cfg(target_os = "linux")]
-												Add PidFd::{kill, wait, try_wait}

											
										
										
											2024-04-18 01:51:06 +02:00
+								mod linux_child_ext {
 								    use crate::io;
 								    use crate::mem;
 								    use crate::os::linux::process as os;
 								    use crate::sys::pal::unix::linux::pidfd as imp;
 								    use crate::sys::pal::unix::ErrorKind;
 								    use crate::sys_common::FromInner;
 								    #[unstable(feature = "linux_pidfd", issue = "82971")]
 								    impl crate::os::linux::process::ChildExt for crate::process::Child {
 								        fn pidfd(&self) -> io::Result<&os::PidFd> {
 								            self.handle
 								                .pidfd
 								                .as_ref()
 								                // SAFETY: The os type is a transparent wrapper, therefore we can transmute references
 								                .map(|fd| unsafe { mem::transmute::<&imp::PidFd, &os::PidFd>(fd) })
 								                .ok_or_else(|| io::Error::new(ErrorKind::Uncategorized, "No pidfd was created."))
 								        }
-												Add PidFd type and seal traits

Improve docs

Split do_fork into two

Make do_fork unsafe

Add target attribute to create_pidfd field in Command

Add method to get create_pidfd value

											
										
										
											2021-02-06 14:15:49 +01:00
-												Add PidFd::{kill, wait, try_wait}

											
										
										
											2024-04-18 01:51:06 +02:00
+								        fn take_pidfd(&mut self) -> io::Result<os::PidFd> {
 								            self.handle
 								                .pidfd
 								                .take()
 								                .map(|fd| <os::PidFd as FromInner<imp::PidFd>>::from_inner(fd))
 								                .ok_or_else(|| io::Error::new(ErrorKind::Uncategorized, "No pidfd was created."))
 								        }
-												Add Linux-specific pidfd process extensions

Background:

Over the last year, pidfd support was added to the Linux kernel. This
allows interacting with other processes. In particular, this allows
waiting on a child process with a timeout in a race-free way, bypassing
all of the awful signal-handler tricks that are usually required.

Pidfds can be obtained for a child process (as well as any other
process) via the `pidfd_open` syscall. Unfortunately, this requires
several conditions to hold in order to be race-free (i.e. the pid is not
reused).
Per `man pidfd_open`:

```
· the disposition of SIGCHLD has not been explicitly set to SIG_IGN
 (see sigaction(2));

· the SA_NOCLDWAIT flag was not specified while establishing a han‐
 dler for SIGCHLD or while setting the disposition of that signal to
 SIG_DFL (see sigaction(2)); and

· the zombie process was not reaped elsewhere in the program (e.g.,
 either by an asynchronously executed signal handler or by wait(2)
 or similar in another thread).

If any of these conditions does not hold, then the child process
(along with a PID file descriptor that refers to it) should instead
be created using clone(2) with the CLONE_PIDFD flag.
```

Sadly, these conditions are impossible to guarantee once any libraries
are used. For example, C code runnng in a different thread could call
`wait()`, which is impossible to detect from Rust code trying to open a
pidfd.

While pid reuse issues should (hopefully) be rare in practice, we can do
better. By passing the `CLONE_PIDFD` flag to `clone()` or `clone3()`, we
can obtain a pidfd for the child process in a guaranteed race-free
manner.

This PR:

This PR adds Linux-specific process extension methods to allow obtaining
pidfds for processes spawned via the standard `Command` API. Other than
being made available to user code, the standard library does not make
use of these pidfds in any way. In particular, the implementation of
`Child::wait` is completely unchanged.

Two Linux-specific helper methods are added: `CommandExt::create_pidfd`
and `ChildExt::pidfd`. These methods are intended to serve as a building
block for libraries to build higher-level abstractions - in particular,
waiting on a process with a timeout.

I've included a basic test, which verifies that pidfds are created iff
the `create_pidfd` method is used. This test is somewhat special - it
should always succeed on systems with the `clone3` system call
available, and always fail on systems without `clone3` available. I'm
not sure how to best ensure this programatically.

This PR relies on the newer `clone3` system call to pass the `CLONE_FD`,
rather than the older `clone` system call. `clone3` was added to Linux
in the same release as pidfds, so this shouldn't unnecessarily limit the
kernel versions that this code supports.

Unresolved questions:
* What should the name of the feature gate be for these newly added
  methods?
* Should the `pidfd` method distinguish between an error occurring
  and `create_pidfd` not being called?

											
										
										
											2020-09-15 23:35:08 -04:00
+								    }
 								}
-												process::unix: Test wait status formatting

Signed-off-by: Ian Jackson <ijackson@chiark.greenend.org.uk>

											
										
										
											2021-02-22 14:58:52 +00:00
+								#[cfg(test)]
 								// The unit tests for this file are kept out of line in `process_unix/tests.rs`.
 								#[path = "process_unix/tests.rs"]
 								mod tests;
-												std: unix process_unsupported: Provide a wait status emulation

Fixes #114593

Needs FCP due to behavioural changes.

											
										
										
											2023-08-22 16:17:02 +01:00
 								// Test-only on Linux: includes `process_unsupported/wait_status.rs` as a module here.
 								// See [`process_unsupported_wait_status::compare_with_linux`].
 								#[cfg(all(test, target_os = "linux"))]
 								#[path = "process_unsupported/wait_status.rs"]
 								mod process_unsupported_wait_status;