From 5b1af3901927743ab63aa9d31d47a345c76500bf Mon Sep 17 00:00:00 2001
From: Brian Bowman <seeker14491@gmail.com>
Date: Wed, 29 Aug 2018 20:56:09 -0500
Subject: [PATCH] Fix Windows job management

Fixes #1493
---
 src/rustup-cli/job.rs         | 187 ++++++----------------------------
 src/rustup-cli/proxy_mode.rs  |  65 ++++++------
 src/rustup-cli/rustup_mode.rs |  10 +-
 src/rustup-utils/src/utils.rs |   2 +
 src/rustup/command.rs         |  16 +--
 5 files changed, 82 insertions(+), 198 deletions(-)
diff --git a/src/rustup-cli/job.rs b/src/rustup-cli/job.rs
index 5dd590daf4..34c56d591c 100644
--- a/src/rustup-cli/job.rs
+++ b/src/rustup-cli/job.rs
@@ -25,6 +25,9 @@ pub fn setup() -> Option<Setup> {
 
 #[cfg(unix)]
 mod imp {
+    use std::env;
+    use libc;
+
     pub type Setup = ();
 
     pub unsafe fn setup() -> Option<()> {
@@ -36,19 +39,23 @@ mod imp {
 mod imp {
     extern crate winapi;
 
-    use std::ffi::OsString;
     use std::io;
     use std::mem;
-    use std::os::windows::prelude::*;
-    use winapi::shared::*;
-    use winapi::um::*;
+    use std::ptr;
+
+    use self::winapi::shared::minwindef::*;
+    use self::winapi::um::handleapi::*;
+    use self::winapi::um::jobapi2::*;
+    use self::winapi::um::processthreadsapi::*;
+    use self::winapi::um::winnt::*;
+    use self::winapi::um::winnt::HANDLE;
 
     pub struct Setup {
         job: Handle,
     }
 
     pub struct Handle {
-        inner: ntdef::HANDLE,
+        inner: HANDLE,
     }
 
     fn last_err() -> io::Error {
@@ -65,7 +72,7 @@ mod imp {
         // use job objects, so we instead just ignore errors and assume that
         // we're otherwise part of someone else's job object in this case.
 
-        let job = jobapi2::CreateJobObjectW(0 as *mut _, 0 as *const _);
+        let job = CreateJobObjectW(ptr::null_mut(), ptr::null());
         if job.is_null() {
             return None;
         }
@@ -73,16 +80,16 @@ mod imp {
 
         // Indicate that when all handles to the job object are gone that all
         // process in the object should be killed. Note that this includes our
-        // entire process tree by default because we've added ourselves and and
+        // entire process tree by default because we've added ourselves and
         // our children will reside in the job once we spawn a process.
-        let mut info: winnt::JOBOBJECT_EXTENDED_LIMIT_INFORMATION;
+        let mut info: JOBOBJECT_EXTENDED_LIMIT_INFORMATION;
         info = mem::zeroed();
-        info.BasicLimitInformation.LimitFlags = winnt::JOB_OBJECT_LIMIT_KILL_ON_JOB_CLOSE;
-        let r = jobapi2::SetInformationJobObject(
+        info.BasicLimitInformation.LimitFlags = JOB_OBJECT_LIMIT_KILL_ON_JOB_CLOSE;
+        let r = SetInformationJobObject(
             job.inner,
-            winnt::JobObjectExtendedLimitInformation,
-            &mut info as *mut _ as minwindef::LPVOID,
-            mem::size_of_val(&info) as minwindef::DWORD,
+            JobObjectExtendedLimitInformation,
+            &mut info as *mut _ as LPVOID,
+            mem::size_of_val(&info) as DWORD,
         );
         if r == 0 {
             return None;
@@ -90,42 +97,28 @@ mod imp {
 
         // Assign our process to this job object, meaning that our children will
         // now live or die based on our existence.
-        let me = processthreadsapi::GetCurrentProcess();
-        let r = jobapi2::AssignProcessToJobObject(job.inner, me);
+        let me = GetCurrentProcess();
+        let r = AssignProcessToJobObject(job.inner, me);
         if r == 0 {
             return None;
         }
 
-        Some(Setup { job: job })
+        Some(Setup { job })
     }
 
     impl Drop for Setup {
         fn drop(&mut self) {
-            // This is a litte subtle. By default if we are terminated then all
-            // processes in our job object are terminated as well, but we
-            // intentionally want to whitelist some processes to outlive our job
-            // object (see below).
-            //
-            // To allow for this, we manually kill processes instead of letting
-            // the job object kill them for us. We do this in a loop to handle
-            // processes spawning other processes.
-            //
-            // Finally once this is all done we know that the only remaining
-            // ones are ourselves and the whitelisted processes. The destructor
-            // here then configures our job object to *not* kill everything on
-            // close, then closes the job object.
+            // On normal exits (not ctrl-c), we don't want to kill any child
+            // processes. The destructor here configures our job object to
+            // *not* kill everything on close, then closes the job object.
             unsafe {
-                while self.kill_remaining() {
-                    info!("killed some, going for more");
-                }
-
-                let mut info: winnt::JOBOBJECT_EXTENDED_LIMIT_INFORMATION;
+                let mut info: JOBOBJECT_EXTENDED_LIMIT_INFORMATION;
                 info = mem::zeroed();
-                let r = jobapi2::SetInformationJobObject(
+                let r = SetInformationJobObject(
                     self.job.inner,
-                    winnt::JobObjectExtendedLimitInformation,
-                    &mut info as *mut _ as minwindef::LPVOID,
-                    mem::size_of_val(&info) as minwindef::DWORD,
+                    JobObjectExtendedLimitInformation,
+                    &mut info as *mut _ as LPVOID,
+                    mem::size_of_val(&info) as DWORD,
                 );
                 if r == 0 {
                     info!("failed to configure job object to defaults: {}", last_err());
@@ -134,126 +127,10 @@ mod imp {
         }
     }
 
-    impl Setup {
-        unsafe fn kill_remaining(&mut self) -> bool {
-            #[repr(C)]
-            struct Jobs {
-                header: winnt::JOBOBJECT_BASIC_PROCESS_ID_LIST,
-                list: [basetsd::ULONG_PTR; 1024],
-            }
-
-            let mut jobs: Jobs = mem::zeroed();
-            let r = jobapi2::QueryInformationJobObject(
-                self.job.inner,
-                winnt::JobObjectBasicProcessIdList,
-                &mut jobs as *mut _ as minwindef::LPVOID,
-                mem::size_of_val(&jobs) as minwindef::DWORD,
-                0 as *mut _,
-            );
-            if r == 0 {
-                info!("failed to query job object: {}", last_err());
-                return false;
-            }
-
-            let mut killed = false;
-            let list = &jobs.list[..jobs.header.NumberOfProcessIdsInList as usize];
-            assert!(list.len() > 0);
-
-            let list = list.iter()
-                .filter(|&&id| {
-                    // let's not kill ourselves
-                    id as minwindef::DWORD != processthreadsapi::GetCurrentProcessId()
-                })
-                .filter_map(|&id| {
-                    // Open the process with the necessary rights, and if this
-                    // fails then we probably raced with the process exiting so we
-                    // ignore the problem.
-                    let flags = winnt::PROCESS_QUERY_INFORMATION | winnt::PROCESS_TERMINATE
-                        | winnt::SYNCHRONIZE;
-                    let p = processthreadsapi::OpenProcess(
-                        flags,
-                        minwindef::FALSE,
-                        id as minwindef::DWORD,
-                    );
-                    if p.is_null() {
-                        None
-                    } else {
-                        Some(Handle { inner: p })
-                    }
-                })
-                .filter(|p| {
-                    // Test if this process was actually in the job object or not.
-                    // If it's not then we likely raced with something else
-                    // recycling this PID, so we just skip this step.
-                    let mut res = 0;
-                    let r = jobapi::IsProcessInJob(p.inner, self.job.inner, &mut res);
-                    if r == 0 {
-                        info!("failed to test is process in job: {}", last_err());
-                        return false;
-                    }
-                    res == minwindef::TRUE
-                });
-
-            for p in list {
-                // Load the file which this process was spawned from. We then
-                // later use this for identification purposes.
-                let mut buf = [0; 1024];
-                let r = psapi::GetProcessImageFileNameW(
-                    p.inner,
-                    buf.as_mut_ptr(),
-                    buf.len() as minwindef::DWORD,
-                );
-                if r == 0 {
-                    info!("failed to get image name: {}", last_err());
-                    continue;
-                }
-                let s = OsString::from_wide(&buf[..r as usize]);
-                info!("found remaining: {:?}", s);
-
-                // And here's where we find the whole purpose for this
-                // function!  Currently, our only whitelisted process is
-                // `mspdbsrv.exe`, and more details about that can be found
-                // here:
-                //
-                //      https://github.com/rust-lang/rust/issues/33145
-                //
-                // The gist of it is that all builds on one machine use the
-                // same `mspdbsrv.exe` instance. If we were to kill this
-                // instance then we could erroneously cause other builds to
-                // fail.
-                if let Some(s) = s.to_str() {
-                    if s.contains("mspdbsrv") {
-                        info!("\toops, this is mspdbsrv");
-                        continue;
-                    }
-                }
-
-                // Ok, this isn't mspdbsrv, let's kill the process. After we
-                // kill it we wait on it to ensure that the next time around in
-                // this function we're not going to see it again.
-                let r = processthreadsapi::TerminateProcess(p.inner, 1);
-                if r == 0 {
-                    info!("\tfailed to kill subprocess: {}", last_err());
-                    info!("\tassuming subprocess is dead...");
-                } else {
-                    info!("\tterminated subprocess");
-                }
-                let r = synchapi::WaitForSingleObject(p.inner, winbase::INFINITE);
-                if r != 0 {
-                    info!("failed to wait for process to die: {}", last_err());
-                    return false;
-                }
-                killed = true;
-            }
-
-            return killed;
-        }
-    }
-
     impl Drop for Handle {
         fn drop(&mut self) {
             unsafe {
-                handleapi::CloseHandle(self.inner);
+                CloseHandle(self.inner);
             }
         }
     }
diff --git a/src/rustup-cli/proxy_mode.rs b/src/rustup-cli/proxy_mode.rs
index 9b9c174b52..fa60752c31 100644
--- a/src/rustup-cli/proxy_mode.rs
+++ b/src/rustup-cli/proxy_mode.rs
@@ -1,51 +1,54 @@
 use common::set_globals;
 use rustup::Cfg;
 use errors::*;
-use rustup_utils::utils;
+use rustup_utils::utils::{self, ExitCode};
 use rustup::command::run_command_for_dir;
 use std::env;
 use std::ffi::OsString;
 use std::path::PathBuf;
+use std::process;
 use job;
 
 pub fn main() -> Result<()> {
     ::self_update::cleanup_self_updater()?;
 
-    let _setup = job::setup();
-
-    let mut args = env::args();
-
-    let arg0 = args.next().map(PathBuf::from);
-    let arg0 = arg0.as_ref()
-        .and_then(|a| a.file_name())
-        .and_then(|a| a.to_str());
-    let ref arg0 = arg0.ok_or(ErrorKind::NoExeName)?;
-
-    // Check for a toolchain specifier.
-    let arg1 = args.next();
-    let toolchain = arg1.as_ref().and_then(|arg1| {
-        if arg1.starts_with('+') {
-            Some(&arg1[1..])
+    let ExitCode(c) = {
+        let _setup = job::setup();
+
+        let mut args = env::args();
+
+        let arg0 = args.next().map(PathBuf::from);
+        let arg0 = arg0.as_ref()
+            .and_then(|a| a.file_name())
+            .and_then(|a| a.to_str());
+        let ref arg0 = arg0.ok_or(ErrorKind::NoExeName)?;
+
+        // Check for a toolchain specifier.
+        let arg1 = args.next();
+        let toolchain = arg1.as_ref().and_then(|arg1| {
+            if arg1.starts_with('+') {
+                Some(&arg1[1..])
+            } else {
+                None
+            }
+        });
+
+        // Build command args now while we know whether or not to skip arg 1.
+        let cmd_args: Vec<_> = if toolchain.is_none() {
+            env::args_os().skip(1).collect()
         } else {
-            None
-        }
-    });
-
-    // Build command args now while we know whether or not to skip arg 1.
-    let cmd_args: Vec<_> = if toolchain.is_none() {
-        env::args_os().skip(1).collect()
-    } else {
-        env::args_os().skip(2).collect()
-    };
+            env::args_os().skip(2).collect()
+        };
 
-    let cfg = set_globals(false)?;
-    cfg.check_metadata_version()?;
-    direct_proxy(&cfg, arg0, toolchain, &cmd_args)?;
+        let cfg = set_globals(false)?;
+        cfg.check_metadata_version()?;
+        direct_proxy(&cfg, arg0, toolchain, &cmd_args)?
+    };
 
-    Ok(())
+    process::exit(c)
 }
 
-fn direct_proxy(cfg: &Cfg, arg0: &str, toolchain: Option<&str>, args: &[OsString]) -> Result<()> {
+fn direct_proxy(cfg: &Cfg, arg0: &str, toolchain: Option<&str>, args: &[OsString]) -> Result<ExitCode> {
     let cmd = match toolchain {
         None => cfg.create_command_for_dir(&utils::current_dir()?, arg0)?,
         Some(tc) => cfg.create_command_for_toolchain(tc, false, arg0)?,
diff --git a/src/rustup-cli/rustup_mode.rs b/src/rustup-cli/rustup_mode.rs
index 58897395f8..28737879bf 100644
--- a/src/rustup-cli/rustup_mode.rs
+++ b/src/rustup-cli/rustup_mode.rs
@@ -5,10 +5,10 @@ use rustup::settings::TelemetryMode;
 use errors::*;
 use rustup_dist::manifest::Component;
 use rustup_dist::dist::{PartialTargetTriple, PartialToolchainDesc, TargetTriple};
-use rustup_utils::utils;
+use rustup_utils::utils::{self, ExitCode};
 use self_update;
 use std::path::Path;
-use std::process::Command;
+use std::process::{self, Command};
 use std::iter;
 use std::error::Error;
 use term2;
@@ -606,12 +606,14 @@ fn run(cfg: &Cfg, m: &ArgMatches) -> Result<()> {
     let args: Vec<_> = args.collect();
     let cmd = cfg.create_command_for_toolchain(toolchain, m.is_present("install"), args[0])?;
 
-    Ok(command::run_command_for_dir(
+    let ExitCode(c) = command::run_command_for_dir(
         cmd,
         args[0],
         &args[1..],
         &cfg,
-    )?)
+    )?;
+
+    process::exit(c)
 }
 
 fn which(cfg: &Cfg, m: &ArgMatches) -> Result<()> {
diff --git a/src/rustup-utils/src/utils.rs b/src/rustup-utils/src/utils.rs
index 7996e40db0..af3d4eae14 100644
--- a/src/rustup-utils/src/utils.rs
+++ b/src/rustup-utils/src/utils.rs
@@ -19,6 +19,8 @@ use url::Url;
 pub use raw::{find_cmd, has_cmd, if_not_empty, is_directory, is_file, path_exists, prefix_arg,
               random_string};
 
+pub struct ExitCode(pub i32);
+
 pub fn ensure_dir_exists(
     name: &'static str,
     path: &Path,
diff --git a/src/rustup/command.rs b/src/rustup/command.rs
index 853ecf14ba..136cdab108 100644
--- a/src/rustup/command.rs
+++ b/src/rustup/command.rs
@@ -9,7 +9,7 @@ use tempfile::tempfile;
 use Cfg;
 use errors::*;
 use notifications::*;
-use rustup_utils;
+use rustup_utils::{self, utils::ExitCode};
 use telemetry::{Telemetry, TelemetryEvent};
 
 pub fn run_command_for_dir<S: AsRef<OsStr>>(
@@ -17,7 +17,7 @@ pub fn run_command_for_dir<S: AsRef<OsStr>>(
     arg0: &str,
     args: &[S],
     cfg: &Cfg,
-) -> Result<()> {
+) -> Result<ExitCode> {
     if (arg0 == "rustc" || arg0 == "rustc.exe") && cfg.telemetry_enabled()? {
         return telemetry_rustc(cmd, arg0, args, cfg);
     }
@@ -30,7 +30,7 @@ fn telemetry_rustc<S: AsRef<OsStr>>(
     arg0: &str,
     args: &[S],
     cfg: &Cfg,
-) -> Result<()> {
+) -> Result<ExitCode> {
     #[cfg(unix)]
     fn file_as_stdio(file: &File) -> Stdio {
         use std::os::unix::io::{AsRawFd, FromRawFd};
@@ -127,7 +127,7 @@ fn telemetry_rustc<S: AsRef<OsStr>>(
                 (cfg.notify_handler)(Notification::TelemetryCleanupError(&xe));
             });
 
-            process::exit(exit_code);
+            Ok(ExitCode(exit_code))
         }
         Err(e) => {
             let exit_code = e.raw_os_error().unwrap_or(1);
@@ -152,7 +152,7 @@ fn exec_command_for_dir_without_telemetry<S: AsRef<OsStr>>(
     mut cmd: Command,
     arg0: &str,
     args: &[S],
-) -> Result<()> {
+) -> Result<ExitCode> {
     cmd.args(args);
 
     // FIXME rust-lang/rust#32254. It's not clear to me
@@ -164,15 +164,15 @@ fn exec_command_for_dir_without_telemetry<S: AsRef<OsStr>>(
     });
 
     #[cfg(unix)]
-    fn exec(cmd: &mut Command) -> io::Result<()> {
+    fn exec(cmd: &mut Command) -> io::Result<ExitCode> {
         use std::os::unix::prelude::*;
         Err(cmd.exec())
     }
 
     #[cfg(windows)]
-    fn exec(cmd: &mut Command) -> io::Result<()> {
+    fn exec(cmd: &mut Command) -> io::Result<ExitCode> {
         let status = cmd.status()?;
-        process::exit(status.code().unwrap());
+        Ok(ExitCode(status.code().unwrap()))
     }
 }