From 52317aa8f8553f6f982d6667174149d845cc4158 Mon Sep 17 00:00:00 2001 From: Eric Huss Date: Fri, 10 Mar 2023 14:27:50 -0800 Subject: [PATCH 1/6] Add some tests for simulating behavior under rustup. --- tests/testsuite/main.rs | 1 + tests/testsuite/rustup.rs | 264 ++++++++++++++++++++++++++++++++++++++ 2 files changed, 265 insertions(+) create mode 100644 tests/testsuite/rustup.rs diff --git a/tests/testsuite/main.rs b/tests/testsuite/main.rs index 9afb3945940..efc31f4933e 100644 --- a/tests/testsuite/main.rs +++ b/tests/testsuite/main.rs @@ -120,6 +120,7 @@ mod rustdoc; mod rustdoc_extern_html; mod rustdocflags; mod rustflags; +mod rustup; mod search; mod shell_quoting; mod source_replacement; diff --git a/tests/testsuite/rustup.rs b/tests/testsuite/rustup.rs new file mode 100644 index 00000000000..4a4c3a727a8 --- /dev/null +++ b/tests/testsuite/rustup.rs @@ -0,0 +1,264 @@ +//! Tests for Cargo's behavior under Rustup. + +use cargo_test_support::paths::{home, root, CargoPathExt}; +use cargo_test_support::{cargo_process, process, project}; +use std::env; +use std::env::consts::EXE_EXTENSION; +use std::ffi::OsString; +use std::fs; +use std::path::{Path, PathBuf}; + +/// Helper to generate an executable. +fn make_exe(dest: &Path, name: &str, contents: &str, env: &[(&str, PathBuf)]) -> PathBuf { + let rs_name = format!("{name}.rs"); + fs::write( + root().join(&rs_name), + &format!("fn main() {{ {contents} }}"), + ) + .unwrap(); + let mut pb = process("rustc"); + env.iter().for_each(|(key, value)| { + pb.env(key, value); + }); + pb.arg("--edition=2021") + .arg(root().join(&rs_name)) + .exec() + .unwrap(); + let exe = Path::new(name).with_extension(EXE_EXTENSION); + let output = dest.join(&exe); + fs::rename(root().join(&exe), &output).unwrap(); + output +} + +fn prepend_path(path: &Path) -> OsString { + let mut paths = vec![path.to_path_buf()]; + paths.extend(env::split_paths(&env::var_os("PATH").unwrap_or_default())); + env::join_paths(paths).unwrap() +} + +struct RustupEnvironment { + /// Path for ~/.cargo/bin + cargo_bin: PathBuf, + /// Path for ~/.rustup + rustup_home: PathBuf, + /// Path to the cargo executable in the toolchain directory + /// (~/.rustup/toolchain/test-toolchain/bin/cargo.exe). + cargo_toolchain_exe: PathBuf, +} + +/// Creates an executable which prints a message and then runs the *real* rustc. +fn real_rustc_wrapper(bin_dir: &Path, message: &str) -> PathBuf { + let real_rustc = cargo_util::paths::resolve_executable("rustc".as_ref()).unwrap(); + // The toolchain rustc needs to call the real rustc. In order to do that, + // it needs to restore or clear the RUSTUP environment variables so that + // if rustup is installed, it will call the correct rustc. + let rustup_toolchain_setup = match std::env::var_os("RUSTUP_TOOLCHAIN") { + Some(t) => format!( + ".env(\"RUSTUP_TOOLCHAIN\", \"{}\")", + t.into_string().unwrap() + ), + None => format!(".env_remove(\"RUSTUP_TOOLCHAIN\")"), + }; + let mut env = vec![("CARGO_RUSTUP_TEST_real_rustc", real_rustc)]; + let rustup_home_setup = match std::env::var_os("RUSTUP_HOME") { + Some(h) => { + env.push(("CARGO_RUSTUP_TEST_RUSTUP_HOME", h.into())); + format!(".env(\"RUSTUP_HOME\", env!(\"CARGO_RUSTUP_TEST_RUSTUP_HOME\"))") + } + None => format!(".env_remove(\"RUSTUP_HOME\")"), + }; + make_exe( + bin_dir, + "rustc", + &format!( + r#" + eprintln!("{message}"); + let r = std::process::Command::new(env!("CARGO_RUSTUP_TEST_real_rustc")) + .args(std::env::args_os().skip(1)) + {rustup_toolchain_setup} + {rustup_home_setup} + .status(); + std::process::exit(r.unwrap().code().unwrap_or(2)); + "# + ), + &env, + ) +} + +/// Creates a simulation of a rustup environment with `~/.cargo/bin` and +/// `~/.rustup` directories populated with some executables that simulate +/// rustup. +fn simulated_rustup_environment() -> RustupEnvironment { + // Set up ~/.rustup/toolchains/test-toolchain/bin with a custom rustc and cargo. + let rustup_home = home().join(".rustup"); + let toolchain_bin = rustup_home + .join("toolchains") + .join("test-toolchain") + .join("bin"); + toolchain_bin.mkdir_p(); + let rustc_toolchain_exe = real_rustc_wrapper(&toolchain_bin, "real rustc running"); + let cargo_toolchain_exe = make_exe( + &toolchain_bin, + "cargo", + r#"panic!("cargo toolchain should not be called");"#, + &[], + ); + + // Set up ~/.cargo/bin with a typical set of rustup proxies. + let cargo_bin = home().join(".cargo").join("bin"); + cargo_bin.mkdir_p(); + + let rustc_proxy = make_exe( + &cargo_bin, + "rustc", + &format!( + r#" + match std::env::args().next().unwrap().as_ref() {{ + "rustc" => {{}} + arg => panic!("proxy only supports rustc, got {{arg:?}}"), + }} + eprintln!("rustc proxy running"); + let r = std::process::Command::new(env!("CARGO_RUSTUP_TEST_rustc_toolchain_exe")) + .args(std::env::args_os().skip(1)) + .status(); + std::process::exit(r.unwrap().code().unwrap_or(2)); + "# + ), + &[("CARGO_RUSTUP_TEST_rustc_toolchain_exe", rustc_toolchain_exe)], + ); + fs::hard_link( + &rustc_proxy, + cargo_bin.join("cargo").with_extension(EXE_EXTENSION), + ) + .unwrap(); + fs::hard_link( + &rustc_proxy, + cargo_bin.join("rustup").with_extension(EXE_EXTENSION), + ) + .unwrap(); + + RustupEnvironment { + cargo_bin, + rustup_home, + cargo_toolchain_exe, + } +} + +#[cargo_test] +fn typical_rustup() { + // Test behavior under a typical rustup setup with a normal toolchain. + let RustupEnvironment { + cargo_bin, + rustup_home, + cargo_toolchain_exe, + } = simulated_rustup_environment(); + + // Set up a project and run a normal cargo build. + let p = project().file("src/lib.rs", "").build(); + // The path is modified so that cargo will call `rustc` from + // `~/.cargo/bin/rustc to use our custom rustup proxies. + let path = prepend_path(&cargo_bin); + p.cargo("check") + .env("RUSTUP_TOOLCHAIN", "test-toolchain") + .env("RUSTUP_HOME", &rustup_home) + .env("PATH", &path) + .with_stderr( + "\ +[CHECKING] foo v0.0.1 [..] +rustc proxy running +real rustc running +[FINISHED] [..] +", + ) + .run(); + + // Do a similar test, but with a toolchain link that does not have cargo + // (which normally would do a fallback to nightly/beta/stable). + cargo_toolchain_exe.rm_rf(); + p.build_dir().rm_rf(); + + p.cargo("check") + .env("RUSTUP_TOOLCHAIN", "test-toolchain") + .env("RUSTUP_HOME", &rustup_home) + .env("PATH", &path) + .with_stderr( + "\ +[CHECKING] foo v0.0.1 [..] +rustc proxy running +real rustc running +[FINISHED] [..] +", + ) + .run(); +} + +// This doesn't work on Windows because Cargo forces the PATH to contain the +// sysroot_libdir, which is actually `bin`, preventing the test from +// overriding the bin directory. +#[cargo_test(ignore_windows = "PATH can't be overridden on Windows")] +fn custom_calls_other_cargo() { + // Test behavior when a custom subcommand tries to manipulate PATH to use + // a different toolchain. + let RustupEnvironment { + cargo_bin, + rustup_home, + cargo_toolchain_exe: _, + } = simulated_rustup_environment(); + + // Create a directory with a custom toolchain (outside of the rustup universe). + let custom_bin = root().join("custom-bin"); + custom_bin.mkdir_p(); + // `cargo` points to the real cargo. + let cargo_exe = cargo_test_support::cargo_exe(); + fs::hard_link(&cargo_exe, custom_bin.join(cargo_exe.file_name().unwrap())).unwrap(); + // `rustc` executes the real rustc. + real_rustc_wrapper(&custom_bin, "custom toolchain rustc running"); + + // A project that cargo-custom will try to build. + let p = project().file("src/lib.rs", "").build(); + + // Create a custom cargo subcommand. + // This will modify PATH to a custom toolchain and call cargo from that. + make_exe( + &cargo_bin, + "cargo-custom", + r#" + use std::env; + use std::process::Command; + + eprintln!("custom command running"); + + let mut paths = vec![std::path::PathBuf::from(env!("CARGO_RUSTUP_TEST_custom_bin"))]; + paths.extend(env::split_paths(&env::var_os("PATH").unwrap_or_default())); + let path = env::join_paths(paths).unwrap(); + + let status = Command::new("cargo") + .arg("check") + .current_dir(env!("CARGO_RUSTUP_TEST_project_dir")) + .env("PATH", path) + .status() + .unwrap(); + assert!(status.success()); + "#, + &[ + ("CARGO_RUSTUP_TEST_custom_bin", custom_bin), + ("CARGO_RUSTUP_TEST_project_dir", p.root()), + ], + ); + + cargo_process("custom") + // Set these to simulate what would happen when running under rustup. + // We want to make sure that cargo-custom does not try to use the + // rustup proxies. + .env("RUSTUP_TOOLCHAIN", "test-toolchain") + .env("RUSTUP_HOME", &rustup_home) + .with_stderr( + "\ +custom command running +[CHECKING] foo [..] +custom toolchain rustc running +[FINISHED] [..] +", + ) + .run(); +} From d4b0b494f19fb6846f8fc7d0e9ba9f0c160de8d8 Mon Sep 17 00:00:00 2001 From: Eric Huss Date: Fri, 10 Mar 2023 16:04:06 -0800 Subject: [PATCH 2/6] Add an optimization when running under rustup. --- src/cargo/util/config/mod.rs | 42 ++++++++++++++++++++++++++++++++++++ tests/testsuite/rustup.rs | 2 -- 2 files changed, 42 insertions(+), 2 deletions(-) diff --git a/src/cargo/util/config/mod.rs b/src/cargo/util/config/mod.rs index dad7e9c727b..89a3aa632d6 100644 --- a/src/cargo/util/config/mod.rs +++ b/src/cargo/util/config/mod.rs @@ -1644,6 +1644,48 @@ impl Config { /// as a path. fn get_tool(&self, tool: &str, from_config: &Option) -> PathBuf { self.maybe_get_tool(tool, from_config) + .or_else(|| { + // This is an optimization to circumvent the rustup proxies + // which can have a significant performance hit. The goal here + // is to determine if calling `rustc` from PATH would end up + // calling the proxies. + // + // This is somewhat cautious trying to determine if it is safe + // to circumvent rustup, because there are some situations + // where users may do things like modify PATH, call cargo + // directly, use a custom rustup toolchain link without a + // cargo executable, etc. However, there is still some risk + // this may make the wrong decision in unusual circumstances. + // + // First, we must be running under rustup in the first place. + let toolchain = self.get_env_os("RUSTUP_TOOLCHAIN")?; + // If the tool on PATH is the same as `rustup` on path, then + // there is pretty good evidence that it will be a proxy. + let tool_resolved = paths::resolve_executable(Path::new(tool)).ok()?; + let rustup_resolved = paths::resolve_executable(Path::new("rustup")).ok()?; + let tool_meta = tool_resolved.metadata().ok()?; + let rustup_meta = rustup_resolved.metadata().ok()?; + // This works on the assumption that rustup and its proxies + // use hard links to a single binary. If rustup ever changes + // that setup, then I think the worst consequence is that this + // optimization will not work, and it will take the slow path. + if tool_meta.len() != rustup_meta.len() { + return None; + } + // Try to find the tool in rustup's toolchain directory. + let tool_exe = Path::new(tool).with_extension(env::consts::EXE_EXTENSION); + let toolchain_exe = home::rustup_home() + .ok()? + .join("toolchains") + .join(&toolchain) + .join("bin") + .join(&tool_exe); + if toolchain_exe.exists() { + Some(toolchain_exe) + } else { + None + } + }) .unwrap_or_else(|| PathBuf::from(tool)) } diff --git a/tests/testsuite/rustup.rs b/tests/testsuite/rustup.rs index 4a4c3a727a8..aa93f546c54 100644 --- a/tests/testsuite/rustup.rs +++ b/tests/testsuite/rustup.rs @@ -165,7 +165,6 @@ fn typical_rustup() { .with_stderr( "\ [CHECKING] foo v0.0.1 [..] -rustc proxy running real rustc running [FINISHED] [..] ", @@ -184,7 +183,6 @@ real rustc running .with_stderr( "\ [CHECKING] foo v0.0.1 [..] -rustc proxy running real rustc running [FINISHED] [..] ", From cdf60e359469449e839a14781a88452deef40c88 Mon Sep 17 00:00:00 2001 From: Eric Huss Date: Sat, 8 Apr 2023 10:50:03 -0700 Subject: [PATCH 3/6] Add an assert to confirm that this function is only used with proxies. --- src/cargo/util/config/mod.rs | 5 +++++ 1 file changed, 5 insertions(+) diff --git a/src/cargo/util/config/mod.rs b/src/cargo/util/config/mod.rs index 89a3aa632d6..11c7d1a900d 100644 --- a/src/cargo/util/config/mod.rs +++ b/src/cargo/util/config/mod.rs @@ -1643,6 +1643,11 @@ impl Config { /// Looks for a path for `tool` in an environment variable or config path, defaulting to `tool` /// as a path. fn get_tool(&self, tool: &str, from_config: &Option) -> PathBuf { + // This function is designed to only work with rustup proxies. This + // assert is to ensure that if it is ever used for something else in + // the future that you must ensure that it is a proxy-able tool, or if + // not then you need to use `maybe_get_tool` instead. + assert!(matches!(tool, "rustc" | "rustdoc")); self.maybe_get_tool(tool, from_config) .or_else(|| { // This is an optimization to circumvent the rustup proxies From 42ef94f38405cf1c4301bdac1d9291eda691c82f Mon Sep 17 00:00:00 2001 From: Eric Huss Date: Sat, 8 Apr 2023 10:54:43 -0700 Subject: [PATCH 4/6] Check for toolchains names with slashes and use the slow path in that case. --- src/cargo/util/config/mod.rs | 5 +++++ 1 file changed, 5 insertions(+) diff --git a/src/cargo/util/config/mod.rs b/src/cargo/util/config/mod.rs index 11c7d1a900d..0a79e485e06 100644 --- a/src/cargo/util/config/mod.rs +++ b/src/cargo/util/config/mod.rs @@ -1664,6 +1664,11 @@ impl Config { // // First, we must be running under rustup in the first place. let toolchain = self.get_env_os("RUSTUP_TOOLCHAIN")?; + // This currently does not support toolchain paths. + // This also enforces UTF-8. + if toolchain.to_str()?.contains(&['/', '\\']) { + return None; + } // If the tool on PATH is the same as `rustup` on path, then // there is pretty good evidence that it will be a proxy. let tool_resolved = paths::resolve_executable(Path::new(tool)).ok()?; From 4f79ac3aa875f15c84a0ca3a02e9c474f7f28aa9 Mon Sep 17 00:00:00 2001 From: Eric Huss Date: Wed, 3 May 2023 14:07:53 -0700 Subject: [PATCH 5/6] Change `get_tool` to use an enum to constrain which values it accepts. --- src/cargo/util/config/mod.rs | 46 +++++++++++++++++++++++++----------- 1 file changed, 32 insertions(+), 14 deletions(-) diff --git a/src/cargo/util/config/mod.rs b/src/cargo/util/config/mod.rs index 0a79e485e06..d841bc558ee 100644 --- a/src/cargo/util/config/mod.rs +++ b/src/cargo/util/config/mod.rs @@ -388,7 +388,7 @@ impl Config { /// Gets the path to the `rustdoc` executable. pub fn rustdoc(&self) -> CargoResult<&Path> { self.rustdoc - .try_borrow_with(|| Ok(self.get_tool("rustdoc", &self.build_config()?.rustdoc))) + .try_borrow_with(|| Ok(self.get_tool(Tool::Rustdoc, &self.build_config()?.rustdoc))) .map(AsRef::as_ref) } @@ -406,7 +406,7 @@ impl Config { ); Rustc::new( - self.get_tool("rustc", &self.build_config()?.rustc), + self.get_tool(Tool::Rustc, &self.build_config()?.rustc), wrapper, rustc_workspace_wrapper, &self @@ -1640,15 +1640,19 @@ impl Config { } } - /// Looks for a path for `tool` in an environment variable or config path, defaulting to `tool` - /// as a path. - fn get_tool(&self, tool: &str, from_config: &Option) -> PathBuf { - // This function is designed to only work with rustup proxies. This - // assert is to ensure that if it is ever used for something else in - // the future that you must ensure that it is a proxy-able tool, or if - // not then you need to use `maybe_get_tool` instead. - assert!(matches!(tool, "rustc" | "rustdoc")); - self.maybe_get_tool(tool, from_config) + /// Returns the path for the given tool. + /// + /// This will look for the tool in the following order: + /// + /// 1. From an environment variable matching the tool name (such as `RUSTC`). + /// 2. From the given config value (which is usually something like `build.rustc`). + /// 3. Finds the tool in the PATH environment variable. + /// + /// This is intended for tools that are rustup proxies. If you need to get + /// a tool that is not a rustup proxy, use `maybe_get_tool` instead. + fn get_tool(&self, tool: Tool, from_config: &Option) -> PathBuf { + let tool_str = tool.as_str(); + self.maybe_get_tool(tool_str, from_config) .or_else(|| { // This is an optimization to circumvent the rustup proxies // which can have a significant performance hit. The goal here @@ -1671,7 +1675,7 @@ impl Config { } // If the tool on PATH is the same as `rustup` on path, then // there is pretty good evidence that it will be a proxy. - let tool_resolved = paths::resolve_executable(Path::new(tool)).ok()?; + let tool_resolved = paths::resolve_executable(Path::new(tool_str)).ok()?; let rustup_resolved = paths::resolve_executable(Path::new("rustup")).ok()?; let tool_meta = tool_resolved.metadata().ok()?; let rustup_meta = rustup_resolved.metadata().ok()?; @@ -1683,7 +1687,7 @@ impl Config { return None; } // Try to find the tool in rustup's toolchain directory. - let tool_exe = Path::new(tool).with_extension(env::consts::EXE_EXTENSION); + let tool_exe = Path::new(tool_str).with_extension(env::consts::EXE_EXTENSION); let toolchain_exe = home::rustup_home() .ok()? .join("toolchains") @@ -1696,7 +1700,7 @@ impl Config { None } }) - .unwrap_or_else(|| PathBuf::from(tool)) + .unwrap_or_else(|| PathBuf::from(tool_str)) } pub fn jobserver_from_env(&self) -> Option<&jobserver::Client> { @@ -2697,3 +2701,17 @@ macro_rules! drop_eprint { $crate::__shell_print!($config, err, false, $($arg)*) ); } + +enum Tool { + Rustc, + Rustdoc, +} + +impl Tool { + fn as_str(&self) -> &str { + match self { + Tool::Rustc => "rustc", + Tool::Rustdoc => "rustdoc", + } + } +} From b9993bdc904e41aca94b54c8d7c14d6ad3de188e Mon Sep 17 00:00:00 2001 From: Eric Huss Date: Wed, 3 May 2023 14:09:28 -0700 Subject: [PATCH 6/6] Switch to then_some. --- src/cargo/util/config/mod.rs | 6 +----- 1 file changed, 1 insertion(+), 5 deletions(-) diff --git a/src/cargo/util/config/mod.rs b/src/cargo/util/config/mod.rs index d841bc558ee..40102a62fc3 100644 --- a/src/cargo/util/config/mod.rs +++ b/src/cargo/util/config/mod.rs @@ -1694,11 +1694,7 @@ impl Config { .join(&toolchain) .join("bin") .join(&tool_exe); - if toolchain_exe.exists() { - Some(toolchain_exe) - } else { - None - } + toolchain_exe.exists().then_some(toolchain_exe) }) .unwrap_or_else(|| PathBuf::from(tool_str)) }