From 60d4783c4e0d4d1b2b97cdeec649f71d210ad56d Mon Sep 17 00:00:00 2001 From: konstin Date: Fri, 20 Oct 2023 14:29:25 +0200 Subject: [PATCH] Escape rebase hell --- Cargo.lock | 89 +++++-- crates/install-wheel-rs/src/lib.rs | 6 +- crates/install-wheel-rs/src/wheel.rs | 2 +- crates/puffin-build-cli/.gitignore | 2 + crates/puffin-build-cli/Cargo.toml | 37 +++ crates/puffin-build-cli/src/lib.rs | 3 + .../src/main.rs | 16 +- crates/puffin-build-cli/src/sdist.rs | 74 ++++++ .../test.sh | 0 crates/puffin-build/Cargo.toml | 6 - crates/puffin-build/src/lib.rs | 93 ++----- crates/puffin-cli/Cargo.toml | 1 + crates/puffin-cli/src/commands/pip_compile.rs | 25 +- crates/puffin-client/Cargo.toml | 5 +- crates/puffin-interpreter/src/lib.rs | 2 +- crates/puffin-resolver/Cargo.toml | 10 + crates/puffin-resolver/src/error.rs | 8 + crates/puffin-resolver/src/lib.rs | 2 + crates/puffin-resolver/src/resolution.rs | 4 +- crates/puffin-resolver/src/resolver.rs | 241 ++++++++++++++---- .../src/source_distribution.rs | 103 ++++++++ crates/puffin-resolver/tests/resolver.rs | 9 + .../pubgrub/src/internal/partial_solution.rs | 8 +- 23 files changed, 570 insertions(+), 176 deletions(-) create mode 100644 crates/puffin-build-cli/.gitignore create mode 100644 crates/puffin-build-cli/Cargo.toml create mode 100644 crates/puffin-build-cli/src/lib.rs rename crates/{puffin-build => puffin-build-cli}/src/main.rs (87%) create mode 100644 crates/puffin-build-cli/src/sdist.rs rename crates/{puffin-build => puffin-build-cli}/test.sh (100%) create mode 100644 crates/puffin-resolver/src/source_distribution.rs diff --git a/Cargo.lock b/Cargo.lock index ffd4b52749cbe..58fc04c50dad4 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -518,9 +518,9 @@ checksum = "e496a50fda8aacccc86d7529e2c1e0892dbd0f898a6b5645b5561b89c3210efa" [[package]] name = "cpufeatures" -version = "0.2.10" +version = "0.2.9" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "3fbc60abd742b35f2492f808e1abbb83d45f72db402e14c55057edc9c7b1e9e4" +checksum = "a17b76ff3a4162b0b27f354a0c87015ddad39d35f9c0c36607a3bdd175dde1f1" dependencies = [ "libc", ] @@ -1045,9 +1045,9 @@ dependencies = [ [[package]] name = "hashbrown" -version = "0.14.2" +version = "0.14.1" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "f93e7192158dbcda357bdec5fb5788eebf8bbac027f3f33e719d29135ae84156" +checksum = "7dfda62a12f55daeae5015f81b0baea145391cb4520f86c248fc615d72640d12" [[package]] name = "heck" @@ -1183,7 +1183,7 @@ dependencies = [ "httpdate", "itoa", "pin-project-lite", - "socket2 0.4.10", + "socket2 0.4.9", "tokio", "tower-service", "tracing", @@ -1270,7 +1270,7 @@ source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "8adf3ddd720272c6ea8bf59463c04e0f93d0bbf7c5439b691bca2987e0270897" dependencies = [ "equivalent", - "hashbrown 0.14.2", + "hashbrown 0.14.1", "serde", ] @@ -2025,12 +2025,6 @@ dependencies = [ "pep508_rs", "platform-host", "platform-tags", - "puffin-client", - "puffin-installer", - "puffin-interpreter", - "puffin-package", - "puffin-resolver", - "puffin-workspace", "pyproject-toml", "serde", "serde_json", @@ -2045,6 +2039,35 @@ dependencies = [ "zip", ] +[[package]] +name = "puffin-build-cli" +version = "0.0.1" +dependencies = [ + "anyhow", + "clap", + "colored", + "directories", + "fs-err", + "futures", + "gourgeist", + "itertools", + "pep508_rs", + "platform-host", + "platform-tags", + "puffin-build", + "puffin-client", + "puffin-installer", + "puffin-interpreter", + "puffin-package", + "puffin-resolver", + "puffin-workspace", + "tempfile", + "tokio", + "tracing", + "tracing-subscriber", + "which", +] + [[package]] name = "puffin-cli" version = "0.0.1" @@ -2072,6 +2095,7 @@ dependencies = [ "platform-tags", "predicates", "pubgrub", + "puffin-build-cli", "puffin-client", "puffin-installer", "puffin-interpreter", @@ -2103,6 +2127,7 @@ dependencies = [ "serde", "serde_json", "thiserror", + "tokio", "tracing", "url", ] @@ -2178,9 +2203,12 @@ dependencies = [ "clap", "colored", "distribution-filename", + "fs-err", "futures", "fxhash", + "gourgeist", "insta", + "install-wheel-rs", "itertools", "once_cell", "pep440_rs 0.3.12", @@ -2189,12 +2217,19 @@ dependencies = [ "platform-host", "platform-tags", "pubgrub", + "puffin-build", "puffin-client", + "puffin-interpreter", "puffin-package", + "tempfile", "thiserror", "tokio", + "tokio-util", "tracing", + "url", "waitmap", + "which", + "zip", ] [[package]] @@ -2581,9 +2616,9 @@ checksum = "08d43f7aa6b08d49f382cde6a7982047c3426db949b1424bc4b7ec9ae12c6ce2" [[package]] name = "rustix" -version = "0.38.20" +version = "0.38.19" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "67ce50cb2e16c2903e30d1cbccfd8387a74b9d4c938b6a4c5ec6cc7556f7a8a0" +checksum = "745ecfa778e66b2b63c88a61cb36e0eea109e803b0b86bf9879fbc77c70e86ed" dependencies = [ "bitflags 2.4.1", "errno", @@ -2800,9 +2835,9 @@ checksum = "b7c388c1b5e93756d0c740965c41e8822f866621d41acbdf6336a6a168f8840c" [[package]] name = "socket2" -version = "0.4.10" +version = "0.4.9" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "9f7916fc008ca5542385b89a3d3ce689953c143e9304a9bf8beec1de48994c0d" +checksum = "64a4a911eed85daf18834cfaa86a79b7d266ff93ff5ba14005426219480ed662" dependencies = [ "libc", "winapi", @@ -2810,9 +2845,9 @@ dependencies = [ [[package]] name = "socket2" -version = "0.5.5" +version = "0.5.4" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "7b5fac59a5cb5dd637972e5fca70daf0523c9067fcdc4842f053dae04a18f8e9" +checksum = "4031e820eb552adee9295814c0ced9e5cf38ddf1e8b7d566d6de8e2538ea989e" dependencies = [ "libc", "windows-sys 0.48.0", @@ -2938,9 +2973,9 @@ dependencies = [ [[package]] name = "target-lexicon" -version = "0.12.12" +version = "0.12.11" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "14c39fd04924ca3a864207c66fc2cd7d22d7c016007f9ce846cbb9326331930a" +checksum = "9d0e916b1148c8e263850e1ebcbd046f333e0683c724876bb0da63ea4373dc8a" [[package]] name = "task-local-extensions" @@ -3037,18 +3072,18 @@ dependencies = [ [[package]] name = "thiserror" -version = "1.0.50" +version = "1.0.49" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "f9a7210f5c9a7156bb50aa36aed4c95afb51df0df00713949448cf9e97d382d2" +checksum = "1177e8c6d7ede7afde3585fd2513e611227efd6481bd78d2e82ba1ce16557ed4" dependencies = [ "thiserror-impl", ] [[package]] name = "thiserror-impl" -version = "1.0.50" +version = "1.0.49" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "266b2e40bc00e5a6c09c3584011e08b06f123c00362c92b975ba9843aaaa14b8" +checksum = "10712f02019e9288794769fba95cd6847df9874d49d871d062172f9dd41bc4cc" dependencies = [ "proc-macro2", "quote", @@ -3130,7 +3165,7 @@ dependencies = [ "mio", "num_cpus", "pin-project-lite", - "socket2 0.5.5", + "socket2 0.5.4", "tokio-macros", "windows-sys 0.48.0", ] @@ -3249,9 +3284,9 @@ checksum = "b6bc1c9ce2b5135ac7f93c72918fc37feb872bdc6a5533a8b85eb4b86bfdae52" [[package]] name = "tracing" -version = "0.1.40" +version = "0.1.39" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "c3523ab5a71916ccf420eebdf5521fcef02141234bbc0b8a49f2fdc4544364ef" +checksum = "ee2ef2af84856a50c1d430afce2fdded0a4ec7eda868db86409b4543df0797f9" dependencies = [ "log", "pin-project-lite", diff --git a/crates/install-wheel-rs/src/lib.rs b/crates/install-wheel-rs/src/lib.rs index 832ff8a584587..99214c9f1669a 100644 --- a/crates/install-wheel-rs/src/lib.rs +++ b/crates/install-wheel-rs/src/lib.rs @@ -2,18 +2,18 @@ use std::io; +use platform_host::{Arch, Os}; use platform_info::PlatformInfoError; use thiserror::Error; use zip::result::ZipError; pub use install_location::{normalize_name, InstallLocation, LockedDir}; -use platform_host::{Arch, Os}; pub use record::RecordEntry; pub use script::Script; pub use uninstall::{uninstall_wheel, Uninstall}; pub use wheel::{ - get_script_launcher, install_wheel, parse_key_value_file, read_record_file, relative_to, - SHEBANG_PYTHON, + find_dist_info, get_script_launcher, install_wheel, parse_key_value_file, read_record_file, + relative_to, SHEBANG_PYTHON, }; mod install_location; diff --git a/crates/install-wheel-rs/src/wheel.rs b/crates/install-wheel-rs/src/wheel.rs index a10e193414c2b..1ee333142a78f 100644 --- a/crates/install-wheel-rs/src/wheel.rs +++ b/crates/install-wheel-rs/src/wheel.rs @@ -1027,7 +1027,7 @@ pub fn install_wheel( /// Either way, we just search the wheel for the name /// /// -fn find_dist_info( +pub fn find_dist_info( filename: &WheelFilename, archive: &mut ZipArchive, ) -> Result { diff --git a/crates/puffin-build-cli/.gitignore b/crates/puffin-build-cli/.gitignore new file mode 100644 index 0000000000000..4d668e3d91671 --- /dev/null +++ b/crates/puffin-build-cli/.gitignore @@ -0,0 +1,2 @@ +downloads +wheels diff --git a/crates/puffin-build-cli/Cargo.toml b/crates/puffin-build-cli/Cargo.toml new file mode 100644 index 0000000000000..c3de63fc3858e --- /dev/null +++ b/crates/puffin-build-cli/Cargo.toml @@ -0,0 +1,37 @@ +[package] +name = "puffin-build-cli" +version = "0.0.1" +description = "Build wheels from source distributions" +edition = { workspace = true } +rust-version = { workspace = true } +homepage = { workspace = true } +documentation = { workspace = true } +repository = { workspace = true } +authors = { workspace = true } +license = { workspace = true } + +[dependencies] +gourgeist = { path = "../gourgeist" } +pep508_rs = { path = "../pep508-rs" } +platform-host = { path = "../platform-host" } +platform-tags = { path = "../platform-tags" } +puffin-build = { path = "../puffin-build" } +puffin-client = { path = "../puffin-client" } +puffin-installer = { path = "../puffin-installer" } +puffin-interpreter = { path = "../puffin-interpreter" } +puffin-package = { path = "../puffin-package" } +puffin-resolver = { path = "../puffin-resolver" } +puffin-workspace = { path = "../puffin-workspace" } + +anyhow = { workspace = true } +clap = { workspace = true, features = ["derive"] } +directories = { workspace = true } +fs-err = { workspace = true } +futures = { workspace = true } +itertools = { workspace = true } +tempfile = { workspace = true } +tokio = { workspace = true } +tracing = { workspace = true } +tracing-subscriber = { workspace = true } +which = { workspace = true } +colored = "2.0.4" diff --git a/crates/puffin-build-cli/src/lib.rs b/crates/puffin-build-cli/src/lib.rs new file mode 100644 index 0000000000000..4e1c4c771b81e --- /dev/null +++ b/crates/puffin-build-cli/src/lib.rs @@ -0,0 +1,3 @@ +mod sdist; + +pub use sdist::resolve_and_install; diff --git a/crates/puffin-build/src/main.rs b/crates/puffin-build-cli/src/main.rs similarity index 87% rename from crates/puffin-build/src/main.rs rename to crates/puffin-build-cli/src/main.rs index 248de6a981a2a..38c6332138bb1 100644 --- a/crates/puffin-build/src/main.rs +++ b/crates/puffin-build-cli/src/main.rs @@ -1,5 +1,6 @@ #![allow(clippy::print_stdout, clippy::print_stderr)] +use crate::sdist::resolve_and_install; use anyhow::Context; use clap::Parser; use colored::Colorize; @@ -16,6 +17,8 @@ use tracing_subscriber::layer::SubscriberExt; use tracing_subscriber::util::SubscriberInitExt; use tracing_subscriber::{fmt, EnvFilter}; +pub mod sdist; + #[derive(Parser)] struct Args { /// Base python in a way that can be found with `which` @@ -49,11 +52,16 @@ async fn run() -> anyhow::Result<()> { })?; let interpreter_info = gourgeist::get_interpreter_info(&base_python)?; - let builder = - SourceDistributionBuilder::setup(&args.sdist, &base_python, &interpreter_info, cache) - .await?; + let builder = SourceDistributionBuilder::setup( + &args.sdist, + &base_python, + &interpreter_info, + cache, + resolve_and_install, + ) + .await?; let wheel = builder.build(&wheel_dir)?; - println!("Wheel built to {}", wheel.display()); + println!("Wheel built to {}", wheel_dir.join(wheel).display()); Ok(()) } diff --git a/crates/puffin-build-cli/src/sdist.rs b/crates/puffin-build-cli/src/sdist.rs new file mode 100644 index 0000000000000..b1817d5e421f7 --- /dev/null +++ b/crates/puffin-build-cli/src/sdist.rs @@ -0,0 +1,74 @@ +use anyhow::Context; +use futures::FutureExt; +use itertools::{Either, Itertools}; +use pep508_rs::Requirement; +use platform_host::Platform; +use platform_tags::Tags; +use puffin_client::PypiClientBuilder; +use puffin_installer::{CachedDistribution, Downloader, LocalIndex, RemoteDistribution, Unzipper}; +use puffin_interpreter::PythonExecutable; +use puffin_package::package_name::PackageName; +use puffin_resolver::WheelFinder; +use std::future::Future; +use std::path::Path; +use std::pin::Pin; +use tempfile::tempdir; +use tracing::{debug, instrument}; + +#[instrument(skip_all)] +pub async fn resolve_and_install_impl( + venv: &Path, + requirements: &[Requirement], + cache: Option<&Path>, +) -> anyhow::Result<()> { + debug!("Installing {} build requirements", requirements.len()); + + let local_index = if let Some(cache) = cache { + LocalIndex::try_from_directory(cache)? + } else { + LocalIndex::default() + }; + let (cached, uncached): (Vec, Vec) = + requirements.iter().partition_map(|requirement| { + let package = PackageName::normalize(&requirement.name); + if let Some(distribution) = local_index + .get(&package) + .filter(|dist| requirement.is_satisfied_by(dist.version())) + { + Either::Left(distribution.clone()) + } else { + Either::Right(requirement.clone()) + } + }); + + let client = PypiClientBuilder::default().cache(cache).build(); + + let platform = Platform::current()?; + let python = PythonExecutable::from_venv(platform, venv, cache)?; + let tags = Tags::from_env(python.platform(), python.simple_version())?; + let resolution = WheelFinder::new(&tags, &client).resolve(&uncached).await?; + let uncached = resolution + .into_files() + .map(RemoteDistribution::from_file) + .collect::>>()?; + let staging = tempdir()?; + let downloads = Downloader::new(&client, cache) + .download(&uncached, cache.unwrap_or(staging.path())) + .await?; + let unzips = Unzipper::default() + .download(downloads, cache.unwrap_or(staging.path())) + .await + .context("Failed to download and unpack wheels")?; + let wheels = unzips.into_iter().chain(cached).collect::>(); + puffin_installer::Installer::new(&python).install(&wheels)?; + + Ok(()) +} + +pub fn resolve_and_install<'a>( + venv: &'a Path, + requirements: &'a [Requirement], + cache: Option<&'a Path>, +) -> Pin> + Send + 'a>> { + resolve_and_install_impl(venv, requirements, cache).boxed() +} diff --git a/crates/puffin-build/test.sh b/crates/puffin-build-cli/test.sh similarity index 100% rename from crates/puffin-build/test.sh rename to crates/puffin-build-cli/test.sh diff --git a/crates/puffin-build/Cargo.toml b/crates/puffin-build/Cargo.toml index 2648d9651057d..e109f8e22ec8e 100644 --- a/crates/puffin-build/Cargo.toml +++ b/crates/puffin-build/Cargo.toml @@ -15,12 +15,6 @@ gourgeist = { path = "../gourgeist" } pep508_rs = { path = "../pep508-rs" } platform-host = { path = "../platform-host" } platform-tags = { path = "../platform-tags" } -puffin-client = { path = "../puffin-client" } -puffin-installer = { path = "../puffin-installer" } -puffin-interpreter = { path = "../puffin-interpreter" } -puffin-package = { path = "../puffin-package" } -puffin-resolver = { path = "../puffin-resolver" } -puffin-workspace = { path = "../puffin-workspace" } anyhow = { workspace = true } clap = { workspace = true, features = ["derive"] } diff --git a/crates/puffin-build/src/lib.rs b/crates/puffin-build/src/lib.rs index e46d1a30f535c..82862f4222acd 100644 --- a/crates/puffin-build/src/lib.rs +++ b/crates/puffin-build/src/lib.rs @@ -2,26 +2,19 @@ //! //! -use anyhow::Context; use flate2::read::GzDecoder; use fs_err as fs; use fs_err::{DirEntry, File}; use gourgeist::{InterpreterInfo, Venv}; use indoc::formatdoc; -use itertools::{Either, Itertools}; use pep508_rs::Requirement; -use platform_host::Platform; -use platform_tags::Tags; -use puffin_client::PypiClientBuilder; -use puffin_installer::{CachedDistribution, Downloader, LocalIndex, RemoteDistribution, Unzipper}; -use puffin_interpreter::PythonExecutable; -use puffin_package::package_name::PackageName; -use puffin_resolver::WheelFinder; use pyproject_toml::PyProjectToml; +use std::future::Future; use std::io; use std::io::BufRead; use std::ops::Deref; use std::path::{Path, PathBuf}; +use std::pin::Pin; use std::process::{Command, Output}; use std::str::FromStr; use tar::Archive; @@ -108,6 +101,13 @@ pub struct SourceDistributionBuilder { metadata_directory: Option, } +pub type ResolveAndInstall = + for<'a> fn( + &'a Path, + &'a [Requirement], + Option<&'a Path>, + ) -> Pin> + Send + 'a)>>; + impl SourceDistributionBuilder { /// Extract the source distribution and create a venv with the required packages pub async fn setup( @@ -115,6 +115,7 @@ impl SourceDistributionBuilder { base_python: &Path, interpreter_info: &InterpreterInfo, cache: Option<&Path>, + resolve_and_install: ResolveAndInstall, ) -> Result { let temp_dir = tempdir()?; @@ -152,6 +153,7 @@ impl SourceDistributionBuilder { interpreter_info, pep517_backend, cache, + resolve_and_install, ) .await? } else { @@ -255,7 +257,7 @@ impl SourceDistributionBuilder { /// /// #[instrument(skip(self))] - pub fn build(&self, wheel_dir: &Path) -> Result { + pub fn build(&self, wheel_dir: &Path) -> Result { // The build scripts run with the extracted root as cwd, so they need the absolute path let wheel_dir = fs::canonicalize(wheel_dir)?; @@ -287,9 +289,9 @@ impl SourceDistributionBuilder { }; // TODO(konstin): Faster copy such as reflink? Or maybe don't really let the user pick the target dir let wheel = wheel_dir.join(dist_wheel.file_name()); - fs::copy(dist_wheel.path(), &wheel)?; + fs::copy(dist_wheel.path(), wheel)?; // TODO(konstin): Check wheel filename - Ok(wheel) + Ok(dist_wheel.file_name().to_string_lossy().to_string()) } } @@ -297,7 +299,7 @@ impl SourceDistributionBuilder { &self, wheel_dir: &Path, pep517_backend: &Pep517Backend, - ) -> Result { + ) -> Result { let metadata_directory = self .metadata_directory .as_deref() @@ -323,18 +325,19 @@ impl SourceDistributionBuilder { )); } let stdout = String::from_utf8_lossy(&output.stdout); - let wheel = stdout + let distribution_filename = stdout .lines() - .last() - .map(|distribution_filename| wheel_dir.join(distribution_filename)); - let Some(wheel) = wheel.filter(|wheel| wheel.is_file()) else { + .last(); + let Some(distribution_filename) = + distribution_filename.filter(|wheel| wheel_dir.join(wheel).is_file()) + else { return Err(Error::from_command_output( "Build backend did not return the wheel filename through `build_wheel()`" .to_string(), &output, )); }; - Ok(wheel) + Ok(distribution_filename.to_string()) } } @@ -352,6 +355,7 @@ async fn create_pep517_build_environment( data: &InterpreterInfo, pep517_backend: &Pep517Backend, cache: Option<&Path>, + resolve_and_install: ResolveAndInstall, ) -> Result { let venv = gourgeist::create_venv(root.join(".venv"), base_python, data, true)?; resolve_and_install( @@ -420,63 +424,12 @@ async fn create_pep517_build_environment( .cloned() .chain(extra_requires) .collect(); - resolve_and_install(&*venv, &requirements, cache) + resolve_and_install(venv.as_std_path(), &requirements, cache) .await .map_err(Error::RequirementsInstall)?; } Ok(venv) } - -#[instrument(skip_all)] -async fn resolve_and_install( - venv: impl AsRef, - requirements: &[Requirement], - cache: Option<&Path>, -) -> anyhow::Result<()> { - debug!("Installing {} build requirements", requirements.len()); - - let local_index = if let Some(cache) = cache { - LocalIndex::try_from_directory(cache)? - } else { - LocalIndex::default() - }; - let (cached, uncached): (Vec, Vec) = - requirements.iter().partition_map(|requirement| { - let package = PackageName::normalize(&requirement.name); - if let Some(distribution) = local_index - .get(&package) - .filter(|dist| requirement.is_satisfied_by(dist.version())) - { - Either::Left(distribution.clone()) - } else { - Either::Right(requirement.clone()) - } - }); - - let client = PypiClientBuilder::default().cache(cache).build(); - - let platform = Platform::current()?; - let python = PythonExecutable::from_venv(platform, venv.as_ref(), cache)?; - let tags = Tags::from_env(python.platform(), python.simple_version())?; - let resolution = WheelFinder::new(&tags, &client).resolve(&uncached).await?; - let uncached = resolution - .into_files() - .map(RemoteDistribution::from_file) - .collect::>>()?; - let staging = tempdir()?; - let downloads = Downloader::new(&client, cache) - .download(&uncached, cache.unwrap_or(staging.path())) - .await?; - let unzips = Unzipper::default() - .download(downloads, cache.unwrap_or(staging.path())) - .await - .context("Failed to download and unpack wheels")?; - let wheels = unzips.into_iter().chain(cached).collect::>(); - puffin_installer::Installer::new(&python).install(&wheels)?; - - Ok(()) -} - /// Returns the directory with the `pyproject.toml`/`setup.py` #[instrument(skip_all, fields(path))] fn extract_archive(sdist: &Path, extracted: &PathBuf) -> Result { diff --git a/crates/puffin-cli/Cargo.toml b/crates/puffin-cli/Cargo.toml index 6a960907856a9..544016d4d41be 100644 --- a/crates/puffin-cli/Cargo.toml +++ b/crates/puffin-cli/Cargo.toml @@ -15,6 +15,7 @@ pep508_rs = { path = "../pep508-rs" } platform-host = { path = "../platform-host" } platform-tags = { path = "../platform-tags" } pubgrub = { path = "../../vendor/pubgrub" } +puffin-build-cli = { path = "../puffin-build-cli" } puffin-client = { path = "../puffin-client" } puffin-installer = { path = "../puffin-installer" } puffin-interpreter = { path = "../puffin-interpreter" } diff --git a/crates/puffin-cli/src/commands/pip_compile.rs b/crates/puffin-cli/src/commands/pip_compile.rs index 1808c8d03c384..10f8a0d894eb6 100644 --- a/crates/puffin-cli/src/commands/pip_compile.rs +++ b/crates/puffin-cli/src/commands/pip_compile.rs @@ -7,21 +7,23 @@ use anyhow::Result; use colored::Colorize; use fs_err::File; use itertools::Itertools; -use pubgrub::report::Reporter; -use tracing::debug; - use pep508_rs::Requirement; use platform_host::Platform; use platform_tags::Tags; +use pubgrub::report::Reporter; +use puffin_build_cli::resolve_and_install; use puffin_client::PypiClientBuilder; use puffin_interpreter::PythonExecutable; use puffin_resolver::ResolutionMode; +use puffin_resolver::{BuiltSourceDistributionCache, SourceDistributionBuildContext}; +use tracing::debug; use crate::commands::{elapsed, ExitStatus}; use crate::printer::Printer; use crate::requirements::RequirementsSource; const VERSION: &str = env!("CARGO_PKG_VERSION"); +const BUILT_WHEELS_CACHE: &str = "built-wheels-v0"; /// Resolve a set of requirements into a set of pinned versions. pub(crate) async fn pip_compile( @@ -63,9 +65,22 @@ pub(crate) async fn pip_compile( // Instantiate a client. let client = PypiClientBuilder::default().cache(cache).build(); + let build_context = SourceDistributionBuildContext { + resolve_and_install, + python: python.clone(), + cache: cache.map(|cache| BuiltSourceDistributionCache::new(cache.join(BUILT_WHEELS_CACHE))), + }; + // Resolve the dependencies. - let resolver = - puffin_resolver::Resolver::new(requirements, constraints, mode, markers, &tags, &client); + let resolver = puffin_resolver::Resolver::new( + requirements, + constraints, + mode, + markers, + &tags, + &client, + Some(build_context), + ); let resolution = match resolver.resolve().await { Err(puffin_resolver::ResolveError::PubGrub(pubgrub::error::PubGrubError::NoSolution( mut derivation_tree, diff --git a/crates/puffin-client/Cargo.toml b/crates/puffin-client/Cargo.toml index b7028cfafa8f8..5cdc3e6e147d4 100644 --- a/crates/puffin-client/Cargo.toml +++ b/crates/puffin-client/Cargo.toml @@ -6,6 +6,7 @@ edition = "2021" [dependencies] puffin-package = { path = "../puffin-package" } +futures = { workspace = true } http-cache-reqwest = { workspace = true } reqwest = { workspace = true } reqwest-middleware = { workspace = true } @@ -13,6 +14,6 @@ reqwest-retry = { workspace = true } serde = { workspace = true } serde_json = { workspace = true } thiserror = { workspace = true } -url = { workspace = true } +tokio = { workspace = true } tracing = { workspace = true } -futures = { workspace = true } +url = { workspace = true } diff --git a/crates/puffin-interpreter/src/lib.rs b/crates/puffin-interpreter/src/lib.rs index 19fa890be3383..786b269f6feb4 100644 --- a/crates/puffin-interpreter/src/lib.rs +++ b/crates/puffin-interpreter/src/lib.rs @@ -13,7 +13,7 @@ mod python_platform; mod virtual_env; /// A Python executable and its associated platform markers. -#[derive(Debug)] +#[derive(Debug, Clone)] pub struct PythonExecutable { platform: PythonPlatform, venv: PathBuf, diff --git a/crates/puffin-resolver/Cargo.toml b/crates/puffin-resolver/Cargo.toml index c9bbc936d9ed3..800025a77ca69 100644 --- a/crates/puffin-resolver/Cargo.toml +++ b/crates/puffin-resolver/Cargo.toml @@ -10,12 +10,16 @@ authors = { workspace = true } license = { workspace = true } [dependencies] +gourgeist = { path = "../gourgeist" } +install-wheel-rs = { path = "../install-wheel-rs" } pep440_rs = { path = "../pep440-rs" } pep508_rs = { path = "../pep508-rs" } platform-host = { path = "../platform-host" } platform-tags = { path = "../platform-tags" } pubgrub = { path = "../../vendor/pubgrub" } +puffin-build = { path = "../puffin-build" } puffin-client = { path = "../puffin-client" } +puffin-interpreter = { path = "../puffin-interpreter" } puffin-package = { path = "../puffin-package" } distribution-filename = { path = "../distribution-filename" } @@ -23,15 +27,21 @@ anyhow = { workspace = true } bitflags = { workspace = true } clap = { workspace = true, features = ["derive"], optional = true } colored = { workspace = true } +fs-err = { workspace = true } futures = { workspace = true } fxhash = { workspace = true } itertools = { workspace = true } once_cell = { workspace = true } petgraph = { workspace = true } +tempfile = { workspace = true } thiserror = { workspace = true } tokio = { workspace = true } +tokio-util = { workspace = true, features = ["compat"] } tracing = { workspace = true } +url = { workspace = true } waitmap = { workspace = true } +which = { workspace = true } +zip = { workspace = true } [dev-dependencies] once_cell = { version = "1.18.0" } diff --git a/crates/puffin-resolver/src/error.rs b/crates/puffin-resolver/src/error.rs index 3d0f546fd859f..e4a27ac6fbbcb 100644 --- a/crates/puffin-resolver/src/error.rs +++ b/crates/puffin-resolver/src/error.rs @@ -25,6 +25,14 @@ pub enum ResolveError { #[error(transparent)] PubGrub(#[from] pubgrub::error::PubGrubError>), + + #[error("Failed to build source distribution {filename}")] + SourceDistribution { + filename: String, + // TODO: Gives this a proper error type + #[source] + err: anyhow::Error, + }, } impl From> for ResolveError { diff --git a/crates/puffin-resolver/src/lib.rs b/crates/puffin-resolver/src/lib.rs index df1c19a465ab6..ebec7e640dfc6 100644 --- a/crates/puffin-resolver/src/lib.rs +++ b/crates/puffin-resolver/src/lib.rs @@ -2,6 +2,7 @@ pub use error::ResolveError; pub use mode::ResolutionMode; pub use resolution::PinnedPackage; pub use resolver::Resolver; +pub use source_distribution::{BuiltSourceDistributionCache, SourceDistributionBuildContext}; pub use wheel_finder::{Reporter, WheelFinder}; mod error; @@ -9,4 +10,5 @@ mod mode; mod pubgrub; mod resolution; mod resolver; +mod source_distribution; mod wheel_finder; diff --git a/crates/puffin-resolver/src/resolution.rs b/crates/puffin-resolver/src/resolution.rs index 1fb44745a76bd..5413371555ce0 100644 --- a/crates/puffin-resolver/src/resolution.rs +++ b/crates/puffin-resolver/src/resolution.rs @@ -1,8 +1,8 @@ -use std::hash::BuildHasherDefault; - use colored::Colorize; use fxhash::FxHashMap; use petgraph::visit::EdgeRef; +use std::hash::BuildHasherDefault; + use pubgrub::range::Range; use pubgrub::solver::{Kind, State}; use pubgrub::type_aliases::SelectedDependencies; diff --git a/crates/puffin-resolver/src/resolver.rs b/crates/puffin-resolver/src/resolver.rs index 0cb89c0796fc6..7ce4b46674b90 100644 --- a/crates/puffin-resolver/src/resolver.rs +++ b/crates/puffin-resolver/src/resolver.rs @@ -2,12 +2,14 @@ use std::borrow::Borrow; use std::collections::hash_map::Entry; +use std::future::Future; +use std::path::PathBuf; +use std::pin::Pin; use std::str::FromStr; use std::sync::Arc; -use anyhow::Result; +use anyhow::{format_err, Result}; use futures::channel::mpsc::UnboundedReceiver; -use futures::future::Either; use futures::{pin_mut, FutureExt, StreamExt, TryFutureExt}; use fxhash::{FxHashMap, FxHashSet}; use pubgrub::error::PubGrubError; @@ -18,7 +20,7 @@ use tokio::select; use tracing::{debug, trace}; use waitmap::WaitMap; -use distribution_filename::WheelFilename; +use distribution_filename::{SourceDistributionFilename, WheelFilename}; use pep508_rs::{MarkerEnvironment, Requirement}; use platform_tags::Tags; use puffin_client::{File, PypiClient, SimpleJson}; @@ -32,6 +34,8 @@ use crate::pubgrub::package::PubGrubPackage; use crate::pubgrub::version::{PubGrubVersion, MIN_VERSION}; use crate::pubgrub::{iter_requirements, version_range}; use crate::resolution::Graph; +use crate::source_distribution::{download_and_build_sdist, read_dist_info}; +use crate::{BuiltSourceDistributionCache, SourceDistributionBuildContext}; pub struct Resolver<'a> { requirements: Vec, @@ -41,6 +45,8 @@ pub struct Resolver<'a> { client: &'a PypiClient, selector: CandidateSelector, cache: Arc, + /// sdist builder + source_distribution_build_context: Option, } impl<'a> Resolver<'a> { @@ -52,6 +58,7 @@ impl<'a> Resolver<'a> { markers: &'a MarkerEnvironment, tags: &'a Tags, client: &'a PypiClient, + resolve_and_install: Option, ) -> Self { Self { selector: CandidateSelector::from_mode(mode, &requirements), @@ -61,6 +68,7 @@ impl<'a> Resolver<'a> { markers, tags, client, + source_distribution_build_context: resolve_and_install, } } @@ -266,27 +274,46 @@ impl<'a> Resolver<'a> { }; let simple_json = entry.value(); - // Select the latest compatible version. - let Some(file) = self + // Try to find a wheel. If there isn't any, to a find a source distribution. If there + // isn't any either, short circuit and fail the resolution. + // TODO: Group files by version, then check for each version first for compatible wheels + // and then for a compatible sdist. This is required to still select the most recent + // version. + let Some((file, request)) = self .selector .iter_candidates(package_name, &simple_json.files) - .find(|file| { - let Ok(name) = WheelFilename::from_str(file.filename.as_str()) else { - return false; - }; - - if !name.is_compatible(self.tags) { - return false; + .find_map(|file| { + let wheel_filename = WheelFilename::from_str(file.filename.as_str()).ok()?; + if !wheel_filename.is_compatible(self.tags) { + return None; } - if !range + if range .borrow() - .contains(&PubGrubVersion::from(name.version.clone())) + .contains(&PubGrubVersion::from(wheel_filename.version.clone())) { - return false; - }; - - true + Some((file, Request::WheelVersion(file.clone()))) + } else { + None + } + }) + .or_else(|| { + self.selector + .iter_candidates(package_name, &simple_json.files) + .find_map(|file| { + let sdist_filename = + SourceDistributionFilename::parse(&file.filename, package_name) + .ok()?; + + if range + .borrow() + .contains(&PubGrubVersion::from(sdist_filename.version.clone())) + { + Some((file, Request::SdistVersion((file.clone(), sdist_filename)))) + } else { + None + } + }) }) else { // Short circuit: we couldn't find _any_ compatible versions for a package. @@ -296,7 +323,7 @@ impl<'a> Resolver<'a> { // Emit a request to fetch the metadata for this version. if in_flight.insert(file.hashes.sha256.clone()) { - request_sink.unbounded_send(Request::Version(file.clone()))?; + request_sink.unbounded_send(request)?; } selection = index; @@ -321,7 +348,7 @@ impl<'a> Resolver<'a> { ); // Find a compatible version. - let Some(wheel) = self + let mut wheel = self .selector .iter_candidates(package_name, &simple_json.files) .find_map(|file| { @@ -345,29 +372,69 @@ impl<'a> Resolver<'a> { name: package_name.clone(), version: name.version.clone(), }) - }) - else { - // Short circuit: we couldn't find _any_ compatible versions for a package. - return Ok((package, None)); - }; + }); - debug!( - "Selecting: {}=={} ({})", - wheel.name, wheel.version, wheel.file.filename - ); + if wheel.is_none() { + if let Some((sdist_file, parsed_filename)) = simple_json + .files + .iter() + .rev() + .filter_map(|file| { + let Ok(parsed_filename) = + SourceDistributionFilename::parse(&file.filename, package_name) + else { + return None; + }; + + if !range + .borrow() + .contains(&PubGrubVersion::from(parsed_filename.version.clone())) + { + return None; + }; + + Some((file, parsed_filename)) + }) + .max_by(|left, right| left.1.version.cmp(&right.1.version)) + { + // Emit a request to fetch the metadata for this version. + if in_flight.insert(sdist_file.hashes.sha256.clone()) { + request_sink.unbounded_send(Request::SdistVersion(( + sdist_file.clone(), + parsed_filename.clone(), + )))?; + } + // TODO(konstin): That's not a wheel + wheel = Some(Wheel { + file: sdist_file.clone(), + name: package_name.clone(), + version: parsed_filename.version.clone(), + }); + } + } + + if let Some(wheel) = wheel { + debug!( + "Selecting: {}=={} ({})", + wheel.name, wheel.version, wheel.file.filename + ); - // We want to return a package pinned to a specific version; but we _also_ want to - // store the exact file that we selected to satisfy that version. - pins.entry(wheel.name) - .or_default() - .insert(wheel.version.clone(), wheel.file.clone()); + // We want to return a package pinned to a specific version; but we _also_ want to + // store the exact file that we selected to satisfy that version. + pins.entry(wheel.name) + .or_default() + .insert(wheel.version.clone(), wheel.file.clone()); - // Emit a request to fetch the metadata for this version. - if in_flight.insert(wheel.file.hashes.sha256.clone()) { - request_sink.unbounded_send(Request::Version(wheel.file.clone()))?; - } + // Emit a request to fetch the metadata for this version. + if in_flight.insert(wheel.file.hashes.sha256.clone()) { + request_sink.unbounded_send(Request::WheelVersion(wheel.file.clone()))?; + } - Ok((package, Some(PubGrubVersion::from(wheel.version)))) + Ok((package, Some(PubGrubVersion::from(wheel.version)))) + } else { + // Short circuit: we couldn't find _any_ compatible versions for a package. + Ok((package, None)) + } } }; } @@ -485,20 +552,7 @@ impl<'a> Resolver<'a> { /// Fetch the metadata for a stream of packages and versions. async fn fetch(&self, request_stream: UnboundedReceiver) -> Result<(), ResolveError> { let mut response_stream = request_stream - .map({ - |request: Request| match request { - Request::Package(package_name) => Either::Left( - self.client - .simple(package_name.clone()) - .map_ok(move |metadata| Response::Package(package_name, metadata)), - ), - Request::Version(file) => Either::Right( - self.client - .file(file.clone()) - .map_ok(move |metadata| Response::Version(file, metadata)), - ), - } - }) + .map(|request| self.process_request(request)) .buffer_unordered(32) .ready_chunks(32); @@ -515,12 +569,87 @@ impl<'a> Resolver<'a> { .versions .insert(file.hashes.sha256.clone(), metadata); } + Response::Sdist(file, metadata) => { + trace!("Received sdist build metadata for {}", file.filename); + self.cache + .versions + .insert(file.hashes.sha256.clone(), metadata); + } } } } Ok::<(), ResolveError>(()) } + + fn process_request( + &'a self, + request: Request, + ) -> Pin> + 'a>> { + match request { + Request::Package(package_name) => Box::pin( + self.client + .simple(package_name.clone()) + .map_ok(move |metadata| Response::Package(package_name, metadata)) + .map_err(ResolveError::Client), + ), + Request::WheelVersion(file) => Box::pin( + self.client + .file(file.clone()) + .map_ok(move |metadata| Response::Version(file, metadata)) + .map_err(ResolveError::Client), + ), + Request::SdistVersion((file, filename)) => Box::pin(async move { + if let Some(build_context) = &self.source_distribution_build_context { + let cached_wheel = + self.find_cached_built_wheel(build_context.cache.as_ref(), &filename); + let metadata21 = if let Some(cached_wheel) = cached_wheel { + read_dist_info(cached_wheel).await + } else { + download_and_build_sdist(&file, self.client, build_context, &filename).await + } + .map_err(|err| ResolveError::SourceDistribution { + filename: file.filename.clone(), + err, + })?; + + Ok(Response::Sdist(file, metadata21)) + } else { + Err(ResolveError::SourceDistribution { + filename: file.filename, + err: format_err!("No build context registered"), + }) + } + }), + } + } + + fn find_cached_built_wheel( + &self, + cache: Option<&BuiltSourceDistributionCache>, + filename: &SourceDistributionFilename, + ) -> Option { + let Some(cache) = cache else { + return None; + }; + let Ok(read_dir) = fs_err::read_dir(cache.version(&filename.name, &filename.version)) + else { + return None; + }; + + for entry in read_dir { + let Ok(entry) = entry else { continue }; + let Ok(wheel) = WheelFilename::from_str(entry.file_name().to_string_lossy().as_ref()) + else { + continue; + }; + + if wheel.is_compatible(self.tags) { + return Some(entry.path().clone()); + } + } + None + } } #[derive(Debug, Clone)] @@ -537,8 +666,10 @@ struct Wheel { enum Request { /// A request to fetch the metadata for a package. Package(PackageName), + /// A request to fetch and build the source distribution for a specific package version + SdistVersion((File, SourceDistributionFilename)), /// A request to fetch the metadata for a specific version of a package. - Version(File), + WheelVersion(File), } #[derive(Debug)] @@ -547,6 +678,8 @@ enum Response { Package(PackageName, SimpleJson), /// The returned metadata for a specific version of a package. Version(File, Metadata21), + /// The returned metadata for an sdist build. + Sdist(File, Metadata21), } struct SolverCache { diff --git a/crates/puffin-resolver/src/source_distribution.rs b/crates/puffin-resolver/src/source_distribution.rs new file mode 100644 index 0000000000000..884fd1eb74f2a --- /dev/null +++ b/crates/puffin-resolver/src/source_distribution.rs @@ -0,0 +1,103 @@ +use distribution_filename::{SourceDistributionFilename, WheelFilename}; +use fs_err::tokio as fs; +use pep440_rs::Version; +use puffin_build::ResolveAndInstall; +use puffin_client::{File, PypiClient}; +use puffin_interpreter::PythonExecutable; +use puffin_package::metadata::Metadata21; +use puffin_package::package_name::PackageName; +use std::path::PathBuf; +use std::str::FromStr; +use tempfile::tempdir; +use tokio::task::spawn_blocking; +use tokio_util::compat::FuturesAsyncReadCompatExt; +use tracing::debug; +use url::Url; +use zip::ZipArchive; + +/// TODO: Find a better home for me? +/// +/// Stores wheels built from source distributions. We need to keep those separate from the regular +/// wheel cache since a wheel with the same name may be uploaded after we made our build and in that +/// case the hashes would clash. +pub struct BuiltSourceDistributionCache(PathBuf); + +impl BuiltSourceDistributionCache { + pub fn new(path: impl Into) -> Self { + Self(path.into()) + } + + pub fn version(&self, name: &PackageName, version: &Version) -> PathBuf { + self.0.join(name.to_string()).join(version.to_string()) + } +} + +/// Pass the information required to build source distributions around +pub struct SourceDistributionBuildContext { + /// Avoid circular crate dependencies by using a callback + pub resolve_and_install: ResolveAndInstall, + pub python: PythonExecutable, + /// We store + pub cache: Option, +} + +pub(crate) async fn download_and_build_sdist( + file: &File, + client: &PypiClient, + build_context: &SourceDistributionBuildContext, + sdist_filename: &SourceDistributionFilename, +) -> anyhow::Result { + debug!("Building {}", &file.filename); + let url = Url::parse(&file.url)?; + let reader = client.stream_external(&url).await?; + let mut reader = tokio::io::BufReader::new(reader.compat()); + let temp_dir = tempdir()?; + + let sdist_dir = temp_dir.path().join("sdist"); + tokio::fs::create_dir(&sdist_dir).await?; + let sdist_file = sdist_dir.join(&file.filename); + let mut writer = tokio::fs::File::create(&sdist_file).await?; + tokio::io::copy(&mut reader, &mut writer).await?; + + // TODO: Merge this with PythonExecutable + let interpreter_info = gourgeist::get_interpreter_info(build_context.python.executable())?; + + let wheel_dir = if let Some(cache) = &build_context.cache { + cache.version(&sdist_filename.name, &sdist_filename.version) + } else { + temp_dir.path().join("wheels") + }; + + fs::create_dir_all(&wheel_dir).await?; + + let builder = puffin_build::SourceDistributionBuilder::setup( + &sdist_file, + build_context.python.executable(), + &interpreter_info, + None, + build_context.resolve_and_install, + ) + .await?; + let disk_filename = builder.build(&wheel_dir)?; + let metadata21 = read_dist_info(wheel_dir.join(disk_filename)).await?; + + debug!("Finished Building {}", &file.filename); + Ok(metadata21) +} + +pub(crate) async fn read_dist_info(wheel: PathBuf) -> anyhow::Result { + let dist_info = spawn_blocking(move || -> anyhow::Result { + let mut archive = ZipArchive::new(std::fs::File::open(&wheel)?)?; + let dist_info_prefix = install_wheel_rs::find_dist_info( + &WheelFilename::from_str(wheel.file_name().unwrap().to_string_lossy().as_ref())?, + &mut archive, + )?; + let dist_info = std::io::read_to_string( + archive.by_name(&format!("{dist_info_prefix}.dist-info/METADATA"))?, + )?; + Ok(dist_info) + }) + .await + .unwrap()?; + Ok(Metadata21::parse(dist_info.as_bytes())?) +} diff --git a/crates/puffin-resolver/tests/resolver.rs b/crates/puffin-resolver/tests/resolver.rs index fb7c89a94ebc6..74108be1d2581 100644 --- a/crates/puffin-resolver/tests/resolver.rs +++ b/crates/puffin-resolver/tests/resolver.rs @@ -29,6 +29,7 @@ async fn pylint() -> Result<()> { &MARKERS_311, &TAGS_311, &client, + None, ); let resolution = resolver.resolve().await?; @@ -52,6 +53,7 @@ async fn black() -> Result<()> { &MARKERS_311, &TAGS_311, &client, + None, ); let resolution = resolver.resolve().await?; @@ -75,6 +77,7 @@ async fn black_colorama() -> Result<()> { &MARKERS_311, &TAGS_311, &client, + None, ); let resolution = resolver.resolve().await?; @@ -98,6 +101,7 @@ async fn black_python_310() -> Result<()> { &MARKERS_310, &TAGS_310, &client, + None, ); let resolution = resolver.resolve().await?; @@ -123,6 +127,7 @@ async fn black_mypy_extensions() -> Result<()> { &MARKERS_311, &TAGS_311, &client, + None, ); let resolution = resolver.resolve().await?; @@ -148,6 +153,7 @@ async fn black_mypy_extensions_extra() -> Result<()> { &MARKERS_311, &TAGS_311, &client, + None, ); let resolution = resolver.resolve().await?; @@ -173,6 +179,7 @@ async fn black_flake8() -> Result<()> { &MARKERS_311, &TAGS_311, &client, + None, ); let resolution = resolver.resolve().await?; @@ -196,6 +203,7 @@ async fn black_lowest() -> Result<()> { &MARKERS_311, &TAGS_311, &client, + None, ); let resolution = resolver.resolve().await?; @@ -219,6 +227,7 @@ async fn black_lowest_direct() -> Result<()> { &MARKERS_311, &TAGS_311, &client, + None, ); let resolution = resolver.resolve().await?; diff --git a/vendor/pubgrub/src/internal/partial_solution.rs b/vendor/pubgrub/src/internal/partial_solution.rs index 1b683b9d84d8e..6c445ed84279b 100644 --- a/vendor/pubgrub/src/internal/partial_solution.rs +++ b/vendor/pubgrub/src/internal/partial_solution.rs @@ -141,7 +141,13 @@ impl PartialSolution { AssignmentsIntersection::Decision(_) => panic!("Already existing decision"), // Cannot be called if the versions is not contained in the terms intersection. AssignmentsIntersection::Derivations(term) => { - debug_assert!(term.contains(&version)) + debug_assert!( + term.contains(&version), + "{} {:?} {}", + package, + version, + term, + ) } }, }