From 483c5d1a241ceaec385dcb306c71e28014afee67 Mon Sep 17 00:00:00 2001 From: Rebecca Turner Date: Fri, 6 Dec 2024 15:56:16 -0800 Subject: [PATCH 1/3] Do not use shallow clones for short revisions When the `tag` of a `source-repository-stanza` is not a full hash, we cannot do a shallow clone and fetch it separately. Therefore, in those cases, we fall back to doing a full clone. Fixes #10605 Includes a regression test by @9999years. Co-authored-by: Rebecca Turner --- cabal-install/src/Distribution/Client/VCS.hs | 32 +++++++++++++++++-- .../SourceRepositoryPackageShallow/cabal.out | 10 ++++++ .../cabal.project | 8 +++++ .../cabal.test.hs | 4 +++ .../puppy.cabal | 9 ++++++ .../src/Puppy.hs | 1 + doc/how-to-source-packages.rst | 3 ++ 7 files changed, 65 insertions(+), 2 deletions(-) create mode 100644 cabal-testsuite/PackageTests/SourceRepositoryPackageShallow/cabal.out create mode 100644 cabal-testsuite/PackageTests/SourceRepositoryPackageShallow/cabal.project create mode 100644 cabal-testsuite/PackageTests/SourceRepositoryPackageShallow/cabal.test.hs create mode 100644 cabal-testsuite/PackageTests/SourceRepositoryPackageShallow/puppy.cabal create mode 100644 cabal-testsuite/PackageTests/SourceRepositoryPackageShallow/src/Puppy.hs diff --git a/cabal-install/src/Distribution/Client/VCS.hs b/cabal-install/src/Distribution/Client/VCS.hs index 98b8251d9c1..afd6dfea43c 100644 --- a/cabal-install/src/Distribution/Client/VCS.hs +++ b/cabal-install/src/Distribution/Client/VCS.hs @@ -549,7 +549,10 @@ vcsGit = -- If we want a particular branch or tag, fetch it. ref <- case srpBranch `mplus` srpTag of Nothing -> pure "HEAD" - Just ref -> do + -- `doShallow` controls whether we use a shallow clone. + -- If the clone is shallow, make sure to fetch specified revisions + -- before using them. + Just ref | doShallow -> do -- /!\ /!\ /!\ /!\ /!\ /!\ /!\ /!\ /!\ /!\ /!\ /!\ /!\ /!\ /!\ /!\ /!\ -- /!\ MULTIPLE HOURS HAVE BEEN LOST HERE!! /!\ -- /!\ /!\ /!\ /!\ /!\ /!\ /!\ /!\ /!\ /!\ /!\ /!\ /!\ /!\ /!\ /!\ /!\ @@ -582,6 +585,9 @@ vcsGit = -- for now. Option 1 is possible but seems to have little benefit. git localDir ("fetch" : verboseArg ++ ["origin", ref]) pure "FETCH_HEAD" + Just ref + | otherwise -> + pure ref -- Then, reset to the appropriate ref. git localDir $ @@ -608,8 +614,30 @@ vcsGit = { progInvokeCwd = Just cwd } + -- Beware: if the user supplied revision for the source repository + -- package is /not/ a full hash, then we cannot fetch it, which means + -- we cannot do a shallow clone (--depth=1). + -- See #10605. + doShallow + | Nothing <- srpTag = + -- No tag, OK for shallow + True + -- full hashes are exactly 40 characters + | Just tg <- srpTag + , length tg == 40 + , all (`elem` (['0' .. '9'] ++ ['a' .. 'f'] ++ ['A' .. 'F'])) tg = + True + | otherwise = + False + + depthIs1 + | doShallow = ["--depth=1"] + | otherwise = [] + cloneArgs = - ["clone", "--depth=1", "--no-checkout", loc, localDir] + ["clone"] + ++ depthIs1 + ++ [ "--no-checkout", loc, localDir] ++ case peer of Nothing -> [] Just peerLocalDir -> ["--reference", peerLocalDir] diff --git a/cabal-testsuite/PackageTests/SourceRepositoryPackageShallow/cabal.out b/cabal-testsuite/PackageTests/SourceRepositoryPackageShallow/cabal.out new file mode 100644 index 00000000000..b5579a8defc --- /dev/null +++ b/cabal-testsuite/PackageTests/SourceRepositoryPackageShallow/cabal.out @@ -0,0 +1,10 @@ +# cabal v2-build +Configuration is affected by the following files: +- cabal.project +Resolving dependencies... +Build profile: -w ghc- -O1 +In order, the following will be built: + - puppy-1.0 (lib) (first run) +Configuring library for puppy-1.0... +Preprocessing library for puppy-1.0... +Building library for puppy-1.0... diff --git a/cabal-testsuite/PackageTests/SourceRepositoryPackageShallow/cabal.project b/cabal-testsuite/PackageTests/SourceRepositoryPackageShallow/cabal.project new file mode 100644 index 00000000000..275c4fc4bb6 --- /dev/null +++ b/cabal-testsuite/PackageTests/SourceRepositoryPackageShallow/cabal.project @@ -0,0 +1,8 @@ +packages: . + +-- Regression for https://github.com/haskell/cabal/issues/10605 +-- This is `my-lib` 0.9. +source-repository-package + type: git + location: https://github.com/9999years/cabal-testsuite-my-lib.git + tag: 9a0af0aa diff --git a/cabal-testsuite/PackageTests/SourceRepositoryPackageShallow/cabal.test.hs b/cabal-testsuite/PackageTests/SourceRepositoryPackageShallow/cabal.test.hs new file mode 100644 index 00000000000..d8024a44c0a --- /dev/null +++ b/cabal-testsuite/PackageTests/SourceRepositoryPackageShallow/cabal.test.hs @@ -0,0 +1,4 @@ +import Test.Cabal.Prelude + +main = cabalTest $ do + cabal "v2-build" [] diff --git a/cabal-testsuite/PackageTests/SourceRepositoryPackageShallow/puppy.cabal b/cabal-testsuite/PackageTests/SourceRepositoryPackageShallow/puppy.cabal new file mode 100644 index 00000000000..d4dbe921e99 --- /dev/null +++ b/cabal-testsuite/PackageTests/SourceRepositoryPackageShallow/puppy.cabal @@ -0,0 +1,9 @@ +cabal-version: 3.0 +name: puppy +version: 1.0 + +library + default-language: Haskell2010 + hs-source-dirs: src + build-depends: base + exposed-modules: Puppy diff --git a/cabal-testsuite/PackageTests/SourceRepositoryPackageShallow/src/Puppy.hs b/cabal-testsuite/PackageTests/SourceRepositoryPackageShallow/src/Puppy.hs new file mode 100644 index 00000000000..47209451314 --- /dev/null +++ b/cabal-testsuite/PackageTests/SourceRepositoryPackageShallow/src/Puppy.hs @@ -0,0 +1 @@ +module Puppy () where diff --git a/doc/how-to-source-packages.rst b/doc/how-to-source-packages.rst index ec26f26f721..76fe7305974 100644 --- a/doc/how-to-source-packages.rst +++ b/doc/how-to-source-packages.rst @@ -239,6 +239,9 @@ for the ``tag`` field: - If the ``tag`` field is a Git branch name then the latest commit on that branch is used. - If the ``tag`` field is a Git tag then the current commit that tag points to is used. +Note that if the tag is not a full git hash (40 characters, hexadecimal), then +the source repository must be fully cloned, which is often much slower than +doing a shallow clone. *Source code* when dependency vendoring --------------------------------------- From 9ea6d4e4d02ae8ad198ca35f69c4ad256b6bd5d8 Mon Sep 17 00:00:00 2001 From: Rodrigo Mesquita Date: Fri, 13 Dec 2024 18:02:25 +0000 Subject: [PATCH 2/3] Fix verbosity of git The lack of parenthesis in this line meant that we'd only see the verbose output from git when we had a `peerLocalDir`. This should fix verbosity of git --- cabal-install/src/Distribution/Client/VCS.hs | 9 +++++---- 1 file changed, 5 insertions(+), 4 deletions(-) diff --git a/cabal-install/src/Distribution/Client/VCS.hs b/cabal-install/src/Distribution/Client/VCS.hs index afd6dfea43c..a7356d85a3b 100644 --- a/cabal-install/src/Distribution/Client/VCS.hs +++ b/cabal-install/src/Distribution/Client/VCS.hs @@ -637,10 +637,11 @@ vcsGit = cloneArgs = ["clone"] ++ depthIs1 - ++ [ "--no-checkout", loc, localDir] - ++ case peer of - Nothing -> [] - Just peerLocalDir -> ["--reference", peerLocalDir] + ++ ["--no-checkout", loc, localDir] + ++ ( case peer of + Nothing -> [] + Just peerLocalDir -> ["--reference", peerLocalDir] + ) ++ verboseArg where loc = srpLocation From a19c6e3f5172b2fa0fb299d2f6b8a9513b0fc41e Mon Sep 17 00:00:00 2001 From: Rodrigo Mesquita Date: Wed, 18 Dec 2024 09:57:11 +0000 Subject: [PATCH 3/3] shallow clones: fetch tags shallowly too It turns out that git fetch origin tag will clone the full repository unless it is also given --depth=1 as an argument. This commit amends this oversight, ensuring source-repository-package stanzas with any tag don't have to fall back to fetch unnecessary information (which is coincidentally much faster) --- cabal-install/src/Distribution/Client/VCS.hs | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/cabal-install/src/Distribution/Client/VCS.hs b/cabal-install/src/Distribution/Client/VCS.hs index a7356d85a3b..10635384d10 100644 --- a/cabal-install/src/Distribution/Client/VCS.hs +++ b/cabal-install/src/Distribution/Client/VCS.hs @@ -583,7 +583,7 @@ vcsGit = -- -- Option 2 is what Cabal has done historically, and we're keeping it -- for now. Option 1 is possible but seems to have little benefit. - git localDir ("fetch" : verboseArg ++ ["origin", ref]) + git localDir ("fetch" : verboseArg ++ ["--depth=1", "origin", ref]) pure "FETCH_HEAD" Just ref | otherwise ->