Skip to content

Commit

Permalink
Use Base16 hash for script path.
Browse files Browse the repository at this point in the history
Issue #9334 shows that `%` characters on Windows result in invalid
paths, also `/` characters on Linux create invalid paths.

This changes from using base64 to using base16 with the same length
we use for unit-ids.
  • Loading branch information
jasagredo committed Nov 18, 2023
1 parent 88e4b00 commit f9c4641
Show file tree
Hide file tree
Showing 4 changed files with 16 additions and 27 deletions.
1 change: 0 additions & 1 deletion cabal-install/cabal-install.cabal
Original file line number Diff line number Diff line change
Expand Up @@ -209,7 +209,6 @@ library
async >= 2.0 && < 2.3,
array >= 0.4 && < 0.6,
base16-bytestring >= 0.1.1 && < 1.1.0.0,
base64-bytestring >= 1.0 && < 1.3,
binary >= 0.7.3 && < 0.9,
bytestring >= 0.10.6.0 && < 0.13,
containers >= 0.5.6.2 && < 0.8,
Expand Down
5 changes: 0 additions & 5 deletions cabal-install/src/Distribution/Client/HashValue.hs
Original file line number Diff line number Diff line change
Expand Up @@ -7,7 +7,6 @@ module Distribution.Client.HashValue
, hashValue
, truncateHash
, showHashValue
, showHashValueBase64
, readFileHashValue
, hashFromTUF
) where
Expand All @@ -19,7 +18,6 @@ import qualified Hackage.Security.Client as Sec

import qualified Crypto.Hash.SHA256 as SHA256
import qualified Data.ByteString.Base16 as Base16
import qualified Data.ByteString.Base64 as Base64
import qualified Data.ByteString.Char8 as BS
import qualified Data.ByteString.Lazy.Char8 as LBS

Expand Down Expand Up @@ -57,9 +55,6 @@ hashValue = HashValue . SHA256.hashlazy
showHashValue :: HashValue -> String
showHashValue (HashValue digest) = BS.unpack (Base16.encode digest)

showHashValueBase64 :: HashValue -> String
showHashValueBase64 (HashValue digest) = BS.unpack (Base64.encode digest)

-- | Hash the content of a file. Uses SHA256.
readFileHashValue :: FilePath -> IO HashValue
readFileHashValue tarball =
Expand Down
28 changes: 7 additions & 21 deletions cabal-install/src/Distribution/Client/ScriptUtils.hs
Original file line number Diff line number Diff line change
Expand Up @@ -36,8 +36,9 @@ import Distribution.Client.DistDirLayout
, DistDirParams (..)
)
import Distribution.Client.HashValue
( hashValue
, showHashValueBase64
( readFileHashValue
, showHashValue
, truncateHash
)
import Distribution.Client.HttpUtils
( HttpTransport
Expand Down Expand Up @@ -218,33 +219,18 @@ import qualified Text.Parsec as P
-- repl to deal with the fact that the repl is relative to the working directory and not
-- the project root.

-- | Get the hash of a script's absolute path)
--
-- Two hashes will be the same as long as the absolute paths
-- are the same.
-- | Get the hash of a script's contents.
getScriptHash :: FilePath -> IO String
getScriptHash script =
-- Base64 is shorter than Base16, which helps avoid long path issues on windows
-- but it can contain /'s which aren't valid in file paths so replace them with
-- %'s. 26 chars / 130 bits is enough to practically avoid collisions.
map (\c -> if c == '/' then '%' else c)
. take 26
. showHashValueBase64
. hashValue
. fromString
<$> canonicalizePath script
showHashValue
. truncateHash 26
<$> readFileHashValue script

-- | Get the directory for caching a script build.
--
-- The only identity of a script is it's absolute path, so append the
-- hashed path to the @script-builds@ dir to get the cache directory.
getScriptCacheDirectory :: FilePath -> IO FilePath
getScriptCacheDirectory script = (</>) <$> defaultScriptBuildsDir <*> getScriptHash script

-- | Get the directory for caching a script build and ensure it exists.
--
-- The only identity of a script is it's absolute path, so append the
-- hashed path to the @script-builds@ dir to get the cache directory.
ensureScriptCacheDirectory :: Verbosity -> FilePath -> IO FilePath
ensureScriptCacheDirectory verbosity script = do
cacheDir <- getScriptCacheDirectory script
Expand Down
9 changes: 9 additions & 0 deletions changelog.d/base16-script-cache
Original file line number Diff line number Diff line change
@@ -0,0 +1,9 @@
synopsis: Script cache dir is the base16 hash of the contents of the script.
prs: #9459
packages: cabal-install

description: {

Script cache dir is the base16 hash of the contents of the script.

}

0 comments on commit f9c4641

Please sign in to comment.