Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Gnu tar long filenames #80

Merged
Merged
Show file tree
Hide file tree
Changes from 3 commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 1 addition & 0 deletions Codec/Archive/Tar/Entry.hs
Original file line number Diff line number Diff line change
Expand Up @@ -48,6 +48,7 @@ module Codec.Archive.Tar.Entry (
fileEntry,
directoryEntry,
longLinkEntry,
longSymLinkEntry,

-- * Standard file permissions
-- | For maximum portability when constructing archives use only these file
Expand Down
35 changes: 27 additions & 8 deletions Codec/Archive/Tar/Pack.hs
Original file line number Diff line number Diff line change
@@ -1,4 +1,5 @@
{-# LANGUAGE MultiWayIf #-}
{-# LANGUAGE LambdaCase #-}
-----------------------------------------------------------------------------
-- |
-- Module : Codec.Archive.Tar
Expand All @@ -23,6 +24,7 @@ module Codec.Archive.Tar.Pack (

import Codec.Archive.Tar.Types
import Control.Monad (join, when, forM)
import qualified Data.ByteString as BSS
import qualified Data.ByteString.Lazy as BS
import System.FilePath
( (</>) )
Expand Down Expand Up @@ -80,24 +82,35 @@ preparePaths baseDir paths =
packPaths :: FilePath -> [FilePath] -> IO [Entry]
packPaths baseDir paths =
fmap concat $ interleave
[ do let tarpath = toTarPath' isDir relpath
[ do let tarpathRes = toTarPath' isDir relpath
isSymlink <- pathIsSymbolicLink filepath
if | isSymlink -> withLongLinkEntry filepath tarpath packSymlinkEntry
| isDir -> withLongLinkEntry filepath tarpath packDirectoryEntry
| otherwise -> withLongLinkEntry filepath tarpath packFileEntry
case tarpathRes of
FileNameEmpty -> throwIO $ userError "File name empty"
FileNameOK tarpath
| isSymlink -> (:[]) <$> packSymlinkEntry filepath tarpath
| isDir -> (:[]) <$> packDirectoryEntry filepath tarpath
| otherwise -> (:[]) <$> packFileEntry filepath tarpath
FileNameTooLong tarpath
| isSymlink -> do
linkTarget <- getSymbolicLinkTarget filepath
packSymlinkEntry' linkTarget tarpath >>= \case
sym@(Entry { entryContent = SymbolicLink (LinkTarget bs) })
| BSS.length bs > 100 -> do
pure [longSymLinkEntry linkTarget, longLinkEntry filepath, sym]
_ -> withLongLinkEntry filepath tarpath packSymlinkEntry
| isDir -> withLongLinkEntry filepath tarpath packDirectoryEntry
| otherwise -> withLongLinkEntry filepath tarpath packFileEntry
| relpath <- paths
, let isDir = FilePath.Native.hasTrailingPathSeparator filepath
filepath = baseDir </> relpath ]
where
-- prepend the long filepath entry if necessary
withLongLinkEntry
:: FilePath
-> ToTarPathResult
-> TarPath
-> (FilePath -> TarPath -> IO Entry)
-> IO [Entry]
withLongLinkEntry _ FileNameEmpty _ = throwIO $ userError "File name empty"
withLongLinkEntry filepath (FileNameOK tarpath) f = (:[]) <$> f filepath tarpath
withLongLinkEntry filepath (FileNameTooLong tarpath) f = do
withLongLinkEntry filepath tarpath f = do
mainEntry <- f filepath tarpath
pure [longLinkEntry filepath, mainEntry]

Expand Down Expand Up @@ -156,6 +169,12 @@ packSymlinkEntry :: FilePath -- ^ Full path to find the file on the local disk
-> IO Entry
packSymlinkEntry filepath tarpath = do
linkTarget <- getSymbolicLinkTarget filepath
packSymlinkEntry' linkTarget tarpath

packSymlinkEntry' :: String -- ^ link target
-> TarPath -- ^ Path to use for the tar Entry in the archive
-> IO Entry
packSymlinkEntry' linkTarget tarpath = do
let entry tp = symlinkEntry tp linkTarget
safeReturn tp = maybe (pure tp) throwIO $ checkEntrySecurity tp
safeReturn $ entry tarpath
Expand Down
18 changes: 18 additions & 0 deletions Codec/Archive/Tar/Types.hs
Original file line number Diff line number Diff line change
Expand Up @@ -30,6 +30,7 @@ module Codec.Archive.Tar.Types (

simpleEntry,
longLinkEntry,
longSymLinkEntry,
fileEntry,
symlinkEntry,
directoryEntry,
Expand Down Expand Up @@ -265,6 +266,23 @@ longLinkEntry tarpath = Entry {
entryFormat = GnuFormat
}

-- | [GNU extension](https://www.gnu.org/software/tar/manual/html_node/Standard.html)
-- to store a link target too long to fit into 'entryTarPath'
-- as 'OtherEntryType' @\'K\'@ with the full filepath as 'entryContent'.
-- The next entry must contain the actual
-- data with truncated 'entryTarPath'.
--
-- @since 0.6.0.0
longSymLinkEntry :: FilePath -> Entry
longSymLinkEntry linkTarget = Entry {
entryTarPath = TarPath (BS.Char8.pack "././@LongLink") BS.empty,
entryContent = OtherEntryType 'K' (LBS.fromStrict $ BS.Char8.pack linkTarget) (fromIntegral $ length linkTarget),
hasufell marked this conversation as resolved.
Show resolved Hide resolved
entryPermissions = ordinaryFilePermissions,
entryOwnership = Ownership "" "" 0 0,
entryTime = 0,
entryFormat = GnuFormat
}

-- | A tar 'Entry' for a directory.
--
-- Entry fields such as file permissions and ownership have default values.
Expand Down
83 changes: 56 additions & 27 deletions Codec/Archive/Tar/Unpack.hs
Original file line number Diff line number Diff line change
Expand Up @@ -22,6 +22,7 @@ import Codec.Archive.Tar.Check
import Data.Bits
( testBit )
import Data.List (partition, nub)
import Data.Maybe ( fromMaybe )
import qualified Data.ByteString.Char8 as Char8
import qualified Data.ByteString.Lazy as BS
import System.FilePath
Expand All @@ -32,6 +33,7 @@ import System.Directory
( createDirectoryIfMissing, copyFile, setPermissions, getDirectoryContents, doesDirectoryExist, createDirectoryLink, createFileLink )
import Control.Exception
( Exception, throwIO, handle )
import System.IO ( stderr, hPutStr )
import System.IO.Error
( ioeGetErrorType )
import GHC.IO (unsafeInterleaveIO)
Expand Down Expand Up @@ -73,7 +75,7 @@ import System.IO.Error
--
unpack :: Exception e => FilePath -> Entries e -> IO ()
unpack baseDir entries = do
uEntries <- unpackEntries [] (checkSecurity entries)
uEntries <- unpackEntries Nothing Nothing [] (checkSecurity entries)
let (hardlinks, symlinks) = partition (\(_, _, x) -> x) uEntries
-- handle hardlinks first, in case a symlink points to it
handleHardLinks hardlinks
Expand All @@ -83,32 +85,59 @@ unpack baseDir entries = do
-- We're relying here on 'checkSecurity' to make sure we're not scribbling
-- files all over the place.

unpackEntries _ (Fail err) = either throwIO throwIO err
unpackEntries links Done = return links
unpackEntries links (Next entry es) = case entryContent entry of
NormalFile file _ -> do
extractFile (entryPermissions entry) (entryPath entry) file (entryTime entry)
unpackEntries links es
Directory -> do
extractDir (entryPath entry) (entryTime entry)
unpackEntries links es
HardLink link -> (unpackEntries $! saveLink True (entryPath entry) link links) es
SymbolicLink link -> (unpackEntries $! saveLink False (entryPath entry) link links) es
OtherEntryType 'L' (Char8.unpack . BS.toStrict -> fn) _ ->
case es of
(Next entry' es') -> case entryContent entry' of
NormalFile file _ -> do
extractFile (entryPermissions entry') fn file (entryTime entry')
unpackEntries links es'
Directory -> extractDir fn (entryTime entry')
>> unpackEntries links es'
HardLink link -> (unpackEntries $! saveLink True fn link links) es'
SymbolicLink link -> (unpackEntries $! saveLink False fn link links) es'
OtherEntryType 'L' _ _ -> throwIO $ userError "Two subsequent OtherEntryType 'L'"
_ -> unpackEntries links es'
(Fail err) -> either throwIO throwIO err
Done -> throwIO $ userError "././@LongLink without a subsequent entry"
_ -> unpackEntries links es --ignore other file types
unpackEntries :: Exception e
=> Maybe LinkTarget
-> Maybe FilePath
-> [(FilePath, FilePath, Bool)] -- ^ links (path, link, isHardLink)
-> Entries (Either e FileNameError) -- ^ entries
-> IO [(FilePath, FilePath, Bool)]
unpackEntries _ _ _ (Fail err) = either throwIO throwIO err
unpackEntries _ _ links Done = return links
unpackEntries mLink mPath links (Next entry es) = do
hasufell marked this conversation as resolved.
Show resolved Hide resolved
let path = fromMaybe (entryPath entry) mPath
case entryContent entry of
NormalFile file _
| Just _ <- mLink -> throwIO $ userError "Expected SymbolicLink or HardLink after OtherEntryType K"
| otherwise -> do
extractFile (entryPermissions entry) path file (entryTime entry)
unpackEntries Nothing Nothing links es
Directory
| Just _ <- mLink -> throwIO $ userError "Expected SymbolicLink or HardLink after OtherEntryType K"
| otherwise -> do
extractDir path (entryTime entry)
unpackEntries Nothing Nothing links es
HardLink link -> do
let linkTarget = fromMaybe link mLink
(unpackEntries Nothing Nothing $! saveLink True path linkTarget links) es
SymbolicLink link -> do
let linkTarget = fromMaybe link mLink
(unpackEntries Nothing Nothing $! saveLink False path linkTarget links) es
OtherEntryType 'L' fn _
| Just _ <- mPath -> throwIO $ userError "Two subsequent OtherEntryType L"
| otherwise -> unpackEntries mLink (Just . Char8.unpack . BS.toStrict $ fn) links es
OtherEntryType 'K' link _
| Just _ <- mLink -> throwIO $ userError "Two subsequent OtherEntryType K"
| otherwise -> unpackEntries (Just . LinkTarget . BS.toStrict $ link) mPath links es
OtherEntryType _ file _
| Just _ <- mLink -> throwIO $ userError "Unknown entry type following OtherEntryType K"
hasufell marked this conversation as resolved.
Show resolved Hide resolved
| Just _ <- mPath -> throwIO $ userError "Unknown entry type following OtherEntryType L"
| otherwise -> do
hPutStr stderr "Warning: Unknown tar typecode, attempting to extract as normal file"
hasufell marked this conversation as resolved.
Show resolved Hide resolved
extractFile (entryPermissions entry) path file (entryTime entry)
unpackEntries Nothing Nothing links es
hasufell marked this conversation as resolved.
Show resolved Hide resolved
ec -> do
hPutStr stderr $ "Warning: Unsupported typecode \"" <> printEntryContentType ec <> "\", skipping"
hasufell marked this conversation as resolved.
Show resolved Hide resolved
unpackEntries Nothing Nothing links es -- ignore other file types
where
printEntryContentType NormalFile{} = "normal file"
printEntryContentType Directory{} = "directory"
printEntryContentType SymbolicLink{} = "symlink"
printEntryContentType HardLink{} = "hardlink"
printEntryContentType CharacterDevice{} = "chardev"
printEntryContentType BlockDevice{} = "blockdev"
printEntryContentType NamedPipe{} = "namedpipe"
printEntryContentType (OtherEntryType t _ _) = "other entry " <> show t


extractFile permissions path content mtime = do
-- Note that tar archives do not make sure each directory is created
Expand Down
4 changes: 3 additions & 1 deletion tar.cabal
Original file line number Diff line number Diff line change
Expand Up @@ -23,7 +23,8 @@ description: This library is for working with \"@.tar@\" archive files. It
content using an index.
build-type: Simple
cabal-version: 2.0
extra-source-files: changelog.md
extra-source-files: test/data/long.tar
extra-doc-files: changelog.md
tested-with: GHC==9.8.1, GHC==9.6.3, GHC==9.4.8, GHC==9.2.8, GHC==9.0.2,
GHC==8.10.7, GHC==8.8.4, GHC==8.6.5, GHC==8.4.4,
GHC==8.2.2, GHC==8.0.2
Expand Down Expand Up @@ -87,6 +88,7 @@ test-suite properties
containers,
deepseq,
directory >= 1.2,
file-embed,
filepath,
QuickCheck == 2.*,
tar-internal,
Expand Down
15 changes: 15 additions & 0 deletions test/Codec/Archive/Tar/Pack/Tests.hs
Original file line number Diff line number Diff line change
@@ -1,9 +1,17 @@
{-# LANGUAGE BangPatterns #-}
{-# LANGUAGE OverloadedStrings #-}
{-# LANGUAGE TemplateHaskell #-}
{-# LANGUAGE ScopedTypeVariables #-}

module Codec.Archive.Tar.Pack.Tests
( prop_roundtrip
, unit_roundtrip
) where

import qualified Data.ByteString as B
import qualified Data.ByteString.Lazy as BL
import Data.FileEmbed
import qualified Codec.Archive.Tar as Tar
import qualified Codec.Archive.Tar.Pack as Pack
import Codec.Archive.Tar.Types (Entries(..))
import qualified Codec.Archive.Tar.Unpack as Unpack
Expand Down Expand Up @@ -49,3 +57,10 @@ prop_roundtrip xss (ASCIIString cnt)
mkFilePath :: ASCIIString -> FilePath
mkFilePath (ASCIIString xs) = makeValid $
filter (\c -> not $ isPathSeparator c || c == '.') xs

unit_roundtrip :: Property
unit_roundtrip =
let tar :: BL.ByteString = BL.fromStrict $(embedFile "test/data/long.tar")
entries = Tar.foldEntries (:) [] (const []) (Tar.read tar)
in Tar.write entries === tar

3 changes: 2 additions & 1 deletion test/Properties.hs
Original file line number Diff line number Diff line change
Expand Up @@ -55,7 +55,8 @@ main =
]

, testGroup "pack" [
testProperty "roundtrip" Pack.prop_roundtrip
testProperty "roundtrip" Pack.prop_roundtrip,
testProperty "long symlink" Pack.unit_roundtrip
]
]

Binary file added test/data/long.tar
Binary file not shown.
Loading