Files
sharpcompress/tests/SharpCompress.Test/Tar/TarReaderTests.cs

304 lines
11 KiB
C#
Raw Permalink Normal View History

2022-12-20 15:06:44 +00:00
using System;
2022-12-20 13:09:16 +00:00
using System.Collections.Generic;
2015-12-30 11:19:42 +00:00
using System.IO;
using SharpCompress.Common;
using SharpCompress.Compressors.BZip2;
using SharpCompress.Factories;
2016-09-26 11:49:49 +01:00
using SharpCompress.Readers;
using SharpCompress.Readers.Tar;
using SharpCompress.Test.Mocks;
2017-05-30 15:14:02 +01:00
using Xunit;
2015-12-30 11:19:42 +00:00
2022-12-20 15:20:49 +00:00
namespace SharpCompress.Test.Tar;
public class TarReaderTests : ReaderTests
2015-12-30 11:19:42 +00:00
{
2022-12-20 15:20:49 +00:00
public TarReaderTests() => UseExtensionInsteadOfNameToVerify = true;
2015-12-30 11:19:42 +00:00
2022-12-20 15:20:49 +00:00
[Fact]
public void Tar_Reader() => Read("Tar.tar", CompressionType.None);
2015-12-30 11:19:42 +00:00
2022-12-20 15:20:49 +00:00
[Fact]
public void Tar_Skip()
{
2024-03-14 08:37:17 +00:00
using Stream stream = new ForwardOnlyStream(
File.OpenRead(Path.Combine(TEST_ARCHIVES_PATH, "Tar.tar"))
);
2026-01-15 11:41:30 +00:00
using var reader = ReaderFactory.OpenReader(stream);
2024-03-14 08:38:12 +00:00
var x = 0;
2024-03-14 08:37:17 +00:00
while (reader.MoveToNextEntry())
2022-12-20 15:20:49 +00:00
{
2024-03-14 08:37:17 +00:00
if (!reader.Entry.IsDirectory)
{
2024-03-14 08:37:17 +00:00
x++;
if (x % 2 == 0)
{
reader.WriteEntryToDirectory(SCRATCH_FILES_PATH);
}
}
}
2022-12-20 15:20:49 +00:00
}
[Fact]
public void Tar_Z_Reader() => Read("Tar.tar.Z", CompressionType.Lzw);
2022-12-20 15:20:49 +00:00
[Fact]
public void Tar_BZip2_Reader() => Read("Tar.tar.bz2", CompressionType.BZip2);
2015-12-30 11:19:42 +00:00
2022-12-20 15:20:49 +00:00
[Fact]
public void Tar_GZip_Reader() => Read("Tar.tar.gz", CompressionType.GZip);
2015-12-30 11:19:42 +00:00
2025-09-23 03:26:33 -07:00
[Fact]
public void Tar_ZStandard_Reader() => Read("Tar.tar.zst", CompressionType.ZStandard);
2022-12-20 15:20:49 +00:00
[Fact]
public void Tar_LZip_Reader() => Read("Tar.tar.lz", CompressionType.LZip);
2022-12-20 15:20:49 +00:00
[Fact]
public void Tar_Xz_Reader() => Read("Tar.tar.xz", CompressionType.Xz);
[Fact]
public void Tar_GZip_OldGnu_Reader() => Read("Tar.oldgnu.tar.gz", CompressionType.GZip);
[Fact]
public void Tar_BZip2_Reader_NonSeekable()
{
// Regression test for: Dynamic default RingBuffer for BZip2
// Opening a .tar.bz2 from a non-seekable stream should succeed
// because EnsureMinimumRewindBufferSize expands the ring buffer
// to hold the BZip2 block before calling IsTarFile.
using var fs = File.OpenRead(Path.Combine(TEST_ARCHIVES_PATH, "Tar.tar.bz2"));
using var nonSeekable = new ForwardOnlyStream(fs);
using var reader = ReaderFactory.OpenReader(nonSeekable);
var entryCount = 0;
while (reader.MoveToNextEntry())
{
if (!reader.Entry.IsDirectory)
{
entryCount++;
}
}
Assert.True(entryCount > 0);
}
[Fact]
public void TarWrapper_BZip2_MinimumRewindBufferSize_IsMaxBZip2BlockSize()
{
// The BZip2 TarWrapper must declare a MinimumRewindBufferSize large enough
// to hold an entire maximum-size compressed BZip2 block (9 × 100 000 bytes).
var bzip2Wrapper = Array.Find(
TarWrapper.Wrappers,
w => w.CompressionType == CompressionType.BZip2
);
Assert.NotNull(bzip2Wrapper);
Assert.Equal(BZip2Constants.baseBlockSize * 9, bzip2Wrapper.MinimumRewindBufferSize);
}
[Fact]
public void TarWrapper_Default_MinimumRewindBufferSize_Is_DefaultRewindableBufferSize()
{
// Non-BZip2 wrappers that don't specify a custom size default to
// Constants.RewindableBufferSize so existing behaviour is unchanged.
var noneWrapper = Array.Find(
TarWrapper.Wrappers,
w => w.CompressionType == CompressionType.None
);
Assert.NotNull(noneWrapper);
Assert.Equal(Common.Constants.RewindableBufferSize, noneWrapper.MinimumRewindBufferSize);
}
2022-12-20 15:20:49 +00:00
[Fact]
public void Tar_BZip2_Entry_Stream()
{
using (Stream stream = File.OpenRead(Path.Combine(TEST_ARCHIVES_PATH, "Tar.tar.bz2")))
2026-01-15 11:41:30 +00:00
using (var reader = TarReader.OpenReader(stream))
2015-12-30 11:19:42 +00:00
{
2022-12-20 15:20:49 +00:00
while (reader.MoveToNextEntry())
2015-12-30 11:19:42 +00:00
{
2022-12-20 15:20:49 +00:00
if (!reader.Entry.IsDirectory)
2015-12-30 11:19:42 +00:00
{
2022-12-20 15:20:49 +00:00
Assert.Equal(CompressionType.BZip2, reader.Entry.CompressionType);
2024-03-14 08:37:17 +00:00
using var entryStream = reader.OpenEntryStream();
2024-03-14 08:38:12 +00:00
var file = Path.GetFileName(reader.Entry.Key);
var folder =
2024-03-14 08:37:17 +00:00
Path.GetDirectoryName(reader.Entry.Key)
?? throw new ArgumentNullException();
2024-03-14 08:38:12 +00:00
var destdir = Path.Combine(SCRATCH_FILES_PATH, folder);
2024-03-14 08:37:17 +00:00
if (!Directory.Exists(destdir))
2015-12-30 11:19:42 +00:00
{
2024-03-14 08:37:17 +00:00
Directory.CreateDirectory(destdir);
2015-12-30 11:19:42 +00:00
}
2024-04-18 14:25:10 +01:00
var destinationFileName = Path.Combine(destdir, file.NotNull());
2024-03-14 08:37:17 +00:00
2024-03-14 08:38:12 +00:00
using var fs = File.OpenWrite(destinationFileName);
2025-10-22 09:17:13 +01:00
entryStream.CopyTo(fs);
2015-12-30 11:19:42 +00:00
}
}
}
2022-12-20 15:20:49 +00:00
VerifyFiles();
}
2015-12-30 11:19:42 +00:00
2022-12-20 15:20:49 +00:00
[Fact]
public void Tar_LongNamesWithLongNameExtension()
{
var filePaths = new List<string>();
2022-12-20 15:20:49 +00:00
using (
Stream stream = File.OpenRead(
Path.Combine(TEST_ARCHIVES_PATH, "Tar.LongPathsWithLongNameExtension.tar")
2022-12-20 13:45:47 +00:00
)
2022-12-20 15:20:49 +00:00
)
2026-01-15 11:41:30 +00:00
using (var reader = TarReader.OpenReader(stream))
2022-12-20 15:20:49 +00:00
{
while (reader.MoveToNextEntry())
{
2022-12-20 15:20:49 +00:00
if (!reader.Entry.IsDirectory)
{
2024-04-18 14:25:10 +01:00
filePaths.Add(reader.Entry.Key.NotNull("Entry Key is null"));
2021-01-09 13:33:34 +00:00
}
}
}
2022-12-20 15:20:49 +00:00
Assert.Equal(3, filePaths.Count);
Assert.Contains("a.txt", filePaths);
Assert.Contains(
"wp-content/plugins/gravityformsextend/lib/Aws/Symfony/Component/ClassLoader/Tests/Fixtures/Apc/beta/Apc/ApcPrefixCollision/A/B/Bar.php",
filePaths
);
Assert.Contains(
"wp-content/plugins/gravityformsextend/lib/Aws/Symfony/Component/ClassLoader/Tests/Fixtures/Apc/beta/Apc/ApcPrefixCollision/A/B/Foo.php",
filePaths
);
}
[Fact]
public void Tar_BZip2_Skip_Entry_Stream()
{
2024-03-14 08:37:17 +00:00
using Stream stream = File.OpenRead(Path.Combine(TEST_ARCHIVES_PATH, "Tar.tar.bz2"));
2026-01-15 11:41:30 +00:00
using var reader = TarReader.OpenReader(stream);
2024-03-14 08:53:08 +00:00
var names = new List<string>();
2024-03-14 08:37:17 +00:00
while (reader.MoveToNextEntry())
2015-12-30 11:19:42 +00:00
{
2024-03-14 08:37:17 +00:00
if (!reader.Entry.IsDirectory)
2015-12-30 11:19:42 +00:00
{
2024-03-14 08:37:17 +00:00
Assert.Equal(CompressionType.BZip2, reader.Entry.CompressionType);
using var entryStream = reader.OpenEntryStream();
entryStream.SkipEntry();
2024-04-18 14:25:10 +01:00
names.Add(reader.Entry.Key.NotNull());
2015-12-30 11:19:42 +00:00
}
}
2024-03-14 08:37:17 +00:00
Assert.Equal(3, names.Count);
2022-12-20 15:20:49 +00:00
}
Merge branch 'master' into dnx Conflicts: NuGet/sharpcompress.nuspec SharpCompress/Common/Zip/WinzipAesCryptoStream.Portable.cs SharpCompress/Common/Zip/WinzipAesEncryptionData.Portable.cs SharpCompress/Crypto/PBKDF2.cs SharpCompress/SharpCompress.Portable.csproj SharpCompress/SharpCompress.PortableTest.csproj SharpCompress/SharpCompress.Unsigned.csproj SharpCompress/SharpCompress.WindowsStore.csproj SharpCompress/SharpCompress.csproj src/SharpCompress/Archive/ArchiveFactory.cs src/SharpCompress/Archive/Rar/FileInfoRarFilePart.cs src/SharpCompress/Archive/Rar/RarArchive.cs src/SharpCompress/Archive/Rar/RarArchiveEntry.cs src/SharpCompress/Archive/SevenZip/SevenZipArchiveEntry.cs src/SharpCompress/Common/GZip/GZipFilePart.cs src/SharpCompress/Common/GZip/GZipVolume.cs src/SharpCompress/Common/Rar/Headers/MarkHeader.cs src/SharpCompress/Common/Rar/Headers/RarHeaderFactory.cs src/SharpCompress/Common/SevenZip/ArchiveReader.cs src/SharpCompress/Common/SevenZip/DataReader.cs src/SharpCompress/Common/Tar/Headers/TarHeader.cs src/SharpCompress/Common/Zip/Headers/ZipFileEntry.cs src/SharpCompress/Common/Zip/WinzipAesCryptoStream.cs src/SharpCompress/Common/Zip/WinzipAesEncryptionData.cs src/SharpCompress/Common/Zip/ZipFilePart.cs src/SharpCompress/Compressor/Deflate/GZipStream.cs src/SharpCompress/Compressor/Deflate/Inflate.cs src/SharpCompress/Compressor/Deflate/ZlibBaseStream.cs src/SharpCompress/Compressor/LZMA/Bcj2DecoderStream.cs src/SharpCompress/Compressor/LZMA/LzmaStream.cs src/SharpCompress/Compressor/PPMd/H/FreqData.cs src/SharpCompress/Compressor/PPMd/H/PPMContext.cs src/SharpCompress/Compressor/PPMd/H/RarMemBlock.cs src/SharpCompress/Compressor/PPMd/H/RarNode.cs src/SharpCompress/Compressor/PPMd/H/State.cs src/SharpCompress/Compressor/PPMd/PpmdProperties.cs src/SharpCompress/Compressor/Rar/VM/RarVM.cs src/SharpCompress/EnumExtensions.cs src/SharpCompress/IO/MarkingBinaryReader.cs src/SharpCompress/Reader/ReaderFactory.cs src/SharpCompress/Utility.cs src/SharpCompress/Writer/IWriter.Extensions.cs src/SharpCompress/Writer/Zip/ZipCentralDirectoryEntry.cs src/SharpCompress/Writer/Zip/ZipWriter.cs test/SharpCompress.Test/Tar/TarArchiveTests.cs test/SharpCompress.Test/Tar/TarReaderTests.cs
2016-02-13 09:24:44 +00:00
2022-12-20 15:20:49 +00:00
[Fact]
public void Tar_Containing_Rar_Reader()
{
2024-03-14 08:38:12 +00:00
var archiveFullPath = Path.Combine(TEST_ARCHIVES_PATH, "Tar.ContainsRar.tar");
2024-03-14 08:37:17 +00:00
using Stream stream = File.OpenRead(archiveFullPath);
2026-01-15 11:41:30 +00:00
using var reader = ReaderFactory.OpenReader(stream);
Assert.True(reader.Type == ArchiveType.Tar);
2022-12-20 15:20:49 +00:00
}
2022-12-20 15:20:49 +00:00
[Fact]
public void Tar_With_TarGz_With_Flushed_EntryStream()
{
2024-03-14 08:38:12 +00:00
var archiveFullPath = Path.Combine(TEST_ARCHIVES_PATH, "Tar.ContainsTarGz.tar");
2024-03-14 08:37:17 +00:00
using Stream stream = File.OpenRead(archiveFullPath);
2026-01-15 11:41:30 +00:00
using var reader = ReaderFactory.OpenReader(stream);
2024-03-14 08:37:17 +00:00
Assert.True(reader.MoveToNextEntry());
Assert.Equal("inner.tar.gz", reader.Entry.Key);
using var entryStream = reader.OpenEntryStream();
2024-03-14 08:38:12 +00:00
using var flushingStream = new FlushOnDisposeStream(entryStream);
2024-03-14 08:37:17 +00:00
// Extract inner.tar.gz
2026-01-15 11:41:30 +00:00
using var innerReader = ReaderFactory.OpenReader(flushingStream);
2024-03-14 08:37:17 +00:00
Assert.True(innerReader.MoveToNextEntry());
Assert.Equal("test", innerReader.Entry.Key);
2022-12-20 15:20:49 +00:00
}
2023-03-28 23:07:21 +02:00
[Fact]
public void Tar_Broken_Stream()
{
2024-03-14 08:38:12 +00:00
var archiveFullPath = Path.Combine(TEST_ARCHIVES_PATH, "Tar.tar");
2024-03-14 08:37:17 +00:00
using Stream stream = File.OpenRead(archiveFullPath);
2026-01-15 11:41:30 +00:00
using var reader = ReaderFactory.OpenReader(stream);
2024-03-14 08:37:17 +00:00
var memoryStream = new MemoryStream();
2024-03-14 08:53:08 +00:00
Assert.True(reader.MoveToNextEntry());
Assert.True(reader.MoveToNextEntry());
2024-03-14 08:37:17 +00:00
reader.WriteEntryTo(memoryStream);
stream.Close();
2024-03-14 08:53:08 +00:00
Assert.Throws<IncompleteArchiveException>(() => reader.MoveToNextEntry());
2023-03-28 23:07:21 +02:00
}
[Fact]
public void Tar_Corrupted()
{
var archiveFullPath = Path.Combine(TEST_ARCHIVES_PATH, "TarCorrupted.tar");
using Stream stream = File.OpenRead(archiveFullPath);
2026-01-15 11:41:30 +00:00
using var reader = ReaderFactory.OpenReader(stream);
var memoryStream = new MemoryStream();
Assert.True(reader.MoveToNextEntry());
Assert.True(reader.MoveToNextEntry());
reader.WriteEntryTo(memoryStream);
stream.Close();
Assert.Throws<IncompleteArchiveException>(() => reader.MoveToNextEntry());
}
[Fact]
public void Tar_Malformed_LongName_Excessive_Size()
{
// Create a malformed TAR header with an excessively large LongName size
// This simulates what happens during auto-detection of compressed files
var buffer = new byte[512];
// Set up a basic TAR header structure
// Name field (offset 0, 100 bytes) - set to "././@LongLink" which is typical for LongName
var nameBytes = System.Text.Encoding.ASCII.GetBytes("././@LongLink");
Array.Copy(nameBytes, 0, buffer, 0, nameBytes.Length);
// Set entry type to LongName (offset 156)
buffer[156] = (byte)'L'; // EntryType.LongName
// Set an excessively large size (offset 124, 12 bytes, octal format)
// This simulates a corrupted/misinterpreted size field
// Using "77777777777" (octal) = 8589934591 bytes (~8GB)
var sizeBytes = System.Text.Encoding.ASCII.GetBytes("77777777777 ");
Array.Copy(sizeBytes, 0, buffer, 124, sizeBytes.Length);
// Calculate and set checksum (offset 148, 8 bytes)
// Set checksum field to spaces first
for (var i = 148; i < 156; i++)
{
buffer[i] = (byte)' ';
}
// Calculate checksum
var checksum = 0;
foreach (var b in buffer)
{
checksum += b;
}
var checksumStr = Convert.ToString(checksum, 8).PadLeft(6, '0') + "\0 ";
var checksumBytes = System.Text.Encoding.ASCII.GetBytes(checksumStr);
Array.Copy(checksumBytes, 0, buffer, 148, checksumBytes.Length);
// Create a stream with this malformed header
using var stream = new MemoryStream();
stream.Write(buffer, 0, buffer.Length);
stream.Position = 0;
// Attempt to read this malformed archive
// The InvalidFormatException from the validation gets caught and converted to IncompleteArchiveException
// The important thing is it doesn't cause OutOfMemoryException
Assert.Throws<IncompleteArchiveException>(() =>
{
2026-01-15 11:41:30 +00:00
using var reader = TarReader.OpenReader(stream);
reader.MoveToNextEntry();
});
}
2015-12-30 11:19:42 +00:00
}