// Source: SubtitleEdit/libse/ZipExtractor.cs (468 lines, 17 KiB, C#)

// ZipStorer, by Jaime Olivares
// Website: zipstorer.codeplex.com
// Version: 2.35 (March 14, 2010)
// Simplified to extract-only by Nikse - August 18, 2010
using System;
using System.Collections.Generic;
using System.IO;
using System.IO.Compression;
using System.Text;
namespace Nikse.SubtitleEdit.Core
{
/// <summary>
/// Zip archive decompression. Represents a Zip file.
/// </summary>
public class ZipExtractor : IDisposable
{
/// <summary>
/// Compression methods handled by this extractor. The numeric values are the
/// method codes read from the Zip headers.
/// </summary>
public enum Compression : ushort
{
    /// <summary>Entry data is stored without compression</summary>
    Store = 0x0000,

    /// <summary>Entry data is compressed with the Deflate method</summary>
    Deflate = 0x0008
}
/// <summary>
/// Represents an entry in the Zip file directory
/// </summary>
public struct ZipFileEntry
{
    /// <summary>Compression method</summary>
    public Compression Method;

    /// <summary>Full path and filename as stored in Zip</summary>
    public string FilenameInZip;

    /// <summary>Original (uncompressed) file size</summary>
    public uint FileSize;

    /// <summary>Compressed file size</summary>
    public uint CompressedSize;

    /// <summary>Offset of header information inside Zip storage</summary>
    public uint HeaderOffset;

    /// <summary>Offset of file data inside Zip storage</summary>
    public uint FileOffset;

    /// <summary>Size of header information</summary>
    public uint HeaderSize;

    /// <summary>32-bit checksum of entire file</summary>
    public uint Crc32;

    /// <summary>Last modification time of file</summary>
    public DateTime ModifyTime;

    /// <summary>User comment for file</summary>
    public string Comment;

    /// <summary>Overridden method</summary>
    /// <returns>Filename in Zip</returns>
    public override string ToString()
    {
        return this.FilenameInZip;
    }
}
#region Public fields
#endregion Public fields
#region Private fields
// Stream the archive is read from; assigned by Open and released by Close
private Stream ZipFileStream;

// Raw bytes of the central directory, loaded by ReadFileInfo
private byte[] CentralDirImage;

// Static CRC32 table, filled once by the static constructor
private static readonly UInt32[] CrcTable;

// Default filename encoder (code page 437), used when an entry is not flagged as UTF-8
private static readonly Encoding DefaultEncoding = Encoding.GetEncoding(437);
#endregion Private fields
#region Public methods
/// <summary>
/// Static constructor. Invoked once in order to create the 256-entry CRC32 lookup table.
/// </summary>
static ZipExtractor()
{
    // Same value as the decimal literal 3988292384
    const UInt32 polynomial = 0xEDB88320;

    CrcTable = new UInt32[256];
    for (int index = 0; index < CrcTable.Length; index++)
    {
        UInt32 entry = (UInt32)index;

        // Process the eight bits of the index, lowest bit first
        for (int bit = 0; bit < 8; bit++)
        {
            entry = (entry & 1) != 0
                ? polynomial ^ (entry >> 1)
                : entry >> 1;
        }

        CrcTable[index] = entry;
    }
}
/// <summary>
/// Method to open an existing storage file
/// </summary>
/// <param name="filename">Full path of Zip file to open</param>
/// <returns>A valid ZipExtractor object</returns>
/// <exception cref="InvalidDataException">The file could not be read as a Zip archive</exception>
public static ZipExtractor Open(string filename)
{
    Stream stream = new FileStream(filename, FileMode.Open, FileAccess.Read);
    try
    {
        return Open(stream);
    }
    catch
    {
        // The stream was created here, so nobody else can release the file
        // handle when opening fails; dispose it before propagating the error.
        stream.Dispose();
        throw;
    }
}
/// <summary>
/// Method to open an existing storage from stream
/// </summary>
/// <param name="stream">Already opened stream with zip contents; its Length and Seek are used while opening</param>
/// <returns>A valid ZipExtractor object</returns>
/// <exception cref="ArgumentNullException"><paramref name="stream"/> is null</exception>
/// <exception cref="InvalidDataException">No end-of-central-directory record could be read from the stream</exception>
/// <remarks>The stream is not disposed here when opening fails.</remarks>
public static ZipExtractor Open(Stream stream)
{
    if (stream == null)
    {
        throw new ArgumentNullException("stream");
    }

    ZipExtractor zip = new ZipExtractor();
    zip.ZipFileStream = stream;
    if (!zip.ReadFileInfo())
    {
        throw new InvalidDataException();
    }

    return zip;
}
/// <summary>
/// Closes the Zip storage by flushing and disposing the underlying stream
/// </summary>
/// <remarks>
/// Must be called explicitly unless the object is disposed.
/// Does nothing when the stream has already been released.
/// </remarks>
public void Close()
{
    Stream archive = this.ZipFileStream;
    if (archive == null)
    {
        return;
    }

    archive.Flush();
    archive.Dispose();
    this.ZipFileStream = null;
}
/// <summary>
/// Read all the file records in the central directory
/// </summary>
/// <returns>
/// List of all entries in directory. Parsing stops at the first record that has
/// an unexpected signature or does not fit completely inside the directory image.
/// </returns>
/// <exception cref="InvalidOperationException">The central directory has not been loaded</exception>
public List<ZipFileEntry> ReadCentralDir()
{
    if (this.CentralDirImage == null)
    {
        throw new InvalidOperationException("Central directory currently does not exist");
    }

    // Size of a central file header without filename, extra field and comment
    const int fixedHeaderSize = 46;

    List<ZipFileEntry> result = new List<ZipFileEntry>();

    // Only continue while a complete fixed-size header fits into the image;
    // otherwise BitConverter would be asked to read past the end of the buffer.
    for (int pointer = 0; pointer <= this.CentralDirImage.Length - fixedHeaderSize;)
    {
        uint signature = BitConverter.ToUInt32(CentralDirImage, pointer);
        if (signature != 0x02014b50)
        {
            break;
        }

        // Bit 0x0800 of the general purpose flag selects UTF-8 for name and comment
        bool encodeUtf8 = (BitConverter.ToUInt16(CentralDirImage, pointer + 8) & 0x0800) != 0;
        ushort method = BitConverter.ToUInt16(CentralDirImage, pointer + 10);
        uint modifyTime = BitConverter.ToUInt32(CentralDirImage, pointer + 12);
        uint crc32 = BitConverter.ToUInt32(CentralDirImage, pointer + 16);
        uint comprSize = BitConverter.ToUInt32(CentralDirImage, pointer + 20);
        uint fileSize = BitConverter.ToUInt32(CentralDirImage, pointer + 24);
        ushort filenameSize = BitConverter.ToUInt16(CentralDirImage, pointer + 28);
        ushort extraSize = BitConverter.ToUInt16(CentralDirImage, pointer + 30);
        ushort commentSize = BitConverter.ToUInt16(CentralDirImage, pointer + 32);
        uint headerOffset = BitConverter.ToUInt32(CentralDirImage, pointer + 42);

        int recordSize = fixedHeaderSize + filenameSize + extraSize + commentSize;
        if (recordSize > this.CentralDirImage.Length - pointer)
        {
            // The variable-length part is truncated: stop instead of reading out of bounds
            break;
        }

        Encoding encoder = encodeUtf8 ? Encoding.UTF8 : DefaultEncoding;

        ZipFileEntry zfe = new ZipFileEntry();
        zfe.Method = (Compression)method;
        zfe.FilenameInZip = encoder.GetString(CentralDirImage, pointer + fixedHeaderSize, filenameSize);
        zfe.FileOffset = GetFileOffset(headerOffset);
        zfe.FileSize = fileSize;
        zfe.CompressedSize = comprSize;
        zfe.HeaderOffset = headerOffset;
        zfe.HeaderSize = (uint)recordSize;
        zfe.Crc32 = crc32;
        zfe.ModifyTime = DosTimeToDateTime(modifyTime);
        if (commentSize > 0)
        {
            // The comment follows the filename and the extra field
            zfe.Comment = encoder.GetString(CentralDirImage, pointer + fixedHeaderSize + filenameSize + extraSize, commentSize);
        }

        result.Add(zfe);
        pointer += recordSize;
    }

    return result;
}
/// <summary>
/// Copy the contents of a stored file into a physical file
/// </summary>
/// <param name="zfe">Entry information of file to extract</param>
/// <param name="filename">Name of file to store uncompressed data</param>
/// <returns>
/// True if success, false if not. Also true, without writing anything,
/// when <paramref name="filename"/> is an existing directory.
/// </returns>
/// <remarks>Unique compression methods are Store and Deflate</remarks>
public bool ExtractFile(ZipFileEntry zfe, string filename)
{
    // Make sure the parent directory exists. GetDirectoryName yields null or an
    // empty string when the name carries no directory part; there is nothing to
    // create in that case, and CreateDirectory would reject such a path.
    string path = Path.GetDirectoryName(filename);
    if (!string.IsNullOrEmpty(path) && !Directory.Exists(path))
    {
        Directory.CreateDirectory(path);
    }

    // Check it is directory. If so, do nothing
    if (Directory.Exists(filename))
    {
        return true;
    }

    bool result;
    using (Stream output = new FileStream(filename, FileMode.Create, FileAccess.Write))
    {
        result = ExtractFile(zfe, output);
    }

    // Stamp the extracted file with the modification time recorded in the entry
    File.SetCreationTime(filename, zfe.ModifyTime);
    File.SetLastWriteTime(filename, zfe.ModifyTime);
    return result;
}
/// <summary>
/// Copy the contents of a stored file into an opened stream
/// </summary>
/// <param name="zfe">Entry information of file to extract</param>
/// <param name="stream">Stream to store the uncompressed data</param>
/// <returns>
/// True if success; false if the local header signature does not match, the
/// compression method is not supported, or the data ends before
/// <c>zfe.FileSize</c> bytes were produced.
/// </returns>
/// <exception cref="ArgumentNullException"><paramref name="stream"/> is null</exception>
/// <exception cref="InvalidOperationException"><paramref name="stream"/> is not writable</exception>
/// <remarks>Unique compression methods are Store and Deflate</remarks>
public bool ExtractFile(ZipFileEntry zfe, Stream stream)
{
    if (stream == null)
    {
        throw new ArgumentNullException("stream");
    }

    if (!stream.CanWrite)
    {
        throw new InvalidOperationException("Stream cannot be written");
    }

    // check signature
    byte[] signature = new byte[4];
    this.ZipFileStream.Seek(zfe.HeaderOffset, SeekOrigin.Begin);
    this.ZipFileStream.Read(signature, 0, 4);
    if (BitConverter.ToUInt32(signature, 0) != 0x04034b50)
    {
        return false;
    }

    // Select input stream for inflating or just reading
    Stream inStream;
    DeflateStream inflater = null;
    if (zfe.Method == Compression.Store)
    {
        inStream = this.ZipFileStream;
    }
    else if (zfe.Method == Compression.Deflate)
    {
        // leaveOpen = true: the archive stream must survive disposing the inflater
        inflater = new DeflateStream(this.ZipFileStream, CompressionMode.Decompress, true);
        inStream = inflater;
    }
    else
    {
        return false;
    }

    try
    {
        // Buffered copy
        byte[] buffer = new byte[16384];
        this.ZipFileStream.Seek(zfe.FileOffset, SeekOrigin.Begin);
        uint bytesPending = zfe.FileSize;
        while (bytesPending > 0)
        {
            int bytesRead = inStream.Read(buffer, 0, (int)Math.Min(bytesPending, buffer.Length));
            if (bytesRead <= 0)
            {
                // The data ended early. Without this check bytesPending would
                // never reach zero and the loop would spin forever.
                stream.Flush();
                return false;
            }

            stream.Write(buffer, 0, bytesRead);
            bytesPending -= (uint)bytesRead;
        }

        stream.Flush();
        return true;
    }
    finally
    {
        // Release the inflater even when reading or writing throws
        if (inflater != null)
        {
            inflater.Dispose();
        }
    }
}
#endregion Public methods
#region Private methods
/// <summary>
/// Calculate the file offset by reading the corresponding local header
/// </summary>
/// <param name="headerOffset">Offset of the entry's local header inside the Zip stream</param>
/// <returns>Offset of the first byte after the local header, filename and extra field</returns>
private uint GetFileOffset(uint headerOffset)
{
    byte[] lengths = new byte[2];

    // The filename length is at byte 26 of the local header and is directly
    // followed by the extra field length. Widen to long so that the addition
    // cannot wrap around for offsets close to the uint limit.
    ZipFileStream.Seek((long)headerOffset + 26, SeekOrigin.Begin);
    ZipFileStream.Read(lengths, 0, 2);
    ushort filenameSize = BitConverter.ToUInt16(lengths, 0);

    ZipFileStream.Read(lengths, 0, 2);
    ushort extraSize = BitConverter.ToUInt16(lengths, 0);

    // 30 is the size of the fixed part of the local header
    return (uint)(30 + filenameSize + extraSize + headerOffset);
}
/* Local file header:
local file header signature 4 bytes (0x04034b50)
version needed to extract 2 bytes
general purpose bit flag 2 bytes
compression method 2 bytes
last mod file time 2 bytes
last mod file date 2 bytes
crc-32 4 bytes
compressed size 4 bytes
uncompressed size 4 bytes
filename length 2 bytes
extra field length 2 bytes
filename (variable size)
extra field (variable size)
*/
/* Central directory's File header:
central file header signature 4 bytes (0x02014b50)
version made by 2 bytes
version needed to extract 2 bytes
general purpose bit flag 2 bytes
compression method 2 bytes
last mod file time 2 bytes
last mod file date 2 bytes
crc-32 4 bytes
compressed size 4 bytes
uncompressed size 4 bytes
filename length 2 bytes
extra field length 2 bytes
file comment length 2 bytes
disk number start 2 bytes
internal file attributes 2 bytes
external file attributes 4 bytes
relative offset of local header 4 bytes
filename (variable size)
extra field (variable size)
file comment (variable size)
*/
/* End of central dir record:
end of central dir signature 4 bytes (0x06054b50)
number of this disk 2 bytes
number of the disk with the
start of the central directory 2 bytes
total number of entries in
the central dir on this disk 2 bytes
total number of entries in
the central dir 2 bytes
size of the central directory 4 bytes
offset of start of central
directory with respect to
the starting disk number 4 bytes
zipfile comment length 2 bytes
zipfile comment (variable size)
*/
/* DOS Date and time:
MS-DOS date. The date is a packed value with the following format. Bits Description
0-4 Day of the month (1-31)
5-8 Month (1 = January, 2 = February, and so on)
9-15 Year offset from 1980 (add 1980 to get actual year)
MS-DOS time. The time is a packed value with the following format. Bits Description
0-4 Second divided by 2
5-10 Minute (0-59)
11-15 Hour (0-23 on a 24-hour clock)
*/
/// <summary>
/// Converts a packed MS-DOS date/time value into a <see cref="DateTime"/>.
/// </summary>
/// <param name="dt">Packed value with the DOS date in the upper 16 bits and the DOS time in the lower 16 bits</param>
/// <returns>
/// The decoded timestamp, or 1980-01-01 00:00:00 when the packed fields do not
/// form a valid date and time (for example an all-zero value, which would mean
/// month 0 and day 0).
/// </returns>
private static DateTime DosTimeToDateTime(uint dt)
{
    int year = (int)(dt >> 25) + 1980;
    int month = (int)(dt >> 21) & 15;
    int day = (int)(dt >> 16) & 31;
    int hour = (int)(dt >> 11) & 31;
    int minute = (int)(dt >> 5) & 63;
    int second = (int)(dt & 31) * 2;

    // The bit fields are wider than the valid ranges, so check them before
    // handing them to the DateTime constructor, which throws on bad values.
    // DaysInMonth is only evaluated once the month is known to be valid.
    bool valid = month >= 1 && month <= 12
        && day >= 1 && day <= DateTime.DaysInMonth(year, month)
        && hour <= 23
        && minute <= 59
        && second <= 59;

    if (!valid)
    {
        return new DateTime(1980, 1, 1);
    }

    return new DateTime(year, month, day, hour, minute, second);
}
/// <summary>
/// Reads the end-of-central-directory record and loads the central directory into memory
/// </summary>
/// <returns>
/// True when the record was found and the central directory image was loaded;
/// false when the stream is too short, no matching record is found, or any
/// error occurs while searching.
/// </returns>
private bool ReadFileInfo()
{
    // 22 bytes is the size of an end-of-central-directory record without comment
    if (ZipFileStream.Length < 22)
    {
        return false;
    }

    try
    {
        // Search backwards for the record signature, one byte per iteration:
        // each pass steps back 5 bytes and then reads 4.
        ZipFileStream.Seek(-17, SeekOrigin.End);
        var br = new BinaryReader(this.ZipFileStream);
        do
        {
            ZipFileStream.Seek(-5, SeekOrigin.Current);
            var sig = br.ReadUInt32();
            if (sig == 0x06054b50)
            {
                // Skip the two disk numbers and the per-disk entry count,
                // then read past the total entry count, which is not needed.
                ZipFileStream.Seek(6, SeekOrigin.Current);
                br.ReadUInt16();
                var centralSize = br.ReadInt32();
                var centralDirOffset = br.ReadUInt32();
                var commentSize = br.ReadUInt16();

                // check if comment field is the very last data in file
                if (ZipFileStream.Position + commentSize != this.ZipFileStream.Length)
                {
                    return false;
                }

                // Copy entire central directory to a memory buffer. A single Read
                // call may deliver fewer bytes than requested, so keep reading
                // until the buffer is full or the stream ends.
                CentralDirImage = new byte[centralSize];
                ZipFileStream.Seek(centralDirOffset, SeekOrigin.Begin);
                int filled = 0;
                while (filled < centralSize)
                {
                    int read = ZipFileStream.Read(this.CentralDirImage, filled, centralSize - filled);
                    if (read <= 0)
                    {
                        break;
                    }

                    filled += read;
                }

                // Leave the pointer at the beginning of central dir
                ZipFileStream.Seek(centralDirOffset, SeekOrigin.Begin);
                return true;
            }
        } while (ZipFileStream.Position > 0);
    }
    catch
    {
        // Deliberately ignored: any failure while searching (seeking before the
        // start of the stream, reading past its end, a negative directory size)
        // is reported as "no central directory found".
    }

    return false;
}
#endregion Private methods
#region IDisposable Members
/// <summary>
/// Closes the Zip storage and suppresses finalization of this object
/// </summary>
public void Dispose()
{
    Dispose(true);
    GC.SuppressFinalize(this);
}

/// <summary>
/// Closes the Zip storage when called with <paramref name="disposing"/> set to true
/// </summary>
/// <param name="disposing">True when invoked from <see cref="Dispose()"/>; nothing is released otherwise</param>
protected virtual void Dispose(bool disposing)
{
    if (!disposing)
    {
        return;
    }

    Close();
}
#endregion IDisposable Members
}
}