mirror of
https://github.com/ProxymanApp/atlantis.git
synced 2026-05-20 20:20:35 +00:00
779 lines
30 KiB
Swift
Executable File
779 lines
30 KiB
Swift
Executable File
///
|
|
/// DataCompression
|
|
///
|
|
/// A libcompression wrapper as an extension for the `Data` type
|
|
/// (GZIP, ZLIB, LZFSE, LZMA, LZ4, deflate, RFC-1950, RFC-1951, RFC-1952)
|
|
///
|
|
/// Created by Markus Wanke, 2016/12/05
|
|
///
|
|
|
|
|
|
///
|
|
/// Apache License, Version 2.0
|
|
///
|
|
/// Copyright 2016, Markus Wanke
|
|
///
|
|
/// Licensed under the Apache License, Version 2.0 (the "License");
|
|
/// you may not use this file except in compliance with the License.
|
|
/// You may obtain a copy of the License at
|
|
///
|
|
/// http://www.apache.org/licenses/LICENSE-2.0
|
|
///
|
|
/// Unless required by applicable law or agreed to in writing, software
|
|
/// distributed under the License is distributed on an "AS IS" BASIS,
|
|
/// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
/// See the License for the specific language governing permissions and
|
|
/// limitations under the License.
|
|
///
|
|
|
|
|
|
import Foundation
|
|
import Compression
|
|
|
|
#if os(Linux)
|
|
import zlibLinux
|
|
#else
|
|
import zlib
|
|
#endif
|
|
|
|
extension Data
|
|
{
|
|
/// Compresses the data.
|
|
/// - parameter withAlgorithm: Compression algorithm to use. See the `CompressionAlgorithm` type
|
|
/// - returns: compressed data
|
|
func compress(withAlgorithm algo: CompressionAlgorithm) -> Data?
|
|
{
|
|
return self.withUnsafeBytes { (sourcePtr: UnsafePointer<UInt8>) -> Data? in
|
|
let config = (operation: COMPRESSION_STREAM_ENCODE, algorithm: algo.lowLevelType)
|
|
return perform(config, source: sourcePtr, sourceSize: count)
|
|
}
|
|
}
|
|
|
|
/// Decompresses the data.
|
|
/// - parameter withAlgorithm: Compression algorithm to use. See the `CompressionAlgorithm` type
|
|
/// - returns: decompressed data
|
|
func decompress(withAlgorithm algo: CompressionAlgorithm) -> Data?
|
|
{
|
|
return self.withUnsafeBytes { (sourcePtr: UnsafePointer<UInt8>) -> Data? in
|
|
let config = (operation: COMPRESSION_STREAM_DECODE, algorithm: algo.lowLevelType)
|
|
return perform(config, source: sourcePtr, sourceSize: count)
|
|
}
|
|
}
|
|
|
|
/// Please consider the [libcompression documentation](https://developer.apple.com/reference/compression/1665429-data_compression)
|
|
/// for further details. Short info:
|
|
/// zlib : Aka deflate. Fast with a good compression rate. Proved itself over time and is supported everywhere.
|
|
/// lzfse : Apples custom Lempel-Ziv style compression algorithm. Claims to compress as good as zlib but 2 to 3 times faster.
|
|
/// lzma : Horribly slow. Compression as well as decompression. Compresses better than zlib though.
|
|
/// lz4 : Fast, but compression rate is very bad. Apples lz4 implementation often to not compress at all.
|
|
enum CompressionAlgorithm
|
|
{
|
|
case zlib
|
|
case lzfse
|
|
case lzma
|
|
case lz4
|
|
}
|
|
|
|
/// Compresses the data using the zlib deflate algorithm.
|
|
/// - returns: raw deflated data according to [RFC-1951](https://tools.ietf.org/html/rfc1951).
|
|
/// - note: Fixed at compression level 5 (best trade off between speed and time)
|
|
func deflate() -> Data?
|
|
{
|
|
return self.withUnsafeBytes { (sourcePtr: UnsafePointer<UInt8>) -> Data? in
|
|
let config = (operation: COMPRESSION_STREAM_ENCODE, algorithm: COMPRESSION_ZLIB)
|
|
return perform(config, source: sourcePtr, sourceSize: count)
|
|
}
|
|
}
|
|
|
|
/// Decompresses the data using the zlib deflate algorithm. Self is expected to be a raw deflate
|
|
/// stream according to [RFC-1951](https://tools.ietf.org/html/rfc1951).
|
|
/// - returns: uncompressed data
|
|
func inflate() -> Data?
|
|
{
|
|
return self.withUnsafeBytes { (sourcePtr: UnsafePointer<UInt8>) -> Data? in
|
|
let config = (operation: COMPRESSION_STREAM_DECODE, algorithm: COMPRESSION_ZLIB)
|
|
return perform(config, source: sourcePtr, sourceSize: count)
|
|
}
|
|
}
|
|
|
|
/// Compresses the data using the deflate algorithm and makes it comply to the zlib format.
|
|
/// - returns: deflated data in zlib format [RFC-1950](https://tools.ietf.org/html/rfc1950)
|
|
/// - note: Fixed at compression level 5 (best trade off between speed and time)
|
|
func zip() -> Data?
|
|
{
|
|
let header = Data([0x78, 0x5e])
|
|
|
|
let deflated = self.withUnsafeBytes { (sourcePtr: UnsafePointer<UInt8>) -> Data? in
|
|
let config = (operation: COMPRESSION_STREAM_ENCODE, algorithm: COMPRESSION_ZLIB)
|
|
return perform(config, source: sourcePtr, sourceSize: count, preload: header)
|
|
}
|
|
|
|
guard var result = deflated else { return nil }
|
|
|
|
var adler = self.adler32().checksum.bigEndian
|
|
result.append(Data(bytes: &adler, count: MemoryLayout<UInt32>.size))
|
|
|
|
return result
|
|
}
|
|
|
|
/// Decompresses the data using the zlib deflate algorithm. Self is expected to be a zlib deflate
|
|
/// stream according to [RFC-1950](https://tools.ietf.org/html/rfc1950).
|
|
/// - returns: uncompressed data
|
|
func unzip(skipCheckSumValidation: Bool = true) -> Data?
|
|
{
|
|
// 2 byte header + 4 byte adler32 checksum
|
|
let overhead = 6
|
|
guard count > overhead else { return nil }
|
|
|
|
let header: UInt16 = withUnsafeBytes { (ptr: UnsafePointer<UInt16>) -> UInt16 in
|
|
return ptr.pointee.bigEndian
|
|
}
|
|
|
|
// check for the deflate stream bit
|
|
guard header >> 8 & 0b1111 == 0b1000 else { return nil }
|
|
// check the header checksum
|
|
guard header % 31 == 0 else { return nil }
|
|
|
|
let cresult: Data? = withUnsafeBytes { (ptr: UnsafePointer<UInt8>) -> Data? in
|
|
let source = ptr.advanced(by: 2)
|
|
let config = (operation: COMPRESSION_STREAM_DECODE, algorithm: COMPRESSION_ZLIB)
|
|
return perform(config, source: source, sourceSize: count - overhead)
|
|
}
|
|
|
|
guard let inflated = cresult else { return nil }
|
|
|
|
if skipCheckSumValidation { return inflated }
|
|
|
|
let cksum: UInt32 = withUnsafeBytes { (bytePtr: UnsafePointer<UInt8>) -> UInt32 in
|
|
let last = bytePtr.advanced(by: count - 4)
|
|
return last.withMemoryRebound(to: UInt32.self, capacity: 1) { (intPtr) -> UInt32 in
|
|
return intPtr.pointee.bigEndian
|
|
}
|
|
}
|
|
|
|
return cksum == inflated.adler32().checksum ? inflated : nil
|
|
}
|
|
|
|
/// Compresses the data using the deflate algorithm and makes it comply to the gzip stream format.
|
|
/// - returns: deflated data in gzip format [RFC-1952](https://tools.ietf.org/html/rfc1952)
|
|
/// - note: Fixed at compression level 5 (best trade off between speed and time)
|
|
func gzip() -> Data?
|
|
{
|
|
var header = Data([0x1f, 0x8b, 0x08, 0x00]) // magic, magic, deflate, noflags
|
|
|
|
var unixtime = UInt32(Date().timeIntervalSince1970).littleEndian
|
|
header.append(Data(bytes: &unixtime, count: MemoryLayout<UInt32>.size))
|
|
|
|
header.append(contentsOf: [0x00, 0x03]) // normal compression level, unix file type
|
|
|
|
let deflated = self.withUnsafeBytes { (sourcePtr: UnsafePointer<UInt8>) -> Data? in
|
|
let config = (operation: COMPRESSION_STREAM_ENCODE, algorithm: COMPRESSION_ZLIB)
|
|
return perform(config, source: sourcePtr, sourceSize: count, preload: header)
|
|
}
|
|
|
|
guard var result = deflated else { return nil }
|
|
|
|
// append checksum
|
|
var crc32: UInt32 = self.crc32().checksum.littleEndian
|
|
result.append(Data(bytes: &crc32, count: MemoryLayout<UInt32>.size))
|
|
|
|
// append size of original data
|
|
var isize: UInt32 = UInt32(truncatingIfNeeded: count).littleEndian
|
|
result.append(Data(bytes: &isize, count: MemoryLayout<UInt32>.size))
|
|
|
|
return result
|
|
}
|
|
|
|
/// Decompresses the data using the gzip deflate algorithm. Self is expected to be a gzip deflate
|
|
/// stream according to [RFC-1952](https://tools.ietf.org/html/rfc1952).
|
|
/// - returns: uncompressed data
|
|
func gunzip() -> Data?
|
|
{
|
|
// 10 byte header + data + 8 byte footer. See https://tools.ietf.org/html/rfc1952#section-2
|
|
let overhead = 10 + 8
|
|
guard count >= overhead else { return nil }
|
|
|
|
|
|
typealias GZipHeader = (id1: UInt8, id2: UInt8, cm: UInt8, flg: UInt8, xfl: UInt8, os: UInt8)
|
|
let hdr: GZipHeader = withUnsafeBytes { (ptr: UnsafePointer<UInt8>) -> GZipHeader in
|
|
// +---+---+---+---+---+---+---+---+---+---+
|
|
// |ID1|ID2|CM |FLG| MTIME |XFL|OS |
|
|
// +---+---+---+---+---+---+---+---+---+---+
|
|
return (id1: ptr[0], id2: ptr[1], cm: ptr[2], flg: ptr[3], xfl: ptr[8], os: ptr[9])
|
|
}
|
|
|
|
typealias GZipFooter = (crc32: UInt32, isize: UInt32)
|
|
let ftr: GZipFooter = withUnsafeBytes { (bptr: UnsafePointer<UInt8>) -> GZipFooter in
|
|
// +---+---+---+---+---+---+---+---+
|
|
// | CRC32 | ISIZE |
|
|
// +---+---+---+---+---+---+---+---+
|
|
return bptr.advanced(by: count - 8).withMemoryRebound(to: UInt32.self, capacity: 2) { ptr in
|
|
return (ptr[0].littleEndian, ptr[1].littleEndian)
|
|
}
|
|
}
|
|
|
|
// Wrong gzip magic or unsupported compression method
|
|
guard hdr.id1 == 0x1f && hdr.id2 == 0x8b && hdr.cm == 0x08 else { return nil }
|
|
|
|
let has_crc16: Bool = hdr.flg & 0b00010 != 0
|
|
let has_extra: Bool = hdr.flg & 0b00100 != 0
|
|
let has_fname: Bool = hdr.flg & 0b01000 != 0
|
|
let has_cmmnt: Bool = hdr.flg & 0b10000 != 0
|
|
|
|
let cresult: Data? = withUnsafeBytes { (ptr: UnsafePointer<UInt8>) -> Data? in
|
|
var pos = 10 ; let limit = count - 8
|
|
|
|
if has_extra {
|
|
pos += ptr.advanced(by: pos).withMemoryRebound(to: UInt16.self, capacity: 1) {
|
|
return Int($0.pointee.littleEndian) + 2 // +2 for xlen
|
|
}
|
|
}
|
|
if has_fname {
|
|
while pos < limit && ptr[pos] != 0x0 { pos += 1 }
|
|
pos += 1 // skip null byte as well
|
|
}
|
|
if has_cmmnt {
|
|
while pos < limit && ptr[pos] != 0x0 { pos += 1 }
|
|
pos += 1 // skip null byte as well
|
|
}
|
|
if has_crc16 {
|
|
pos += 2 // ignoring header crc16
|
|
}
|
|
|
|
guard pos < limit else { return nil }
|
|
let config = (operation: COMPRESSION_STREAM_DECODE, algorithm: COMPRESSION_ZLIB)
|
|
return perform(config, source: ptr.advanced(by: pos), sourceSize: limit - pos)
|
|
}
|
|
|
|
guard let inflated = cresult else { return nil }
|
|
guard ftr.isize == UInt32(truncatingIfNeeded: inflated.count) else { return nil }
|
|
guard ftr.crc32 == inflated.crc32().checksum else { return nil }
|
|
return inflated
|
|
}
|
|
|
|
/// Calculate the Adler32 checksum of the data.
|
|
/// - returns: Adler32 checksum type. Can still be further advanced.
|
|
func adler32() -> Adler32
|
|
{
|
|
var res = Adler32()
|
|
res.advance(withChunk: self)
|
|
return res
|
|
}
|
|
|
|
/// Calculate the Crc32 checksum of the data.
|
|
/// - returns: Crc32 checksum type. Can still be further advanced.
|
|
func crc32() -> Crc32
|
|
{
|
|
var res = Crc32()
|
|
res.advance(withChunk: self)
|
|
return res
|
|
}
|
|
}
|
|
|
|
|
|
|
|
|
|
/// Struct based type representing a Crc32 checksum.
|
|
struct Crc32: CustomStringConvertible
|
|
{
|
|
private static let zLibCrc32: ZLibCrc32FuncPtr? = loadCrc32fromZLib()
|
|
|
|
init() {}
|
|
|
|
// C convention function pointer type matching the signature of `libz::crc32`
|
|
private typealias ZLibCrc32FuncPtr = @convention(c) (
|
|
_ cks: UInt32,
|
|
_ buf: UnsafePointer<UInt8>,
|
|
_ len: UInt32
|
|
) -> UInt32
|
|
|
|
/// Raw checksum. Updated after a every call to `advance(withChunk:)`
|
|
var checksum: UInt32 = 0
|
|
|
|
/// Advance the current checksum with a chunk of data. Designed t be called multiple times.
|
|
/// - parameter chunk: data to advance the checksum
|
|
mutating func advance(withChunk chunk: Data)
|
|
{
|
|
if let fastCrc32 = Crc32.zLibCrc32 {
|
|
checksum = chunk.withUnsafeBytes({ (ptr: UnsafePointer<UInt8>) -> UInt32 in
|
|
return fastCrc32(checksum, ptr, UInt32(chunk.count))
|
|
})
|
|
}
|
|
else {
|
|
checksum = slowCrc32(start: checksum, data: chunk)
|
|
}
|
|
}
|
|
|
|
/// Formatted checksum.
|
|
var description: String
|
|
{
|
|
return String(format: "%08x", checksum)
|
|
}
|
|
|
|
/// Load `crc32()` from '/usr/lib/libz.dylib' if libz is installed.
|
|
/// - returns: A function pointer to crc32() of zlib or nil if zlib can't be found
|
|
private static func loadCrc32fromZLib() -> ZLibCrc32FuncPtr?
|
|
{
|
|
guard let libz = dlopen("/usr/lib/libz.dylib", RTLD_NOW) else { return nil }
|
|
guard let fptr = dlsym(libz, "crc32") else { return nil }
|
|
return unsafeBitCast(fptr, to: ZLibCrc32FuncPtr.self)
|
|
}
|
|
|
|
/// Rudimentary fallback implementation of the crc32 checksum. This is only a backup used
|
|
/// when zlib can't be found under '/usr/lib/libz.dylib'.
|
|
/// - returns: crc32 checksum (4 byte)
|
|
private func slowCrc32(start: UInt32, data: Data) -> UInt32
|
|
{
|
|
return ~data.reduce(~start) { (crc: UInt32, next: UInt8) -> UInt32 in
|
|
let tableOffset = (crc ^ UInt32(next)) & 0xff
|
|
return lookUpTable[Int(tableOffset)] ^ crc >> 8
|
|
}
|
|
}
|
|
|
|
/// Lookup table for faster crc32 calculation.
|
|
/// table source: http://web.mit.edu/freebsd/head/sys/libkern/crc32.c
|
|
private let lookUpTable: [UInt32] = [
|
|
0x00000000, 0x77073096, 0xee0e612c, 0x990951ba, 0x076dc419, 0x706af48f, 0xe963a535, 0x9e6495a3,
|
|
0x0edb8832, 0x79dcb8a4, 0xe0d5e91e, 0x97d2d988, 0x09b64c2b, 0x7eb17cbd, 0xe7b82d07, 0x90bf1d91,
|
|
0x1db71064, 0x6ab020f2, 0xf3b97148, 0x84be41de, 0x1adad47d, 0x6ddde4eb, 0xf4d4b551, 0x83d385c7,
|
|
0x136c9856, 0x646ba8c0, 0xfd62f97a, 0x8a65c9ec, 0x14015c4f, 0x63066cd9, 0xfa0f3d63, 0x8d080df5,
|
|
0x3b6e20c8, 0x4c69105e, 0xd56041e4, 0xa2677172, 0x3c03e4d1, 0x4b04d447, 0xd20d85fd, 0xa50ab56b,
|
|
0x35b5a8fa, 0x42b2986c, 0xdbbbc9d6, 0xacbcf940, 0x32d86ce3, 0x45df5c75, 0xdcd60dcf, 0xabd13d59,
|
|
0x26d930ac, 0x51de003a, 0xc8d75180, 0xbfd06116, 0x21b4f4b5, 0x56b3c423, 0xcfba9599, 0xb8bda50f,
|
|
0x2802b89e, 0x5f058808, 0xc60cd9b2, 0xb10be924, 0x2f6f7c87, 0x58684c11, 0xc1611dab, 0xb6662d3d,
|
|
0x76dc4190, 0x01db7106, 0x98d220bc, 0xefd5102a, 0x71b18589, 0x06b6b51f, 0x9fbfe4a5, 0xe8b8d433,
|
|
0x7807c9a2, 0x0f00f934, 0x9609a88e, 0xe10e9818, 0x7f6a0dbb, 0x086d3d2d, 0x91646c97, 0xe6635c01,
|
|
0x6b6b51f4, 0x1c6c6162, 0x856530d8, 0xf262004e, 0x6c0695ed, 0x1b01a57b, 0x8208f4c1, 0xf50fc457,
|
|
0x65b0d9c6, 0x12b7e950, 0x8bbeb8ea, 0xfcb9887c, 0x62dd1ddf, 0x15da2d49, 0x8cd37cf3, 0xfbd44c65,
|
|
0x4db26158, 0x3ab551ce, 0xa3bc0074, 0xd4bb30e2, 0x4adfa541, 0x3dd895d7, 0xa4d1c46d, 0xd3d6f4fb,
|
|
0x4369e96a, 0x346ed9fc, 0xad678846, 0xda60b8d0, 0x44042d73, 0x33031de5, 0xaa0a4c5f, 0xdd0d7cc9,
|
|
0x5005713c, 0x270241aa, 0xbe0b1010, 0xc90c2086, 0x5768b525, 0x206f85b3, 0xb966d409, 0xce61e49f,
|
|
0x5edef90e, 0x29d9c998, 0xb0d09822, 0xc7d7a8b4, 0x59b33d17, 0x2eb40d81, 0xb7bd5c3b, 0xc0ba6cad,
|
|
0xedb88320, 0x9abfb3b6, 0x03b6e20c, 0x74b1d29a, 0xead54739, 0x9dd277af, 0x04db2615, 0x73dc1683,
|
|
0xe3630b12, 0x94643b84, 0x0d6d6a3e, 0x7a6a5aa8, 0xe40ecf0b, 0x9309ff9d, 0x0a00ae27, 0x7d079eb1,
|
|
0xf00f9344, 0x8708a3d2, 0x1e01f268, 0x6906c2fe, 0xf762575d, 0x806567cb, 0x196c3671, 0x6e6b06e7,
|
|
0xfed41b76, 0x89d32be0, 0x10da7a5a, 0x67dd4acc, 0xf9b9df6f, 0x8ebeeff9, 0x17b7be43, 0x60b08ed5,
|
|
0xd6d6a3e8, 0xa1d1937e, 0x38d8c2c4, 0x4fdff252, 0xd1bb67f1, 0xa6bc5767, 0x3fb506dd, 0x48b2364b,
|
|
0xd80d2bda, 0xaf0a1b4c, 0x36034af6, 0x41047a60, 0xdf60efc3, 0xa867df55, 0x316e8eef, 0x4669be79,
|
|
0xcb61b38c, 0xbc66831a, 0x256fd2a0, 0x5268e236, 0xcc0c7795, 0xbb0b4703, 0x220216b9, 0x5505262f,
|
|
0xc5ba3bbe, 0xb2bd0b28, 0x2bb45a92, 0x5cb36a04, 0xc2d7ffa7, 0xb5d0cf31, 0x2cd99e8b, 0x5bdeae1d,
|
|
0x9b64c2b0, 0xec63f226, 0x756aa39c, 0x026d930a, 0x9c0906a9, 0xeb0e363f, 0x72076785, 0x05005713,
|
|
0x95bf4a82, 0xe2b87a14, 0x7bb12bae, 0x0cb61b38, 0x92d28e9b, 0xe5d5be0d, 0x7cdcefb7, 0x0bdbdf21,
|
|
0x86d3d2d4, 0xf1d4e242, 0x68ddb3f8, 0x1fda836e, 0x81be16cd, 0xf6b9265b, 0x6fb077e1, 0x18b74777,
|
|
0x88085ae6, 0xff0f6a70, 0x66063bca, 0x11010b5c, 0x8f659eff, 0xf862ae69, 0x616bffd3, 0x166ccf45,
|
|
0xa00ae278, 0xd70dd2ee, 0x4e048354, 0x3903b3c2, 0xa7672661, 0xd06016f7, 0x4969474d, 0x3e6e77db,
|
|
0xaed16a4a, 0xd9d65adc, 0x40df0b66, 0x37d83bf0, 0xa9bcae53, 0xdebb9ec5, 0x47b2cf7f, 0x30b5ffe9,
|
|
0xbdbdf21c, 0xcabac28a, 0x53b39330, 0x24b4a3a6, 0xbad03605, 0xcdd70693, 0x54de5729, 0x23d967bf,
|
|
0xb3667a2e, 0xc4614ab8, 0x5d681b02, 0x2a6f2b94, 0xb40bbe37, 0xc30c8ea1, 0x5a05df1b, 0x2d02ef8d,
|
|
]
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
/// Struct based type representing a Adler32 checksum.
|
|
struct Adler32: CustomStringConvertible
|
|
{
|
|
private static let zLibAdler32: ZLibAdler32FuncPtr? = loadAdler32fromZLib()
|
|
|
|
init() {}
|
|
|
|
// C convention function pointer type matching the signature of `libz::adler32`
|
|
private typealias ZLibAdler32FuncPtr = @convention(c) (
|
|
_ cks: UInt32,
|
|
_ buf: UnsafePointer<UInt8>,
|
|
_ len: UInt32
|
|
) -> UInt32
|
|
|
|
/// Raw checksum. Updated after a every call to `advance(withChunk:)`
|
|
var checksum: UInt32 = 1
|
|
|
|
/// Advance the current checksum with a chunk of data. Designed t be called multiple times.
|
|
/// - parameter chunk: data to advance the checksum
|
|
mutating func advance(withChunk chunk: Data)
|
|
{
|
|
if let fastAdler32 = Adler32.zLibAdler32 {
|
|
checksum = chunk.withUnsafeBytes({ (ptr: UnsafePointer<UInt8>) -> UInt32 in
|
|
return fastAdler32(checksum, ptr, UInt32(chunk.count))
|
|
})
|
|
}
|
|
else {
|
|
checksum = slowAdler32(start: checksum, data: chunk)
|
|
}
|
|
}
|
|
|
|
/// Formatted checksum.
|
|
var description: String
|
|
{
|
|
return String(format: "%08x", checksum)
|
|
}
|
|
|
|
/// Load `adler32()` from '/usr/lib/libz.dylib' if libz is installed.
|
|
/// - returns: A function pointer to adler32() of zlib or nil if zlib can't be found
|
|
private static func loadAdler32fromZLib() -> ZLibAdler32FuncPtr?
|
|
{
|
|
guard let libz = dlopen("/usr/lib/libz.dylib", RTLD_NOW) else { return nil }
|
|
guard let fptr = dlsym(libz, "adler32") else { return nil }
|
|
return unsafeBitCast(fptr, to: ZLibAdler32FuncPtr.self)
|
|
}
|
|
|
|
/// Rudimentary fallback implementation of the adler32 checksum. This is only a backup used
|
|
/// when zlib can't be found under '/usr/lib/libz.dylib'.
|
|
/// - returns: adler32 checksum (4 byte)
|
|
private func slowAdler32(start: UInt32, data: Data) -> UInt32
|
|
{
|
|
var s1: UInt32 = start & 0xffff
|
|
var s2: UInt32 = (start >> 16) & 0xffff
|
|
let prime: UInt32 = 65521
|
|
|
|
for byte in data {
|
|
s1 += UInt32(byte)
|
|
if s1 >= prime { s1 = s1 % prime }
|
|
s2 += s1
|
|
if s2 >= prime { s2 = s2 % prime }
|
|
}
|
|
return (s2 << 16) | s1
|
|
}
|
|
}
|
|
|
|
|
|
|
|
fileprivate extension Data
|
|
{
|
|
func withUnsafeBytes<ResultType, ContentType>(_ body: (UnsafePointer<ContentType>) throws -> ResultType) rethrows -> ResultType
|
|
{
|
|
return try self.withUnsafeBytes({ (rawBufferPointer: UnsafeRawBufferPointer) -> ResultType in
|
|
return try body(rawBufferPointer.bindMemory(to: ContentType.self).baseAddress!)
|
|
})
|
|
}
|
|
}
|
|
|
|
fileprivate extension Data.CompressionAlgorithm
|
|
{
|
|
var lowLevelType: compression_algorithm {
|
|
switch self {
|
|
case .zlib : return COMPRESSION_ZLIB
|
|
case .lzfse : return COMPRESSION_LZFSE
|
|
case .lz4 : return COMPRESSION_LZ4
|
|
case .lzma : return COMPRESSION_LZMA
|
|
}
|
|
}
|
|
}
|
|
|
|
|
|
fileprivate typealias Config = (operation: compression_stream_operation, algorithm: compression_algorithm)
|
|
|
|
|
|
fileprivate func perform(_ config: Config, source: UnsafePointer<UInt8>, sourceSize: Int, preload: Data = Data()) -> Data?
|
|
{
|
|
guard config.operation == COMPRESSION_STREAM_ENCODE || sourceSize > 0 else { return nil }
|
|
|
|
let streamBase = UnsafeMutablePointer<compression_stream>.allocate(capacity: 1)
|
|
defer { streamBase.deallocate() }
|
|
var stream = streamBase.pointee
|
|
|
|
let status = compression_stream_init(&stream, config.operation, config.algorithm)
|
|
guard status != COMPRESSION_STATUS_ERROR else { return nil }
|
|
defer { compression_stream_destroy(&stream) }
|
|
|
|
var result = preload
|
|
var flags: Int32 = Int32(COMPRESSION_STREAM_FINALIZE.rawValue)
|
|
let blockLimit = 64 * 1024
|
|
var bufferSize = Swift.max(sourceSize, 64)
|
|
|
|
if sourceSize > blockLimit {
|
|
bufferSize = blockLimit
|
|
if config.algorithm == COMPRESSION_LZFSE && config.operation != COMPRESSION_STREAM_ENCODE {
|
|
// This fixes a bug in Apples lzfse decompressor. it will sometimes fail randomly when the input gets
|
|
// splitted into multiple chunks and the flag is not 0. Even though it should always work with FINALIZE...
|
|
flags = 0
|
|
}
|
|
}
|
|
|
|
let buffer = UnsafeMutablePointer<UInt8>.allocate(capacity: bufferSize)
|
|
defer { buffer.deallocate() }
|
|
|
|
stream.dst_ptr = buffer
|
|
stream.dst_size = bufferSize
|
|
stream.src_ptr = source
|
|
stream.src_size = sourceSize
|
|
|
|
while true {
|
|
switch compression_stream_process(&stream, flags) {
|
|
case COMPRESSION_STATUS_OK:
|
|
guard stream.dst_size == 0 else { return nil }
|
|
result.append(buffer, count: stream.dst_ptr - buffer)
|
|
stream.dst_ptr = buffer
|
|
stream.dst_size = bufferSize
|
|
|
|
if flags == 0 && stream.src_size == 0 { // part of the lzfse bugfix above
|
|
flags = Int32(COMPRESSION_STREAM_FINALIZE.rawValue)
|
|
}
|
|
|
|
case COMPRESSION_STATUS_END:
|
|
result.append(buffer, count: stream.dst_ptr - buffer)
|
|
return result
|
|
|
|
default:
|
|
return nil
|
|
}
|
|
}
|
|
}
|
|
|
|
|
|
/// Compression level whose rawValue is based on the zlib's constants.
|
|
struct CompressionLevel: RawRepresentable {
|
|
|
|
/// Compression level in the range of `0` (no compression) to `9` (maximum compression).
|
|
let rawValue: Int32
|
|
|
|
static let noCompression = CompressionLevel(Z_NO_COMPRESSION)
|
|
static let bestSpeed = CompressionLevel(Z_BEST_SPEED)
|
|
static let bestCompression = CompressionLevel(Z_BEST_COMPRESSION)
|
|
|
|
static let defaultCompression = CompressionLevel(Z_DEFAULT_COMPRESSION)
|
|
|
|
|
|
init(rawValue: Int32) {
|
|
|
|
self.rawValue = rawValue
|
|
}
|
|
|
|
|
|
init(_ rawValue: Int32) {
|
|
|
|
self.rawValue = rawValue
|
|
}
|
|
}
|
|
|
|
/// Errors on gzipping/gunzipping based on the zlib error codes.
|
|
struct GzipError: Swift.Error {
|
|
// cf. http://www.zlib.net/manual.html
|
|
|
|
enum Kind: Equatable {
|
|
/// The stream structure was inconsistent.
|
|
///
|
|
/// - underlying zlib error: `Z_STREAM_ERROR` (-2)
|
|
case stream
|
|
|
|
/// The input data was corrupted
|
|
/// (input stream not conforming to the zlib format or incorrect check value).
|
|
///
|
|
/// - underlying zlib error: `Z_DATA_ERROR` (-3)
|
|
case data
|
|
|
|
/// There was not enough memory.
|
|
///
|
|
/// - underlying zlib error: `Z_MEM_ERROR` (-4)
|
|
case memory
|
|
|
|
/// No progress is possible or there was not enough room in the output buffer.
|
|
///
|
|
/// - underlying zlib error: `Z_BUF_ERROR` (-5)
|
|
case buffer
|
|
|
|
/// The zlib library version is incompatible with the version assumed by the caller.
|
|
///
|
|
/// - underlying zlib error: `Z_VERSION_ERROR` (-6)
|
|
case version
|
|
|
|
/// An unknown error occurred.
|
|
///
|
|
/// - parameter code: return error by zlib
|
|
case unknown(code: Int)
|
|
}
|
|
|
|
/// Error kind.
|
|
let kind: Kind
|
|
|
|
/// Returned message by zlib.
|
|
let message: String
|
|
|
|
|
|
internal init(code: Int32, msg: UnsafePointer<CChar>?) {
|
|
|
|
self.message = {
|
|
guard let msg = msg, let message = String(validatingUTF8: msg) else {
|
|
return "Unknown gzip error"
|
|
}
|
|
return message
|
|
}()
|
|
|
|
self.kind = {
|
|
switch code {
|
|
case Z_STREAM_ERROR:
|
|
return .stream
|
|
case Z_DATA_ERROR:
|
|
return .data
|
|
case Z_MEM_ERROR:
|
|
return .memory
|
|
case Z_BUF_ERROR:
|
|
return .buffer
|
|
case Z_VERSION_ERROR:
|
|
return .version
|
|
default:
|
|
return .unknown(code: Int(code))
|
|
}
|
|
}()
|
|
}
|
|
|
|
|
|
var localizedDescription: String {
|
|
|
|
return self.message
|
|
}
|
|
|
|
}
|
|
|
|
|
|
extension Data {
|
|
|
|
/// Whether the receiver is compressed in gzip format.
|
|
var isGzipped: Bool {
|
|
|
|
return self.starts(with: [0x1f, 0x8b]) // check magic number
|
|
}
|
|
|
|
|
|
/// Create a new `Data` object by compressing the receiver using zlib.
|
|
/// Throws an error if compression failed.
|
|
///
|
|
/// - Parameter level: Compression level.
|
|
/// - Returns: Gzip-compressed `Data` object.
|
|
/// - Throws: `GzipError`
|
|
func gzipped(level: CompressionLevel = .defaultCompression) throws -> Data {
|
|
|
|
guard !self.isEmpty else {
|
|
return Data()
|
|
}
|
|
|
|
var stream = z_stream()
|
|
var status: Int32
|
|
|
|
status = deflateInit2_(&stream, level.rawValue, Z_DEFLATED, MAX_WBITS + 16, MAX_MEM_LEVEL, Z_DEFAULT_STRATEGY, ZLIB_VERSION, Int32(DataSize.stream))
|
|
|
|
guard status == Z_OK else {
|
|
// deflateInit2 returns:
|
|
// Z_VERSION_ERROR The zlib library version is incompatible with the version assumed by the caller.
|
|
// Z_MEM_ERROR There was not enough memory.
|
|
// Z_STREAM_ERROR A parameter is invalid.
|
|
|
|
throw GzipError(code: status, msg: stream.msg)
|
|
}
|
|
|
|
var data = Data(capacity: DataSize.chunk)
|
|
repeat {
|
|
if Int(stream.total_out) >= data.count {
|
|
data.count += DataSize.chunk
|
|
}
|
|
|
|
let inputCount = self.count
|
|
let outputCount = data.count
|
|
|
|
self.withUnsafeBytes { (inputPointer: UnsafeRawBufferPointer) in
|
|
stream.next_in = UnsafeMutablePointer<Bytef>(mutating: inputPointer.bindMemory(to: Bytef.self).baseAddress!).advanced(by: Int(stream.total_in))
|
|
stream.avail_in = uint(inputCount) - uInt(stream.total_in)
|
|
|
|
data.withUnsafeMutableBytes { (outputPointer: UnsafeMutableRawBufferPointer) in
|
|
stream.next_out = outputPointer.bindMemory(to: Bytef.self).baseAddress!.advanced(by: Int(stream.total_out))
|
|
stream.avail_out = uInt(outputCount) - uInt(stream.total_out)
|
|
|
|
status = zlib.deflate(&stream, Z_FINISH)
|
|
|
|
stream.next_out = nil
|
|
}
|
|
|
|
stream.next_in = nil
|
|
}
|
|
|
|
} while stream.avail_out == 0
|
|
|
|
guard deflateEnd(&stream) == Z_OK, status == Z_STREAM_END else {
|
|
throw GzipError(code: status, msg: stream.msg)
|
|
}
|
|
|
|
data.count = Int(stream.total_out)
|
|
|
|
return data
|
|
}
|
|
|
|
|
|
/// Create a new `Data` object by decompressing the receiver using zlib.
|
|
/// Throws an error if decompression failed.
|
|
///
|
|
/// - Returns: Gzip-decompressed `Data` object.
|
|
/// - Throws: `GzipError`
|
|
func gunzipped() throws -> Data {
|
|
|
|
guard !self.isEmpty else {
|
|
return Data()
|
|
}
|
|
|
|
var stream = z_stream()
|
|
var status: Int32
|
|
|
|
status = inflateInit2_(&stream, MAX_WBITS + 32, ZLIB_VERSION, Int32(DataSize.stream))
|
|
|
|
guard status == Z_OK else {
|
|
// inflateInit2 returns:
|
|
// Z_VERSION_ERROR The zlib library version is incompatible with the version assumed by the caller.
|
|
// Z_MEM_ERROR There was not enough memory.
|
|
// Z_STREAM_ERROR A parameters are invalid.
|
|
|
|
throw GzipError(code: status, msg: stream.msg)
|
|
}
|
|
|
|
var data = Data(capacity: self.count * 2)
|
|
repeat {
|
|
if Int(stream.total_out) >= data.count {
|
|
data.count += self.count / 2
|
|
}
|
|
|
|
let inputCount = self.count
|
|
let outputCount = data.count
|
|
|
|
self.withUnsafeBytes { (inputPointer: UnsafeRawBufferPointer) in
|
|
stream.next_in = UnsafeMutablePointer<Bytef>(mutating: inputPointer.bindMemory(to: Bytef.self).baseAddress!).advanced(by: Int(stream.total_in))
|
|
stream.avail_in = uint(inputCount) - uInt(stream.total_in)
|
|
|
|
data.withUnsafeMutableBytes { (outputPointer: UnsafeMutableRawBufferPointer) in
|
|
stream.next_out = outputPointer.bindMemory(to: Bytef.self).baseAddress!.advanced(by: Int(stream.total_out))
|
|
stream.avail_out = uInt(outputCount) - uInt(stream.total_out)
|
|
|
|
status = zlib.inflate(&stream, Z_SYNC_FLUSH)
|
|
|
|
stream.next_out = nil
|
|
}
|
|
|
|
stream.next_in = nil
|
|
}
|
|
|
|
} while status == Z_OK
|
|
|
|
guard inflateEnd(&stream) == Z_OK, status == Z_STREAM_END else {
|
|
// inflate returns:
|
|
// Z_DATA_ERROR The input data was corrupted (input stream not conforming to the zlib format or incorrect check value).
|
|
// Z_STREAM_ERROR The stream structure was inconsistent (for example if next_in or next_out was NULL).
|
|
// Z_MEM_ERROR There was not enough memory.
|
|
// Z_BUF_ERROR No progress is possible or there was not enough room in the output buffer when Z_FINISH is used.
|
|
|
|
throw GzipError(code: status, msg: stream.msg)
|
|
}
|
|
|
|
data.count = Int(stream.total_out)
|
|
|
|
return data
|
|
}
|
|
|
|
}
|
|
|
|
|
|
private struct DataSize {
|
|
|
|
static let chunk = 2 ^ 14
|
|
static let stream = MemoryLayout<z_stream>.size
|
|
|
|
private init() { }
|
|
}
|