module deflate // vfmt off // RFC 1951 length/distance decode tables const length_bases = [3, 4, 5, 6, 7, 8, 9, 10, 11, 13, 15, 17, 19, 23, 27, 31, 35, 43, 51, 59, 67, 83, 99, 115, 131, 163, 195, 227, 258] const length_extra_bits = [0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 2, 2, 2, 2, 3, 3, 3, 3, 4, 4, 4, 4, 5, 5, 5, 5, 0] const dist_bases = [1, 2, 3, 4, 5, 7, 9, 13, 17, 25, 33, 49, 65, 97, 129, 193, 257, 385, 513, 769, 1025, 1537, 2049, 3073, 4097, 6145, 8193, 12289, 16385, 24577] const dist_extra_bits = [0, 0, 0, 0, 1, 1, 2, 2, 3, 3, 4, 4, 5, 5, 6, 6, 7, 7, 8, 8, 9, 9, 10, 10, 11, 11, 12, 12, 13, 13] // code-length alphabet order (RFC 1951) const cl_order = [16, 17, 18, 0, 8, 7, 9, 6, 10, 5, 11, 4, 12, 3, 13, 2, 14, 1, 15] // vmt on // fixed_litlen_lengths returns code lengths for the fixed Huffman lit/len tree (RFC 1951 ยง3.2.6). fn fixed_litlen_lengths() []int { mut lens := []int{len: 288} for i in 0 .. 144 { lens[i] = 8 } for i in 144 .. 256 { lens[i] = 9 } for i in 256 .. 280 { lens[i] = 7 } for i in 280 .. 288 { lens[i] = 8 } return lens } // HuffTree is a MSB-first Huffman lookup table for DEFLATE decoding. // Indexed by the next max_bits bits read LSB-first from the stream. struct HuffTree { table []u32 // entry: (symbol << 5) | code_length; 0xFFFF_FFFF = invalid max_bits int } fn build_huff_tree(lengths []int) HuffTree { mut max_bits := 0 for l in lengths { if l > max_bits { max_bits = l } } if max_bits == 0 { return HuffTree{ table: [u32(0)] max_bits: 0 } } mut bl_count := []int{len: max_bits + 1} for l in lengths { if l > 0 { bl_count[l]++ } } mut next_code := []u32{len: max_bits + 1} mut c := u32(0) for bits in 1 .. max_bits + 1 { c = (c + u32(bl_count[bits - 1])) << 1 next_code[bits] = c } table_size := 1 << max_bits mut table := []u32{len: table_size, init: 0xffff_ffff} for sym in 0 .. lengths.len { l := lengths[sym] if l == 0 { continue } code := next_code[l] next_code[l]++ // Reverse code for LSB-first bit reader rev := bit_reverse(code, l) step := 1 << l mut idx := int(rev) for idx < table_size { table[idx] = (u32(sym) << 5) | u32(l) idx += step } } return HuffTree{ table: table max_bits: max_bits } } struct BitReader { buf []u8 mut: pos int bits u32 nbits int } @[direct_array_access; inline] fn (mut r BitReader) read_bits(n int) !u32 { for r.nbits < n { if r.pos >= r.buf.len { return error('inflate: unexpected end of stream') } r.bits |= u32(r.buf[r.pos]) << r.nbits r.pos++ r.nbits += 8 } val := r.bits & ((u32(1) << n) - 1) r.bits >>= u32(n) r.nbits -= n return val } @[inline] fn (mut r BitReader) align_byte() { r.bits = 0 r.nbits = 0 } @[direct_array_access; inline] fn (mut r BitReader) read_byte_raw() !u8 { if r.pos >= r.buf.len { return error('inflate: unexpected end of stream') } b := r.buf[r.pos] r.pos++ return b } @[direct_array_access; inline] fn (mut r BitReader) huff_decode(t HuffTree) !u32 { for r.nbits < t.max_bits { if r.pos >= r.buf.len { break } r.bits |= u32(r.buf[r.pos]) << r.nbits r.pos++ r.nbits += 8 } idx := int(r.bits & ((u32(1) << t.max_bits) - 1)) entry := t.table[idx] if entry == 0xffff_ffff { return error('inflate: invalid Huffman code') } len_ := int(entry & 0x1f) sym := entry >> 5 r.bits >>= u32(len_) r.nbits -= len_ return sym } // inflate decompresses raw RFC 1951 DEFLATE data. fn inflate(data []u8) ![]u8 { mut r := BitReader{ buf: data } mut out := []u8{} fixed_ll := build_huff_tree(fixed_litlen_lengths()) fixed_d := build_huff_tree([]int{len: 32, init: 5}) for { bfinal := r.read_bits(1)! btype := r.read_bits(2)! match btype { 0 { r.align_byte() len_ := int(r.read_byte_raw()!) | (int(u32(r.read_byte_raw()!) << 8)) nlen := int(r.read_byte_raw()!) | (int(u32(r.read_byte_raw()!) << 8)) if len_ & 0xffff != (~nlen) & 0xffff { return error('inflate: bad stored block length') } for _ in 0 .. len_ { out << r.read_byte_raw()! } } 1 { inflate_block(mut r, mut out, fixed_ll, fixed_d)! } 2 { hlit := int(r.read_bits(5)!) + 257 hdist := int(r.read_bits(5)!) + 1 hclen := int(r.read_bits(4)!) + 4 mut cl_lens := []int{len: 19} for i in 0 .. hclen { cl_lens[cl_order[i]] = int(r.read_bits(3)!) } cl_tree := build_huff_tree(cl_lens) mut all_lens := []int{} for all_lens.len < hlit + hdist { sym := r.huff_decode(cl_tree)! if sym <= 15 { all_lens << int(sym) } else if sym == 16 { if all_lens.len == 0 { return error('inflate: repeat with empty history') } rep := int(r.read_bits(2)!) + 3 last := all_lens[all_lens.len - 1] for _ in 0 .. rep { all_lens << last } } else if sym == 17 { rep := int(r.read_bits(3)!) + 3 for _ in 0 .. rep { all_lens << 0 } } else if sym == 18 { rep := int(r.read_bits(7)!) + 11 for _ in 0 .. rep { all_lens << 0 } } else { return error('inflate: bad code length symbol') } } ll_tree := build_huff_tree(all_lens[..hlit]) d_tree := build_huff_tree(all_lens[hlit..]) inflate_block(mut r, mut out, ll_tree, d_tree)! } else { return error('inflate: reserved block type') } } if bfinal == 1 { break } } return out } @[direct_array_access] fn inflate_block(mut r BitReader, mut out []u8, ll HuffTree, dist HuffTree) ! { for { sym := r.huff_decode(ll)! if sym == 256 { break } if sym < 256 { out << u8(sym) } else { li := int(sym) - 257 if li < 0 || li >= length_bases.len { return error('inflate: invalid length symbol ${sym}') } length := length_bases[li] + int(r.read_bits(length_extra_bits[li])!) dsym := r.huff_decode(dist)! di := int(dsym) if di >= dist_bases.len { return error('inflate: invalid distance symbol ${dsym}') } distance := dist_bases[di] + int(r.read_bits(dist_extra_bits[di])!) if distance > out.len { return error('inflate: distance past output start') } base := out.len - distance for i in 0 .. length { out << out[base + i] } } } }