JpegFile.py

from struct import pack_into, unpack_from, pack, pack_into, calcsize
from io import BytesIO
from array import array
from copy import copy
import logging

logger = logging.getLogger(__name__)

component_map = {1: 'Y', 2: 'Cb', 3: 'Cr', 4: 'I', 5: 'Q'}

"""
References:

http://vip.sugovica.hu/Sardi/kepnezo/JPEG%20File%20Layout%20and%20Format.htm
Used for making JPEG parser

https://tools.ietf.org/html/rfc2435
Used as a reference RTP-MJPEG packetizer
"""


def clamp(x):
    """
    Clamps value to the range [0, 255]
    :param x:
    :return:
    """
    return 0 if x < 0 else 255 if x > 255 else x


class Readable(object):
    """
    Wrapper for IO operations from the buffer
    """
    __slots__ = 'data', 'position'

    def __init__(self, data):
        self.data = data
        self.position = 0

    def clone(self):
        return copy(self)

    def jump(self, position):
        self.position = position

    def skip(self, length):
        self.position += length

    def peek(self, prefix):
        return self.data.startswith(prefix, self.position)

    def read(self, length):
        p = self.position
        self.position += length
        return self.data[p:self.position]

    def parse(self, fmt):
        p = self.position
        self.position += calcsize(fmt)
        return unpack_from(fmt, self.data, p)

    def uint8(self):
        p = self.position
        self.position += 1
        return self.data[p]

    def uint16(self):
        d, p = self.data, self.position
        self.position += 2
        return d[p] << 8 | d[p+1]

    def uint32(self):
        d, p = self.data, self.position
        self.position += 4
        return d[p] << 24 | d[p+1] << 16 | d[p+2] << 8 | d[p+3]

    def int8(self):
        t = self.uint8()
        return t - ((t & (1 << 7)) << 1)

    def int16(self):
        t = self.uint16()
        return t - ((t & (1 << 15)) << 1)

    def int32(self):
        t = self.uint32()
        return t - ((t & (1 << 31)) << 1)

    def uint16le(self):
        d, p = self.data, self.position
        self.position += 2
        return d[p] | d[p+1] << 8

    def uint32le(self):
        d, p = self.data, self.position
        self.position += 4
        return d[p] | d[p+1] << 8 | d[p+2] << 16 | d[p+3] << 24

    def int16le(self):
        t = self.uint16le()
        return t - ((t & (1 << 15)) << 1)

    def int32le(self):
        t = self.uint32le()
        return t - ((t & (1 << 31)) << 1)


def _inverse_dct(block, q):
    # Ref.: Independent JPEG Group's "jidctint.c", v8d
    # Copyright (C) 1994-1996, Thomas G. Lane
    # Modification developed 2003-2009 by Guido Vollbeding
    for i in range(8):
        z2 = block[16+i]*q[16+i]
        z3 = block[48+i]*q[48+i]
        z1 = (z2 + z3)*4433 # FIX_0_541196100
        tmp2 = z1 + z2*6270 # FIX_0_765366865
        tmp3 = z1 - z3*15137 # FIX_1_847759065
        z2 = block[i]*q[i]
        z3 = block[32+i]*q[32+i]
        z2 <<= 13 # CONST_BITS
        z3 <<= 13
        z2 += 1024 # 1 << CONST_BITS-PASS1_BITS-1
        tmp0 = z2 + z3
        tmp1 = z2 - z3
        tmp10 = tmp0 + tmp2
        tmp13 = tmp0 - tmp2
        tmp11 = tmp1 + tmp3
        tmp12 = tmp1 - tmp3
        tmp0 = block[56+i]*q[56+i]
        tmp1 = block[40+i]*q[40+i]
        tmp2 = block[24+i]*q[24+i]
        tmp3 = block[8+i]*q[8+i]
        z2 = tmp0 + tmp2
        z3 = tmp1 + tmp3
        z1 = (z2 + z3)*9633 # FIX_1_175875602
        z2 = z2*-16069 # FIX_1_961570560
        z3 = z3*-3196 # FIX_0_390180644
        z2 += z1
        z3 += z1
        z1 = (tmp0 + tmp3)*-7373 # FIX_0_899976223
        tmp0 = tmp0*2446 # FIX_0_298631336
        tmp3 = tmp3*12299 # FIX_1_501321110
        tmp0 += z1 + z2
        tmp3 += z1 + z3
        z1 = (tmp1 + tmp2)*-20995 # FIX_2_562915447
        tmp1 = tmp1*16819 # FIX_2_053119869
        tmp2 = tmp2*25172 # FIX_3_072711026
        tmp1 += z1 + z3
        tmp2 += z1 + z2
        block[i] = (tmp10 + tmp3) >> 11 # CONST_BITS-PASS1_BITS
        block[56+i] = (tmp10 - tmp3) >> 11
        block[8+i] = (tmp11 + tmp2) >> 11
        block[48+i] = (tmp11 - tmp2) >> 11
        block[16+i] = (tmp12 + tmp1) >> 11
        block[40+i] = (tmp12 - tmp1) >> 11
        block[24+i] = (tmp13 + tmp0) >> 11
        block[32+i] = (tmp13 - tmp0) >> 11
    for i in range(0, 64, 8):
        z2 = block[2+i]
        z3 = block[6+i]
        z1 = (z2 + z3)*4433 # FIX_0_541196100
        tmp2 = z1 + z2*6270 # FIX_0_765366865
        tmp3 = z1 - z3*15137 # FIX_1_847759065
        z2 = block[i] + 16 # 1 << (PASS1_BITS+2)
        z3 = block[4+i]
        tmp0 = (z2 + z3) << 13 # CONST_BITS
        tmp1 = (z2 - z3) << 13
        tmp10 = tmp0 + tmp2
        tmp13 = tmp0 - tmp2
        tmp11 = tmp1 + tmp3
        tmp12 = tmp1 - tmp3
        tmp0 = block[7+i]
        tmp1 = block[5+i]
        tmp2 = block[3+i]
        tmp3 = block[1+i]
        z2 = tmp0 + tmp2
        z3 = tmp1 + tmp3
        z1 = (z2 + z3)*9633 # FIX_1_175875602
        z2 = z2*-16069 # FIX_1_961570560
        z3 = z3*-3196 # FIX_0_390180644
        z2 += z1
        z3 += z1
        z1 = (tmp0 + tmp3)*-7373 # FIX_0_899976223
        tmp0 = tmp0*2446 # FIX_0_298631336
        tmp3 = tmp3*12299 # FIX_1_501321110
        tmp0 += z1 + z2
        tmp3 += z1 + z3
        z1 = (tmp1 + tmp2)*-20995 # FIX_2_562915447
        tmp1 = tmp1*16819 # FIX_2_053119869
        tmp2 = tmp2*25172 # FIX_3_072711026
        tmp1 += z1 + z3
        tmp2 += z1 + z2
        block[i] = (tmp10 + tmp3) >> 18 # (CONST_BITS+PASS1_BITS+3)
        block[7+i] = (tmp10 - tmp3) >> 18
        block[1+i] = (tmp11 + tmp2) >> 18
        block[6+i] = (tmp11 - tmp2) >> 18
        block[2+i] = (tmp12 + tmp1) >> 18
        block[5+i] = (tmp12 - tmp1) >> 18
        block[3+i] = (tmp13 + tmp0) >> 18
        block[4+i] = (tmp13 - tmp0) >> 18


def _forward_dct(block):
    # Ref.: Independent JPEG Group's "jfdctint.c", v8d
    # Copyright (C) 1994-1996, Thomas G. Lane
    # Modification developed 2003-2009 by Guido Vollbeding
    """
    :param block: contains input data. Output will be stored right here
    """
    for i in range(0, 64, 8):
        tmp0 = block[i] + block[i+7]
        tmp1 = block[i+1] + block[i+6]
        tmp2 = block[i+2] + block[i+5]
        tmp3 = block[i+3] + block[i+4]
        tmp10 = tmp0 + tmp3
        tmp12 = tmp0 - tmp3
        tmp11 = tmp1 + tmp2
        tmp13 = tmp1 - tmp2
        tmp0 = block[i] - block[i+7]
        tmp1 = block[i+1] - block[i+6]
        tmp2 = block[i+2] - block[i+5]
        tmp3 = block[i+3] - block[i+4]
        block[i] = (tmp10 + tmp11 - 8*128) << 2  # PASS1_BITS
        block[i+4] = (tmp10 - tmp11) << 2
        z1 = (tmp12 + tmp13)*4433  # FIX_0_541196100
        z1 += 1024  # 1 << (CONST_BITS-PASS1_BITS-1)
        block[i+2] = (z1 + tmp12*6270) >> 11  # FIX_0_765366865
        block[i+6] = (z1 - tmp13*15137) >> 11  # FIX_1_847759065
        tmp10 = tmp0 + tmp3
        tmp11 = tmp1 + tmp2
        tmp12 = tmp0 + tmp2
        tmp13 = tmp1 + tmp3
        z1 = (tmp12 + tmp13)*9633  # FIX_1_175875602
        z1 += 1024  # 1 << (CONST_BITS-PASS1_BITS-1)
        tmp0 = tmp0*12299  # FIX_1_501321110
        tmp1 = tmp1*25172  # FIX_3_072711026
        tmp2 = tmp2*16819  # FIX_2_053119869
        tmp3 = tmp3*2446  # FIX_0_298631336
        tmp10 = tmp10*-7373  # FIX_0_899976223
        tmp11 = tmp11*-20995  # FIX_2_562915447
        tmp12 = tmp12*-3196  # FIX_0_390180644
        tmp13 = tmp13*-16069  # FIX_1_961570560
        tmp12 += z1
        tmp13 += z1
        block[i+1] = (tmp0 + tmp10 + tmp12) >> 11
        block[i+3] = (tmp1 + tmp11 + tmp13) >> 11
        block[i+5] = (tmp2 + tmp11 + tmp12) >> 11
        block[i+7] = (tmp3 + tmp10 + tmp13) >> 11

    for i in range(8):
        tmp0 = block[i] + block[i+56]
        tmp1 = block[i+8] + block[i+48]
        tmp2 = block[i+16] + block[i+40]
        tmp3 = block[i+24] + block[i+32]
        tmp10 = tmp0 + tmp3 + 2  # 1 << (PASS1_BITS-1)
        tmp12 = tmp0 - tmp3
        tmp11 = tmp1 + tmp2
        tmp13 = tmp1 - tmp2
        tmp0 = block[i] - block[i+56]
        tmp1 = block[i+8] - block[i+48]
        tmp2 = block[i+16] - block[i+40]
        tmp3 = block[i+24] - block[i+32]
        block[i] = (tmp10 + tmp11) >> 2  # PASS1_BITS
        block[i+32] = (tmp10 - tmp11) >> 2
        z1 = (tmp12 + tmp13)*4433  # FIX_0_541196100
        z1 += 16384  # 1 << (CONST_BITS+PASS1_BITS-1)
        block[i+16] = (z1 + tmp12*6270) >> 15  # FIX_0_765366865, CONST_BITS+PASS1_BITS
        block[i+48] = (z1 - tmp13*15137) >> 15  # FIX_1_847759065
        tmp10 = tmp0 + tmp3
        tmp11 = tmp1 + tmp2
        tmp12 = tmp0 + tmp2
        tmp13 = tmp1 + tmp3
        z1 = (tmp12 + tmp13)*9633  # FIX_1_175875602
        z1 += 16384 # 1 << (CONST_BITS+PASS1_BITS-1)
        tmp0 = tmp0*12299  # FIX_1_501321110
        tmp1 = tmp1*25172  # FIX_3_072711026
        tmp2 = tmp2*16819  # FIX_2_053119869
        tmp3 = tmp3*2446  # FIX_0_298631336
        tmp10 = tmp10*-7373  # FIX_0_899976223
        tmp11 = tmp11*-20995  # FIX_2_562915447
        tmp12 = tmp12*-3196  # FIX_0_390180644
        tmp13 = tmp13*-16069  # FIX_1_961570560
        tmp12 += z1
        tmp13 += z1
        block[i+8] = (tmp0 + tmp10 + tmp12) >> 15  # CONST_BITS+PASS1_BITS
        block[i+24] = (tmp1 + tmp11 + tmp13) >> 15
        block[i+40] = (tmp2 + tmp11 + tmp12) >> 15
        block[i+56] = (tmp3 + tmp10 + tmp13) >> 15

# Zig-zag indices of AC coefficients
_z_z = bytearray([
         1,  8, 16,  9,  2,  3, 10, 17, 24, 32, 25, 18, 11,  4,  5,
    12, 19, 26, 33, 40, 48, 41, 34, 27, 20, 13,  6,  7, 14, 21, 28,
    35, 42, 49, 56, 57, 50, 43, 36, 29, 22, 15, 23, 30, 37, 44, 51,
    58, 59, 52, 45, 38, 31, 39, 46, 53, 60, 61, 54, 47, 55, 62, 63])

# Luminance quantization table in zig-zag order
_luminance_quantization = bytearray([
    16, 11, 12, 14, 12, 10, 16, 14, 13, 14, 18, 17, 16, 19, 24, 40,
    26, 24, 22, 22, 24, 49, 35, 37, 29, 40, 58, 51, 61, 60, 57, 51,
    56, 55, 64, 72, 92, 78, 64, 68, 87, 69, 55, 56, 80,109, 81, 87,
    95, 98,103,104,103, 62, 77,113,121,112,100,120, 92,101,103, 99])

# Chrominance quantization table in zig-zag order
_chrominance_quantization = bytearray([
    17, 18, 18, 24, 21, 24, 47, 26, 26, 47, 99, 66, 56, 66, 99, 99,
    99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99,
    99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99,
    99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99])

# These are standard tables, used for MJPEG streaming

# Standard MJPEG Luminance DC code lengths
_lum_dc_code_length = bytearray([0, 1, 5, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0])

# Standard MJPEG Luminance DC values
_lum_dc_symbols = bytearray([0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11])

# Standard MJPEG Luminance AC code lengths
_lum_ac_code_length = bytearray([0, 2, 1, 3, 3, 2, 4, 3, 5, 5, 4, 4, 0, 0, 1, 125])

# Standard MJPEG Luminance AC values
_lum_ac_symbols = bytearray([
      1,  2,  3,  0,  4, 17,  5, 18, 33, 49, 65,  6, 19, 81, 97,  7, 34,113,
     20, 50,129,145,161,  8, 35, 66,177,193, 21, 82,209,240, 36, 51, 98,114,
    130,  9, 10, 22, 23, 24, 25, 26, 37, 38, 39, 40, 41, 42, 52, 53, 54, 55,
     56, 57, 58, 67, 68, 69, 70, 71, 72, 73, 74, 83, 84, 85, 86, 87, 88, 89,
     90, 99,100,101,102,103,104,105,106,115,116,117,118,119,120,121,122,131,
    132,133,134,135,136,137,138,146,147,148,149,150,151,152,153,154,162,163,
    164,165,166,167,168,169,170,178,179,180,181,182,183,184,185,186,194,195,
    196,197,198,199,200,201,202,210,211,212,213,214,215,216,217,218,225,226,
    227,228,229,230,231,232,233,234,241,242,243,244,245,246,247,248,249,250])

# Standard MJPEG Chrominance DC code lengths
_chm_dc_codelens = bytearray([0, 3, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0])

# Standard MJPEG Chrominance DC values
_chm_dc_symbols = bytearray([0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11])

# Standard MJPEG Chrominance AC code lengths
_ca_lengths = bytearray([ 0, 2, 1, 2, 4, 4, 3, 4, 7, 5, 4, 4, 0, 1, 2, 119])

"""
u_char chm_dc_codelens[] = { 0, 3, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, };

u_char chm_dc_symbols[] = { 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, };

u_char chm_ac_codelens[] = { 0, 2, 1, 2, 4, 4, 3, 4, 7, 5, 4, 4, 0, 1, 2, 0x77, };
"""

# Standard MJPEG Chrominance AC values
_ca_values = bytearray([
      0,  1,  2,  3, 17,  4,  5, 33, 49,  6, 18, 65, 81,  7, 97,113, 19, 34,
     50,129,  8, 20, 66,145,161,177,193,  9, 35, 51, 82,240, 21, 98,114,209,
     10, 22, 36, 52,225, 37,241, 23, 24, 25, 26, 38, 39, 40, 41, 42, 53, 54,
     55, 56, 57, 58, 67, 68, 69, 70, 71, 72, 73, 74, 83, 84, 85, 86, 87, 88,
     89, 90, 99,100,101,102,103,104,105,106,115,116,117,118,119,120,121,122,
    130,131,132,133,134,135,136,137,138,146,147,148,149,150,151,152,153,154,
    162,163,164,165,166,167,168,169,170,178,179,180,181,182,183,184,185,186,
    194,195,196,197,198,199,200,201,202,210,211,212,213,214,215,216,217,218,
    226,227,228,229,230,231,232,233,234,242,243,244,245,246,247,248,249,250])


class EntropyDecoder(object):

    def __init__(self, readable):
        self.readable = readable
        self.value = 0
        self.length = 0
        self.rst = 0

    def restart(self):
        marker = self.readable.uint16()
        if marker != 0xffd0 + self.rst:
            raise ValueError('Invalid RST marker.')
        self.value = 0
        self.length = 0
        self.rst = (self.rst + 1) & 7

    def fill(self, length):
        while True:
            byte = self.readable.uint8()
            self.value = ((self.value & 0xffff) << 8) | byte
            self.length += 8
            if byte == 0xff:
                byte = self.readable.uint8()
                if byte != 0:
                    self.readable.position -= 2
            if self.length >= length:
                break

    def decode_huffman(self, cache):
        if self.length < 16:
            self.fill(16)
        key = (self.value >> (self.length - 16)) & 0xffff
        size = cache.sizes[key]
        if size == 255:
            raise ValueError('Corrupted Huffman sequence.')
        code = (self.value >> (self.length - size)) & ((1 << size) - 1)
        self.length -= size
        return cache.values[code - cache.offsets[size]]

    def receive_extend(self, length):
        if self.length < length:
            self.fill(length)
        value = (self.value >> (self.length - length)) & ((1 << length) - 1)
        self.length -= length
        if value < 1 << (length - 1):
            return value - (1 << length) + 1
        return value

    def decode(self, previous, block, dc, ac):
        i = 0
        while i < 64:
            block[i] = block[i + 1] = block[i + 2] = block[i + 3] = 0
            i += 4
        t = self.decode_huffman(dc)
        d = 0 if t == 0 else self.receive_extend(t)
        previous += d
        block[0] = previous
        i = 0
        while i < 63:
            rs = self.decode_huffman(ac)
            s = rs & 15
            r = rs >> 4
            if s == 0:
                if r != 15:
                    break
                i += 16
            else:
                i += r
                block[_z_z[i]] = self.receive_extend(s)
                i += 1

        return previous

    def decode_and_dct(self, previous, block, q, dc, ac):
        i = 0
        while i < 64:
            block[i] = block[i + 1] = block[i + 2] = block[i + 3] = 0
            i += 4
        t = self.decode_huffman(dc)
        d = 0 if t == 0 else self.receive_extend(t)
        previous += d
        block[0] = previous
        i = 0
        while i < 63:
            rs = self.decode_huffman(ac)
            s = rs & 15
            r = rs >> 4
            if s == 0:
                if r != 15:
                    break
                i += 16
            else:
                i += r
                block[_z_z[i]] = self.receive_extend(s)
                i += 1
        _inverse_dct(block, q)
        return previous


def decompress_impl(image, readable):
    if not image.components:
        raise ValueError('Missing SOF segment.')
    if not image.scans:
        raise ValueError('Missing SOS segment.')
    if not image.qtables:
        raise ValueError('Missing DQT segment.')
    if not image.htables:
        raise ValueError('Missing DHT segment.')
    if image.progressive:
        raise ValueError('Progressive DCT not supported.')

    print("Will try to decode %d bytes" % len(readable.data))
    w, h, n = image.width, image.height, len(image.components)
    interval, transform = image.reset_interval, image.transform
    d = EntropyDecoder(readable)
    data = bytearray(w * h * n)
    predictions = [0, 0, 0, 0]
    ublock, vblock, kblock = [0] * 64, [0] * 64, [0] * 64

    yblocks = [0] * 64, [0] * 64, [0] * 64, [0] * 64
    blocks = [yblocks, [ublock], [vblock], [kblock]]
    hs = [c.h for c in image.components]
    vs = [c.v for c in image.components]
    qs = [image.qtables[c.destination] for c in image.components]
    dcs = [image.htables[image.scans[c.identifier].dc] for c in image.components]
    acs = [image.htables[image.scans[c.identifier].ac] for c in image.components]
    h0, v0 = hs[0], vs[0]
    hb, vb = h0.bit_length() - 1, v0.bit_length() - 1

    # These are functions for color transformations
    def decode_color_block1(x, y, sx, sy):
        yblock = yblocks[sx + sy * h0]
        for by in range(min(8, h - y - sy * 8)):
            for bx in range(min(8, w - x - sx * 8)):
                i = ((sx * 8 + bx) >> hb) + ((sy * 8 + by) >> vb) * 8
                j = (x + sx * 8 + bx + (y + sy * 8 + by) * w) * n
                data[j] = clamp(yblock[i] + 128)

    def decode_color_block3(x, y, sx, sy):
        yblock = yblocks[sx + sy * h0]
        for by in range(min(8, h - y - sy * 8)):
            for bx in range(min(8, w - x - sx * 8)):
                i = ((sx * 8 + bx) >> hb) + ((sy * 8 + by) >> vb) * 8
                j = (x + sx * 8 + bx + (y + sy * 8 + by) * w) * n
                t, u, v = yblock[bx + by * 8], ublock[i], vblock[i]
                t = (t << 16) + 8421376
                data[j] = clamp((t + 91881 * v) >> 16)
                data[j + 1] = clamp((t - 22554 * u - 46802 * v) >> 16)
                data[j + 2] = clamp((t + 116130 * u) >> 16)

    def decode_color_block4(x, y, sx, sy):
        yblock = yblocks[sx + sy * h0]
        for by in range(min(8, h - y - sy * 8)):
            for bx in range(min(8, w - x - sx * 8)):
                i = ((sx * 8 + bx) >> hb) + ((sy * 8 + by) >> vb) * 8
                j = (x + sx * 8 + bx + (y + sy * 8 + by) * w) * n
                t, u, v, k = yblock[bx + by * 8], ublock[i], vblock[i], kblock[i]
                data[j] = clamp(t + 128)
                data[j + 1] = clamp(u + 128)
                data[j + 2] = clamp(v + 128)
                data[j + 3] = clamp(k + 128)

    def decode_color_block4_transformed(x, y, sx, sy):
        yblock = yblocks[sx + sy * h0]
        for by in range(min(8, h - y - sy * 8)):
            for bx in range(min(8, w - x - sx * 8)):
                i = ((sx * 8 + bx) >> hb) + ((sy * 8 + by) >> vb) * 8
                j = (x + sx * 8 + bx + (y + sy * 8 + by) * w) * n
                t, u, v, k = yblock[bx + by * 8], ublock[i], vblock[i], kblock[i]

                t = (t << 16) + 8421376
                data[j] = 255 - clamp((t + 91881 * v) >> 16)
                data[j + 1] = 255 - clamp((t - 22554 * u - 46802 * v) >> 16)
                data[j + 2] = 255 - clamp((t + 116130 * u) >> 16)
                data[j + 3] = clamp(k + 128)

    color_decoder = None

    if n == 1:
        color_decoder = decode_color_block1
    elif n == 3:
        color_decoder = decode_color_block3
    elif n == 4:
        if image.transform:
            color_decoder = decode_color_block4_transformed
        else:
            color_decoder = decode_color_block4

    count = 0
    if interval == 0:
        interval = ((w + 8 * h0 - 1) // (8 * h0)) * ((h + 8 * v0 - 1) // (8 * v0))
    for y in range(0, h, 8 * v0):
        for x in range(0, w, 8 * h0):
            count += 1
            if count > interval:
                d.restart()
                predictions[:] = [0, 0, 0, 0]
                count = 1
            for i in range(n):
                for j in range(hs[i] * vs[i]):
                    section = blocks[i][j]
                    predictions[i] = d.decode(predictions[i], section, dcs[i], acs[i])
                    _inverse_dct(section, qs[i])

            for sy in range(v0):
                for sx in range(h0):
                    color_decoder(x, y, sx, sy)

    if not readable.peek(b'\xff\xd9'):  # EOI
        raise ValueError('Missing EOI segment.')
    return data


class JpegFile:
    HAVE_PIXELS = 1
    HAVE_BLOCKS = 2

    STATUS_JPEG_BLOCKS = 1
    DefaultChromaQuant = _chrominance_quantization
    DefaultLumaQuant = _luminance_quantization

    class ParserState:
        """
        State for parsing jpeg file
        """
        def __init__(self):
            self.error = 0
            self.found_quant = 0
            self.found_soi = 0
            self.found_sof = 0
            self.found_sofn = 0
            self.found_dqt = 0
            self.found_dht = 0
            self.found_jfif = 0
            self.found_data = False
            self.done = False
    """
    Dissector for JPEG file
    """
    def __init__(self):
        self.width = 0
        self.height = 0
        self.bit = 0
        # Expected number of MCU blocks
        self.nmcu = None
        self.type = 0
        self.reset_interval = 0

        # Flag shows that
        self.flags = 0

        # Color components
        self.components = []

        # DCT-coded MCU blocks
        self._coded_mcu_blocks = []

        # Decoded MCU blocks
        self._mcu_blocks = []

        # bytearray with raw scanlines from jpeg file
        self._image_data = None
        self.pixels = None

        # Thumbnail stuff
        self._has_thumbnail = False
        self._thumb_width = 0
        self._thumb_height = 0

        self.progressive = False

        # Quantization tables, lqt, cqt
        self.qtables = {}
        # Raw quantitization tables, as specified in the file
        self.qtables_raw = {}

        # Huffman tables,
        self.htables = {}

        # Coding table destinations for a scan
        self.scans = {}

        self.transform = False
        self._parse_state = None
        self._raw_blocks = []

    # Reset parser to initial state
    def reset(self):
        self.width = 0
        self.height = 0
        self.bit = 0
        self.nmcu = None
        self.reset_interval = 0
        self.qtables = {}
        self.htables = {}
        self.scans = {}
        self._raw_blocks = []
        self._has_thumbnail = False
        self._parse_state = self.ParserState()

    @property
    def image_data(self):
        return self._image_data

    def _add_raw_block(self, hdr_lo, hdr_hi, data):
        """
        Adds raw block to the storage
        :param hdr_lo: lower byte of the header id
        :param hdr_hi: upper byte of the header id
        :param data: raw data
        """
        hdr = hdr_lo | (hdr_hi << 8)
        self._raw_blocks.append((hdr, data))

    def write_chroma(self, out, offset):
        """
        Writes jpeg chroma table to a specified location of a bytearray
        :param out:bytes output data
        :param offset:int offset to the table
        """
        out[offset:offset + 64] = self.qtables[0][0:64]

    def write_luma(self, out, offset):
        """
        Writes jpeg luminance table to a specified location of a bytearray
        :param out:bytes output data
        :param offset:int offset to the table
        """
        out[offset:offset + 64] = self.qtables[1][0:64]

    def load_data(self, jpeg_bytes, offset=0, end=0):
        """
        Parses JPEG header from a block of data
        :param jpeg_bytes: a list of bytes
        :param offset:int byte offset to start of image data
        :param end:int byte offset to an end of data block
        :return:
        """

        start = offset

        if end == 0:
            end = len(jpeg_bytes)

        self.reset()

        if jpeg_bytes[offset+0] != 0xff or jpeg_bytes[offset+1] != 0xd8:
            logger.error("No SOI header at start")
            return False

        pstate = self._parse_state
        pstate.done = False

        while offset+4 < end and not pstate.done:
            temp_data = jpeg_bytes[offset:]          # Debug view of the data
            (head_lo, head_hi) = unpack_from('!BB', jpeg_bytes, offset)
            head = (head_lo << 8) | head_hi

            handler = self.block_parsers.get(head)
            if handler:
                try:
                    offset += handler(self, jpeg_bytes, offset, pstate)
                except:  # Everything we catch here is really internal crap
                    logger.error("Internal JPEG decoder error")

            else:
                length = unpack_from("!H", jpeg_bytes, offset + 2)[0]
                logger.warn("Unknown block %x:%x len=%d at offset=%d" % (head_lo, head_hi, length, offset))
                next_block = temp_data[length:]
                offset += length

        if pstate.found_data:
            if offset + 2 >= end:
                logger.error("Data is too short: %d bytes" % (end - offset))
                return False
            else:
                # Try end of data block
                (head_lo, head_hi) = unpack_from('!BB', jpeg_bytes, end-2)
                if head_lo != 0xff and head_hi != 0xd9:
                    logger.error("Missing EOI block")
                self._image_data = jpeg_bytes[offset:end]

                logger.debug("Length of image data=%d bytes" % len(self._image_data))
                return True
        return False

    def _parse_jfif(self, data, offset, pstate):
        pos = 0
        (app_l, app_h, length) = unpack_from("!BBH", data, offset)
        logger.debug("Parsing JFIF block id=%x:%x len=%d" % (app_l, app_h, length))
        if app_l != 0xff and app_h != 0xe0:
            logger.error("Wrong APP0 header %x:%x" % (app_l, app_h))
            return length+2
        pos += 4
        id = unpack_from("!5c", data, offset+pos)
        # Should be 'JFIF'#0 (0x4a, 0x46, 0x49, 0x46, 0x00)
        pos += 5
        (version_major, version_minor, units) = unpack_from("!BBB", data, offset+pos)
        if version_major != 1:
            logger.warn("Strange JFIF version %d.%d" % (version_major, version_minor))
        pos += 3

        (width, height, xtumb, ytumb) = unpack_from("!hhbb", data, offset+pos)
        pos += 6
        if 2 + length - pos > 0:
            thumb_data = 3*width*height

        if xtumb > 0 or ytumb > 0:
            logger.debug("Expecting thumbnail %dx%d" % (xtumb, ytumb))
            self._thumb_height = ytumb
            self._thumb_width = xtumb

        pstate.found_jfif += 1
        return length+2

    def _parse_start_of_image(self, data, offset, pstate):
        (app_l, app_h) = unpack_from("!BB", data, offset)
        logger.debug("Parsing SOI block id=%x:%x" % (app_l, app_h))
        pstate.found_soi += 1
        return 2

    def _parse_comment(self, data, offset, pstate):
        (app_l, app_h, length) = unpack_from("!BBH", data, offset)
        if app_l != 0xff or app_h != 0xfe:
            logger.debug("Not a comment block id=%x:%x" % (app_l, app_h))
        else:
            logger.debug("Found comment block id=%x:%x" % (app_l, app_h))
        return length+2

    def _parse_start_of_frames(self, data, offset, pstate):
        """
        SOF0 (Start Of Frame 0) marker:

        Field                   Size                      Description
        Marker Identifier       2 bytes    0xff, 0xc0 to identify SOF0 marker
        Length                  2 bytes    This value equals to 8 + components*3 value
        Data precision          1 byte     This is in bits/sample, usually 8 (12 and 16 not supported by most software).
        Image height            2 bytes    This must be > 0
        Image Width             2 bytes    This must be > 0
        Number of components    1 byte     Usually 1 = grey scaled, 3 = color YcbCr or YIQ, 4 = color CMYK
        Each component          3 bytes    Read each component data of 3 bytes. It contains,
                                           (component Id(1byte)(1 = Y, 2 = Cb, 3 = Cr, 4 = I, 5 = Q),
                                           sampling factors (1byte) (bit 0-3 vertical., 4-7 horizontal.),
                                           quantization table number (1 byte)).
        Remarks:     JFIF uses either 1 component (Y, greyscaled) or 3 components (YCbCr, sometimes called YUV, colour).
        """
        (app_l, app_h, length) = unpack_from("!BBH", data, offset)
        if app_l == 0xff and app_h in range(0xc0, 0xcf):
            logger.debug("Parsing SOF block id=%x:%x len=%d" % (app_l, app_h, length))
        else:
            logger.error("Block mismatch")
            return None

        if app_h == 0xc2:
            logger.warn("This is progressive encoding!")

        pos = 4
        (precision, self.height, self.width, num_components) = unpack_from("!BHHB", data, offset+pos)
        pos += 6
        logger.debug("\t - image size %dx%d" % (self.width, self.height))
        pstate.found_sof += 1

        if num_components == 1:
            kind = 'g'
        elif num_components == 3:
            kind = 'rgb'
        elif num_components == 4:
            kind = 'cmyk'

        self.kind = kind

        for i in range(0, num_components):
            (comp_id, comp_sampling, quant_table) = unpack_from("!3B", data, offset+pos)
            h, v = comp_sampling >> 4, comp_sampling & 15
            if h not in (1, 2, 4):
                raise ValueError('Invalid horizontal sampling factor.')
            if v not in (1, 2, 4):
                raise ValueError('Invalid vertical sampling factor.')
            if i > 0:
                if h != 1 or v != 1:
                    raise ValueError('Unsupported sampling factor.')

            if num_components == 1:
                h, v = 1, 1
            logger.debug("\t -component %s samp=%d, qt=%d" % (component_map.get(comp_id, 'N'), comp_sampling, quant_table))
            self.components.append(Component(comp_id, h, v, quant_table))

            if i == 0:
                if comp_sampling == 0x11:
                    self.type = 0
                elif comp_sampling == 0x22:
                    self.type = 1
                else:
                    logger.error("\twrong sampling factor %d for Y component!"%comp_sampling)
            pos += 3
        """
        depth, height, width, n = readable.parse('>BHHB')
        if depth != 8:
            raise ValueError('Unsupported sample precision.')
        if n == 1:
            kind = 'g'
        elif n == 3:
            kind = 'rgb'
        elif n == 4:
            kind = 'cmyk'
        else:
            ValueError('Unsupported color type.')
        for i in range(n):
            identifier, sampling, destination = readable.parse('>BBB')
            h, v = sampling >> 4, sampling & 15
            if h not in (1, 2, 4):
                raise ValueError('Invalid horizontal sampling factor.')
            if v not in (1, 2, 4):
                raise ValueError('Invalid vertical sampling factor.')
            if i > 0:
                if h != 1 or v != 1:
                    raise ValueError('Unsupported sampling factor.')
            if n == 1:
                h, v = 1, 1
            components.append(_frame_component(identifier, h, v, destination))
        return width, height, kind, n
        """
        return length + 2

    def _parse_dri(self, data, offset, pstate):
        """
        Parsing DRI block
        In fact we just skip this block

        # Block structure:
        Marker Identifier   2 bytes     0xff, 0xdd  identifies DRI marker
        Length              2 bytes     It must be 4
        Restart interval    2 bytes     This is in units of MCU blocks, means that every n
                                        MCU blocks a RSTn marker can be found.The first marker
                                        will be RST0, then RST1 etc, after RST7 repeating from RST0.
        """
        (app_l, app_h, length, self.reset_interval) = unpack_from("!BBH", data, offset)
        if app_l == 0xff and app_h == 0xdd:
            logger.debug("Parsed DRI block id=%x:%x len=%d" % (app_l, app_h, length))
        return length + 2

    def _parse_huffman_table(self, data, offset, pstate):
        """
        Parsing Huffman table
        :param data:
        :param offset:
        :return:int number of bytes parsed

        HT block structure:
            int16 bid
            int16 length
            int8 flags
            int8[16] ht_header
            int8[] table_data
        """
        (app_l, app_h, length) = unpack_from("!BBH", data, offset)
        offset += 4

        if app_l != 0xff or app_h != 0xc4 or length < 16:
            logger.error("Wrong DHT block id=%x:%x len=%d" % (app_l, app_h, length))

        self.progressive = (app_h == 0xc2)

        offset_end = offset + length - 2

        while offset_end - offset > 17:
            table_flags = data[offset]
            offset += 1
            identifier = table_flags & 0b111

            if identifier >= 2:
                raise ValueError('Unsupported htable destination identifier.')

            is_dc = (table_flags & 0b0001000) == 0

            # Obtaining header of the table
            lengths = unpack_from("!BBBBBBBBBBBBBBBB", data, offset)
            offset += 16

            total_len = 0
            for l in lengths:
                total_len += l

            if is_dc:
                logger.info("Found id=%x:%x len=%d DHT DC table=%d header=%s table_len=%d" %
                             (app_l, app_h, length, identifier, lengths, total_len))
            else:
                logger.info("Found id=%x:%x len=%d DHT AC table=%d header=%s table_len=%d" %
                             (app_l, app_h, length, identifier, lengths, total_len))

            values = data[offset:offset + total_len]
            self.htables[table_flags] = HuffmanCachedTable(lengths, values)
            pstate.found_dht += 1
            offset += total_len

        if offset != offset_end:
            logger.error("DHT table parser has %d bytes left" % (offset_end - offset))
            return length + 2

        return length + 2

    def _parse_start_of_frame_n(self, data, offset, pstate):
        # We skip this block
        (app_l, app_h, length) = unpack_from("!BBH", data, offset)
        if app_l == 0xff and app_h in range(0xc0, 0xcf):
            logger.error("Skipping SOFn block id=%x:%x len=%d" % (app_l, app_h, length))
            pstate.found_sofn += 1
        return length+2

    def _parse_quant_block(self, data, offset, pstate):
        (head_lo, head_hi, length) = unpack_from('!BBH', data, offset)
        offset += 4
        if head_lo != 0xff and head_hi != 0xdb:
            logger.error("Failed to find DQT header")
            return length + 2
        logger.info("Parsing Quantization block id=%x:%x len=%d" % (head_lo, head_hi, length))

        offset_end = offset + length - 2

        while offset_end - offset >= 65:
            info = data[offset]
            offset += 1
            precision, table_index = info >> 4, info & 15
            table_length = 64*(precision+1)
            if precision != 0:  # Unsuported qtable element precision.
                offset += table_length
                continue
            if table_index >= 4:  # Invalid qtable destination identifier.
                offset += table_length
                continue
            qt = data[offset:offset+table_length]
            table = bytearray(64)
            table[0] = qt[0]
            i = 1
            for z in _z_z:
                table[z] = qt[i]

            pstate.found_quant += 1

            self.qtables[table_index] = table
            self.qtables_raw[table_index] = qt
            offset += table_length

        if offset != offset_end:
            logger.error("DQT table parser has %d bytes left" % (offset_end - offset))
            return length + 2

        return 2+length

    def _parse_sos(self, data, offset, pstate):
        """
        Parses Start of Scan block
        Marker Identifier             2 bytes      0xff, 0xda identify SOS marker
        Length                        2 bytes      This must be equal to 6+2*(number of components in scan).
        Number of Components in scan  1 byte       This must be >= 1 and <=4 (otherwise error), usually 1 or 3
        Each component                2 bytes      For each component, read 2 bytes. It contains,
                                                         1 byte   Component Id (1=Y, 2=Cb, 3=Cr, 4=I, 5=Q),
                                                         1 byte   Huffman table to use :
                                                               bit 0..3 : AC table (0..3)
                                                               bit 4..7 : DC table (0..3)
        Ignorable Bytes               3 bytes      We have to skip 3 bytes.
        """
        (head_lo, head_hi, length, num_components) = unpack_from('!BBHB', data, offset)

        if num_components not in range(1, 4):
            logger.warn("\t %d - strange number of components" % num_components)
        pos = 5
        for c in range(0, num_components):
            (comp_id, table_flags) = unpack_from('!BB', data, offset+pos)
            comp_name = component_map.get(comp_id, 'N')
            ac_table = table_flags & 0b1111
            dc_table = (table_flags >> 4) & 0b1111
            logger.info("\t- component %s uses Huffman AC table %d DC table %d" % (comp_name, ac_table, dc_table))
            # ACs always have Tc == 1
            self.scans[comp_id] = CodingDestination(dc_table, 16 | ac_table)
            pos += 2

        (scan_start, scan_end, bit_pos) = unpack_from('!BBB', data, offset+pos)
        pos += 3

        logger.debug("Parsing Start Of Scan id=%x:%x len=%d, start=%d, end=%d" % (head_lo, head_hi, length, scan_start, scan_end))

        pstate.found_data = True
        pstate.done = True

        return length + 2

    def _parse_end_of_image(self, data, offset, pstate):
        logger.debug("Parsing End Of Image")
        (head_lo, head_hi, length) = unpack_from('!BBH', data, offset)
        pstate.done = True
        return length + 2

    def decompress(self):
        """
        Does full jpeg decompression
        :return:bytearray decompressed pixel data
        """
        readable = Readable(self._image_data)
        data = decompress_impl(self, readable)
        return data

    # Defining JFIF blocks to be parsed
    HEADER_SOI = 0xffd8
    HEADER_APP0 = 0xffe0
    HEADER_SOS = 0xffda
    HEADER_QUANT = 0xffdb
    HEADER_DRI = 0xffdd
    HEADER_EOI = 0xffd9

    # Contains a table of parsers for each defined block type
    block_parsers = {
        HEADER_SOI: _parse_start_of_image,
        HEADER_APP0: _parse_jfif,
        HEADER_DRI: _parse_dri,
        0xffc0: _parse_start_of_frames,
        0xffc1: _parse_start_of_frames,
        0xffc2: _parse_start_of_frames,
        0xffc3: _parse_start_of_frame_n,
        0xffc4: _parse_huffman_table,
        0xffc5: _parse_start_of_frame_n,
        0xffc6: _parse_start_of_frame_n,
        0xffc7: _parse_start_of_frame_n,
        0xffc9: _parse_start_of_frame_n,
        0xffca: _parse_start_of_frame_n,
        0xffcb: _parse_start_of_frame_n,
        0xffcd: _parse_start_of_frame_n,
        0xffce: _parse_start_of_frame_n,
        0xffcf: _parse_start_of_frame_n,
        HEADER_SOS: _parse_sos,
        HEADER_QUANT: _parse_quant_block,
        HEADER_EOI: _parse_end_of_image,
        0xfffe: _parse_comment
    }


def _parse_sof(readable, components):
    depth, height, width, n = readable.parse('>BHHB')
    if depth != 8:
        raise ValueError('Unsupported sample precision.')
    if n == 1:
        kind = 'g'
    elif n == 3:
        kind = 'rgb'
    elif n == 4:
        kind = 'cmyk'
    else:
        ValueError('Unsupported color type.')
    for i in range(n):
        identifier, sampling, destination = readable.parse('>BBB')
        h, v = sampling >> 4, sampling & 15
        if h not in (1, 2, 4):
            raise ValueError('Invalid horizontal sampling factor.')
        if v not in (1, 2, 4):
            raise ValueError('Invalid vertical sampling factor.')
        if i > 0:
            if h != 1 or v != 1:
                raise ValueError('Unsupported sampling factor.')
        if n == 1:
            h, v = 1, 1
        components.append(Component(identifier, h, v, destination))
    return width, height, kind, n


def _parse_dqt(readable, length, qtables):
    end = readable.position + length
    while readable.position < end:
        pqtq = readable.uint8()
        precision, destination = pqtq >> 4, pqtq & 15
        if precision != 0:
            raise ValueError('Unsuported qtable element precision.')
        if destination >= 4:
            raise ValueError('Invalid qtable destination identifier.')
        elements = readable.read(64)
        table = bytearray(64)
        table[0] = elements[0]
        i = 1
        for z in _z_z:
            table[z] = elements[i]
        qtables[destination] = table
    if readable.position != end:
        raise ValueError('Invalid DQT length.')


def _parse_dht(readable, length, htables):
    end = readable.position + length
    while readable.position < end:
        tcth = readable.uint8()
        kind, identifier = tcth >> 4, tcth & 15
        if kind >= 2:
            raise ValueError('Invalid htable class.')
        if identifier >= 2:
            raise ValueError('Unsupported htable destination identifier.')
        lengths = readable.read(16)
        values = readable.read(sum(lengths))
        htables[tcth] = HuffmanCachedTable(lengths, values)
    if readable.position != end:
        raise ValueError('Invalid DHT length.')


def _parse_sos(readable, scans):
    n = readable.uint8()
    for i in range(n):
        selector, destinations = readable.parse('>BB')
        dc, ac = destinations >> 4, destinations & 15
        # ACs always have Tc == 1
        scans[selector] = CodingDestination(dc, 16 | ac)
    # start, end, approximation
    readable.skip(3)


def _parse_dri(readable):
    interval = readable.uint16()
    return interval


def _parse_app1(readable, length, rotation):
    end = readable.position + length
    if readable.peek('Exif\0\0'):
        # header, padding
        readable.skip(5 + 1)
        order = readable.uint16()
        # MM
        if order == 0x4d4d:
            uint16, uint32 = readable.uint16, readable.uint32
        # II
        elif order == 0x4949:
            uint16, uint32 = readable.uint16le, readable.uint32le
        else:
            raise ValueError('Invalid byte order.')
        # 42
        readable.skip(2)
        offset = uint32()
        if offset < 8:
            raise ValueError('Invalid IFD0 offset.')
        readable.skip(offset - 8)
        n = uint16()
        # Reading IFD blocks
        for i in range(n):
            tag = uint16()
            # kind, size
            readable.skip(2 + 4)
            # orientation
            if tag == 0x112:
                orientation = uint16()
                if orientation < 1 or orientation > 8:
                    raise ValueError('Invalid orientation value.')
                if orientation == 1:
                    rotation = 0
                elif orientation == 6:
                    rotation = 90
                elif orientation == 3:
                    rotation = 180
                elif orientation == 8:
                    rotation = 270
                else:
                    raise ValueError('Unsupported orientation value.')
                break
            # value
            readable.skip(4)
    readable.jump(end)
    return rotation


def _parse_app14(readable):
    # tag, version, flags0, flags1
    readable.skip(6 + 1 + 2 + 2)
    transform = readable.uint8()
    return transform


class Component(object):
    __slots__ = 'identifier', 'h', 'v', 'destination'

    def __init__(self, identifier, h, v, destination):
        self.identifier, self.h, self.v, self.destination = identifier, h, v, destination


class CodingDestination(object):
    __slots__ = 'dc', 'ac'

    def __init__(self, dc, ac):
        self.dc, self.ac = dc, ac


class HuffmanCachedTable(object):
    def __init__(self, lengths, values):
        self.values = values
        self.offsets = offsets = array('H', [0])
        self.sizes = sizes = bytearray([255]*65536)
        code = index = 0
        size = 1
        for length in lengths:
            offsets.append(code - index)
            for i in range(length):
                hi = code << (16 - size)
                for lo in range(1 << (16 - size)):
                    sizes[hi|lo] = size
                code += 1
            code *= 2
            index += length
            size += 1

    def __str__(self):
        return "offs=%s sz=%s" % (str(self.offsets), len(self.sizes))


def _quantization_table(table, quality):
    quality = max(0, min(quality, 100))
    if quality < 50:
        q = 5000//quality
    else:
        q = 200 - quality*2
    return bytearray([max(1, min((i*q + 50)//100, 255)) for i in table])


def _huffman_table(lengths, values):
    table = [None]*(max(values) + 1)
    code = 0
    i = 0
    size = 1
    for a in lengths:
        for j in range(a):
            table[values[i]] = code, size
            code += 1
            i += 1
        code *= 2
        size += 1
    return table


def _scale_factor(table):
    factor = [0]*64
    factor[0] = table[0]*8
    i = 1
    for z in _z_z:
        factor[z] = table[i]*8
        i += 1
    return factor


def _marker_segment(marker, data):
    return bytes(b'\xff' + marker + pack('>H', len(data) + 2) + data)


class EntropyEncoder(object):
    _codes = [i for j in reversed(range(16)) for i in range(1 << j)]
    """
    Huffman entropy encoder
    Codes data to internal buffer
    """
    def __init__(self):
        s = [j for j in range(1, 16) for i in range(1 << (j - 1))]
        s = [0] + s + list(reversed(s))
        self.sizes = s
        self.value = 0
        self.length = 0
        # This is the storage for output data
        self.data = bytearray()

    def reset(self):
        """
        Reset all the internal state
        """
        s = [j for j in range(1, 16) for i in range(1 << (j - 1))]
        s = [0] + s + list(reversed(s))
        self.sizes = s
        self.value = 0
        self.length = 0
        # This is the storage for output data
        self.data = bytearray()

    def encode(self, previous, block, scale, dc, ac):
        _forward_dct(block)
        for i in range(64):
            block[i] = (((block[i] << 1)//scale[i]) + 1) >> 1
        d = block[0] - previous
        if d == 0:
            self.write(*dc[0])
        else:
            s = self.sizes[d]
            self.write(*dc[s])
            self.write(self._codes[d], s)
        n = 0
        for i in _z_z:
            if block[i] == 0:
                n += 1
            else:
                while n > 15:
                    self.write(*ac[0xf0])
                    n -= 16
                s = self.sizes[block[i]]
                self.write(*ac[n*16 + s])
                self.write(self._codes[block[i]], s)
                n = 0
        if n > 0:
            self.write(*ac[0])
        return block[0]

    def write(self, value, length):
        data = self.data
        value += (self.value << length)
        length += self.length
        while length > 7:
            length -= 8
            v = (value >> length) & 0xff
            if v == 0xff:
                data.append(0xff)
                data.append(0)
            else:
                data.append(v)
        self.value = value & 0xff
        self.length = length

    def dump(self):
        return bytes(self.data)  # TODO python 3: remove bytes


class ReferenceJpeg(object):
    """
    I use this jpeg clas as a reference
    """
    @staticmethod
    def valid(data):
        return data.startswith('\xff\xd8\xff')

    def __init__(self, data):
        self.readable = r = Readable(data)
        self.width, self.height, self.kind, self.n = 0, 0, '', 0
        self.components = []
        self.scans = {}
        self.pixels = None
        self.qtables = {}
        self.htables = {}
        self.reset_interval = 0
        self.rotation = 0
        self.progressive = False
        self.transform, app14 = False, False
        self.ecs = 0
        r.skip(2)  # SOI
        while True:
            marker = r.uint8()
            if marker != 0xff:
                raise ValueError('Invalid marker.')
            while marker == 0xff:
                marker = r.uint8()
            if marker == 0xd9:  # EOI
                raise ValueError('Invalid entropy-coded segment.')
            if 0xd0 <= marker <= 0xd7:  # RST
                raise ValueError('Unexpected RST marker.')
            length = r.uint16() - 2
            if 0xc0 <= marker <= 0xc2:  # SOF0, SOF1, SOF2
                self.width, self.height, self.kind, self.n = _parse_sof(r, self.components)
                self.progressive = marker == 0xc2
                if not app14:
                    self.transform = self.kind == 'rgb'
            elif marker == 0xdb:  # DQT
                _parse_dqt(r, length, self.qtables)
            elif marker == 0xc4:  # DHT
                _parse_dht(r, length, self.htables)
            elif marker == 0xda:  # SOS:
                _parse_sos(r, self.scans)
                self.ecs = r.position
                break
            elif marker == 0xdd:  # DRI
                self.reset_interval = _parse_dri(r)
            elif marker == 0xe1:  # APP1
                self.rotation = _parse_app1(r, length, self.rotation)
            elif marker == 0xee:  # APP14
                self.transform, app14 = _parse_app14(r), True
            elif 0xe0 <= marker <= 0xef or marker == 0xfe:  # APP, COM
                r.skip(length)
            else:
                if marker == 0xc3:  # SOF3
                    raise ValueError('Lossless mode not supported.')
                if 0xc5 <= marker == 0xc7:  # SOF5, SOF6, SOF7
                    raise ValueError('Differential mode not supported.')
                if 0xc8 <= marker == 0xcf:  # JPG, SOF9, SOF10, SOF11, DAC, SOF13, SOF14, SOF15
                    raise ValueError('Arithmetic coding not supported.')
                if marker == 0xdc:  # DNL
                    raise ValueError('Define number of lines not supported.')
                if marker == 0xde:  # DHP
                    raise ValueError('Define hierarchical progression not supported.')
                if marker == 0xdf:  # EXP
                    raise ValueError('Expand reference component(s) not supported.')
                raise ValueError('Unsupported marker.')

    def decompress(self):
        readable = Readable(self.readable.data[self.ecs:])
        data = decompress_impl(self, readable)

        self.pixels = data

        if not readable.peek(b'\xff\xd9'):  # EOI
            raise ValueError('Missing EOI segment.')
        return data

    def decompress_ref(self):
        if not self.components:
            raise ValueError('Missing SOF segment.')
        if not self.scans:
            raise ValueError('Missing SOS segment.')
        if not self.qtables:
            raise ValueError('Missing DQT segment.')
        if not self.htables:
            raise ValueError('Missing DHT segment.')
        if self.progressive:
            raise ValueError('Progressive DCT not supported.')
        self.readable.jump(self.ecs)
        w, h, n = self.width, self.height, len(self.components)
        interval, transform = self.reset_interval, self.transform
        d = EntropyDecoder(self.readable)
        data = bytearray(w * h * n)
        predictions = [0, 0, 0, 0]
        ublock, vblock, kblock = [0] * 64, [0] * 64, [0] * 64
        yblocks = [0] * 64, [0] * 64, [0] * 64, [0] * 64
        blocks = [yblocks, [ublock], [vblock], [kblock]]
        hs = [c.h for c in self.components]
        vs = [c.v for c in self.components]
        qs = [self.qtables[c.destination] for c in self.components]
        dcs = [self.htables[self.scans[c.identifier].dc] for c in self.components]
        acs = [self.htables[self.scans[c.identifier].ac] for c in self.components]
        h0, v0 = hs[0], vs[0]
        hb, vb = h0.bit_length() - 1, v0.bit_length() - 1
        count = 0
        if interval == 0:
            interval = ((w + 8 * h0 - 1) // (8 * h0)) * ((h + 8 * v0 - 1) // (8 * v0))
        for y in range(0, h, 8 * v0):
            for x in range(0, w, 8 * h0):
                count += 1
                if count > interval:
                    d.restart()
                    predictions[:] = [0, 0, 0, 0]
                    count = 1
                for i in range(n):
                    for j in range(hs[i] * vs[i]):
                        predictions[i] = d.decode_and_dct(predictions[i], blocks[i][j], qs[i], dcs[i], acs[i])
                for sy in range(v0):
                    for sx in range(h0):
                        yblock = yblocks[sx + sy * h0]
                        for by in range(min(8, h - y - sy * 8)):
                            for bx in range(min(8, w - x - sx * 8)):
                                i = ((sx * 8 + bx) >> hb) + ((sy * 8 + by) >> vb) * 8
                                j = (x + sx * 8 + bx + (y + sy * 8 + by) * w) * n
                                if n == 1:
                                    data[j] = clamp(yblock[i] + 128)
                                elif n == 3:
                                    t, u, v = yblock[bx + by * 8], ublock[i], vblock[i]
                                    t = (t << 16) + 8421376
                                    data[j] = clamp((t + 91881 * v) >> 16)
                                    data[j + 1] = clamp((t - 22554 * u - 46802 * v) >> 16)
                                    data[j + 2] = clamp((t + 116130 * u) >> 16)
                                else:  # n == 4
                                    t, u, v, k = yblock[bx + by * 8], ublock[i], vblock[i], kblock[i]
                                    if transform:
                                        t = (t << 16) + 8421376
                                        data[j] = 255 - clamp((t + 91881 * v) >> 16)
                                        data[j + 1] = 255 - clamp((t - 22554 * u - 46802 * v) >> 16)
                                        data[j + 2] = 255 - clamp((t + 116130 * u) >> 16)
                                        data[j + 3] = clamp(k + 128)
                                    else:
                                        data[j] = clamp(t + 128)
                                        data[j + 1] = clamp(u + 128)
                                        data[j + 2] = clamp(v + 128)
                                        data[j + 3] = clamp(k + 128)
        if not self.readable.peek(b'\xff\xd9'):  # EOI
            raise ValueError('Missing EOI segment.')

        self.pixels = data
        return data


def serialize_scanlines(image, quality, default_tables=True):
    """
    Serializes scanlines using default tables
    :param image:JpegFile with decoded pixel data
    :param quality:int quality level, in percents
    :return:bytearray with encoded scanlines
    """
    if image.kind not in ('g', 'rgb', 'cmyk'):
        raise ValueError('Invalid image kind.')

    w, h, n = image.width, image.height, image.n

    if image.pixels is None:
        raise ValueError('Image contains no pixel data')

    if w == 0 or h == 0:
        raise ValueError('Image has wrong size: %dx%d' % (w, h))

    ydc = udc = vdc = kdc = 0
    # This one serializes using standard huffman table
    yblock, ublock, vblock, kblock = [0] * 64, [0] * 64, [0] * 64, [0] * 64
    # TODO: We should able to use tables from JpegFile
    lq = _quantization_table(_luminance_quantization, quality)
    ld = _huffman_table(_lum_dc_code_length, _lum_dc_symbols)
    la = _huffman_table(_lum_ac_code_length, _lum_ac_symbols)
    ls = _scale_factor(lq)

    if n == 3:
        cq = _quantization_table(_chrominance_quantization, quality)
        cd = _huffman_table(_chm_dc_codelens, _chm_dc_symbols)
        ca = _huffman_table(_ca_lengths, _ca_values)
        cs = _scale_factor(cq)

    encoder = EntropyEncoder()

    data = image.pixels
    # For each block
    for y in range(0, h, 8):
        for x in range(0, w, 8):
            # For each pixel in the block - generate contents for the block
            # BTW, if we have just unpacked jpeg, we could keep this blocks there
            i = 0
            for yy in range(y, y + 8):
                for xx in range(x, x + 8):
                    j = (min(xx, w - 1) + min(yy, h - 1) * w) * n
                    if n == 1:
                        yblock[i] = data[j]
                    elif n == 3:
                        r, g, b = data[j], data[j + 1], data[j + 2]
                        yblock[i] = (19595 * r + 38470 * g + 7471 * b + 32768) >> 16
                        ublock[i] = (-11056 * r - 21712 * g + 32768 * b + 8421376) >> 16
                        vblock[i] = (32768 * r - 27440 * g - 5328 * b + 8421376) >> 16
                    else:  # n == 4
                        yblock[i] = data[j]
                        ublock[i] = data[j + 1]
                        vblock[i] = data[j + 2]
                        kblock[i] = data[j + 3]
                    i += 1
            ydc = encoder.encode(ydc, yblock, ls, ld, la)
            if n == 3:
                udc = encoder.encode(udc, ublock, cs, cd, ca)
                vdc = encoder.encode(vdc, vblock, cs, cd, ca)
            elif n == 4:
                udc = encoder.encode(udc, ublock, ls, ld, la)
                vdc = encoder.encode(vdc, vblock, ls, ld, la)
                kdc = encoder.encode(kdc, kblock, ls, ld, la)

    encoder.write(0x7f, 7)  # padding
    return encoder.dump()


def serialize(image, quality):
    """
    Serializes JPEG to a bytearray using standard MJPEG tables
    It can be dumped to jpeg file directly
    :param image:JpegFile or ReferenceJpeg with decoded image data
    :param quality:int quality, in percents
    :return:bytes serialized image
    """
    if image.kind not in ('g', 'rgb', 'cmyk'):
        raise ValueError('Invalid image kind.')

    w, h, n = image.width, image.height, len(image.components)
    data = serialize_scanlines(image, quality)

    lq = _quantization_table(_luminance_quantization, quality)
    ld = _huffman_table(_lum_dc_code_length, _lum_dc_symbols)
    la = _huffman_table(_lum_ac_code_length, _lum_ac_symbols)
    ls = _scale_factor(lq)
    if n == 3:
        cq = _quantization_table(_chrominance_quantization, quality)
        cd = _huffman_table(_chm_dc_codelens, _chm_dc_symbols)
        ca = _huffman_table(_ca_lengths, _ca_values)
        cs = _scale_factor(cq)

    app = b'Adobe\0\144\200\0\0\0\0'  # tag, version, flags0, flags1, transform
    sof = b'\10' + pack('>HHB', h, w, n) + b'\1\21\0'  # depth, id, sampling, qtable
    sos = pack('B', n) + b'\1\0'  # id, htable
    dqt = b'\0' + lq
    dht = b'\0' + _lum_dc_code_length + _lum_dc_symbols + b'\20' + _lum_ac_code_length + _lum_ac_symbols
    if n == 3:
        sof += b'\2\21\1\3\21\1'
        sos += b'\2\21\3\21'
        dqt += b'\1' + cq
        dht += b'\1' + _chm_dc_codelens + _chm_dc_symbols + b'\21' + _ca_lengths + _ca_values
    elif n == 4:
        sof += b'\2\21\0\3\21\0\4\21\0'
        sos += b'\2\0\3\0\4\0'
    sos += b'\0\77\0'  # start, end, approximation

    output = BytesIO()
    output.write(b'\xff\xd8')  # SOI
    if n == 4:
        output.write(_marker_segment(b'\xee', app))
    output.write(_marker_segment(b'\xdb', dqt))
    output.write(_marker_segment(b'\xc0', sof))
    output.write(_marker_segment(b'\xc4', dht))
    output.write(_marker_segment(b'\xda', sos))
    output.write(data)
    output.write(b'\xff\xd9')  # EOI
    return output.getvalue()