BaseJpegDecode.py

MCUの垂直サンプリングファクタを修正する。

#!/usr/bin/env python
# coding:utf-8
# BaseJpegDecode.py 2012.10.3
import abc
import logging
from collections import Counter

class BitPattern:
    """MSB-first bit buffer: `size` valid bits stored in the low end of `data`.

    New bits are appended below the existing ones by put(); peek() and get()
    read from the oldest (most significant) end.
    """

    def __init__(self, data=0, size=0):
        self.data = data
        self.size = size

    def clear(self):
        """Discard every buffered bit."""
        self.data, self.size = 0, 0

    def put(self, c, size=8):
        """Append the `size`-bit value `c` behind the bits already buffered.

        Raises ValueError (after logging the buffer state) when the buffer
        holds more than 32 bits once the new bits have been added.
        """
        self.data = (self.data << size) | c
        self.size = self.size + size
        if self.size <= 32:
            return
        logging.error("%08X %d" % (self.data, self.size))
        raise ValueError('over flow 32bit')

    def peek(self, size):
        """Return the oldest `size` bits without consuming them."""
        remaining = self.size - size
        return self.data >> remaining

    def get(self, size):
        """Remove the oldest `size` bits from the buffer and return them."""
        head = self.peek(size)
        self.size -= size
        keep_mask = (1 << self.size) - 1
        self.data &= keep_mask
        return head

    def match(self, b):
        """Tell whether the buffer starts with the bit pattern `b`.

        Returns False when `b` is longer than the buffered data.
        """
        width = b.size
        if width > self.size:
            return False
        return self.peek(width) == b.peek(width)

class Huff:
    """One Huffman table entry.

    run        -- upper nibble of the decoded symbol byte
    value_size -- lower nibble of the decoded symbol byte
    code       -- the code word that selects this entry
    """

    def __init__(self, run, value_size, code):
        self.run, self.value_size, self.code = run, value_size, code

class HuffmanDecode(object):
    """Huffman tables read from DHT segments, stored per (Tc, Th) pair."""

    def __init__(self):
        # (tc, th) -> list of Huff entries in the order they were appended
        self._ht = {}

    def _ht_clear(self, tc, th):
        """Start a new, empty table for (tc, th)."""
        self._ht[(tc,th)] = []

    def _ht_append(self, tc, th, huff):
        """Add one entry at the end of the table for (tc, th)."""
        self._ht[(tc,th)].append(huff)

    def inputDHT(self, buf):
        """Parse the payload of a DHT segment; it may define several tables.

        buf -- sequence of one-character strings (the segment without its
               marker and length field).
        """
        offset = 0
        total = len(buf)
        while offset < total:
            header = ord(buf[offset])
            tc, th = header >> 4, header & 0x0f
            logging.info("DHT: Tc=%d Th=%d" %(tc, th))
            self._ht_clear(tc, th)
            counts_at = offset + 1  # 16 per-length counts follow the header
            offset += 17            # symbol bytes start after the counts
            code = 0x0000
            for bits in range(1, 17):
                count = ord(buf[counts_at + bits - 1])
                for _ in range(count):
                    symbol = ord(buf[offset])
                    entry = Huff(symbol >> 4, symbol & 0x0f,
                                 BitPattern(code, bits))
                    self._ht_append(tc, th, entry)
                    offset += 1
                    code += 1
                # codes of the next length continue from here, one bit longer
                code <<= 1

    def Lookup(self, tc, th, bitpat):
        """Find the table entry whose code word starts `bitpat`.

        Returns None as soon as an entry needs more bits than `bitpat` holds.
        Raises ValueError when every entry was tried and none matched.
        """
        for entry in self._ht[(tc,th)]:
            pattern = entry.code
            if pattern.size > bitpat.size:
                return None
            if bitpat.match(pattern):
                return entry
        logging.error("(%d,%d)%08X %d" % (tc, th, bitpat.data, bitpat.size))
        raise ValueError('Huffman decode error')

    def getValue(self, huff, bitpat):
        """Consume `huff.value_size` bits from `bitpat` and return them signed.

        A bit group whose top bit is set is returned unchanged; otherwise
        (2**value_size - 1) is subtracted, giving a negative number.
        Returns 0 without consuming anything when value_size is 0.
        """
        nbits = huff.value_size
        if nbits == 0:
            return 0
        raw = bitpat.get(nbits)
        if raw & (1 << (nbits - 1)):
            return raw
        return raw - ((1 << nbits) - 1)

class BaseJpegDecode(object):
    """Streaming entropy decoder for baseline JPEG, fed one character at a time.

    Call input() for every character of the file. Decoded coefficients and
    markers are handed to the abstract output* methods, which a subclass
    must implement.

    Layout assumptions hard-wired below: the first frame component has
    sampling factors 0x22 or 0x21 (4 or 2 luminance blocks per MCU), each
    MCU ends with exactly two further blocks (Cb, Cr), and Huffman table 0
    is used for luminance blocks and table 1 for the two chroma blocks.

    Parser states kept in self._seq:
      0  waiting for 0xFF            5  second length byte
      1  expecting SOI (0xD8)        6  collecting the segment payload
      2  waiting for 0xFF of marker  7  entropy-coded scan data
      3  marker code                 8  character following 0xFF in the scan
      4  first length byte           9  after EOI, input is ignored
    """
    __metaclass__ = abc.ABCMeta

    def __init__(self):
        self._hd = HuffmanDecode()
        self._seq = 0

    def clear(self):
        """Reset the marker parser so that a new stream can be fed.

        Only the parser state is reset; the Huffman tables are kept.
        """
        self._seq = 0

    @abc.abstractmethod
    def outputDC(self, mcu, block, value):
        """Receive the DC value (difference plus predictor) of one block."""
        pass

    @abc.abstractmethod
    def outputAC(self, mcu, block, scan, value):
        """Receive one AC value; `scan` is its position in the block (from 1)."""
        pass

    @abc.abstractmethod
    def outputMARK(self, c):
        """Receive the marker code character `c` of a marker that was seen."""
        pass

    def _inputScan(self, c):
        """Feed one character of scan data and emit every completed symbol.

        c -- one-character string (byte stuffing already removed by input()).
        """
        self._bitpat.put(ord(c))
        while self._bitpat.size > 0:
            tc = 0 if self._scan == 0 else 1 # 0:DC 1:AC
            if self._block < self._yblock: # 2 or 4
                th = 0 # Y
                comp = 0
            else:
                th = 1 # CbCr
                # Cb and Cr share a Huffman table but each component has
                # its own DC predictor, so track them separately.
                comp = self._block - self._yblock + 1 # 1:Cb 2:Cr
            if self._huff is None:
                self._huff = self._hd.Lookup(tc, th, self._bitpat)
                if self._huff is None:
                    break # code word incomplete, wait for the next byte
                self._bitpat.get(self._huff.code.size) # skip code
            if self._huff.value_size > self._bitpat.size:
                break # symbol is kept in self._huff until its bits arrive
            value = self._hd.getValue(self._huff, self._bitpat)
            if self._scan == 0: # DC
                value += self._old_DC_value[comp]
                self.outputDC(self._mcu, self._block, value)
                self._old_DC_value[comp] = value
                self._scan += 1
            else: # AC
                if self._huff.run == 0 and self._huff.value_size == 0: # EOB
                    self._scan = 64
                else:
                    for i in range(self._huff.run):
                        self.outputAC(self._mcu, self._block, self._scan, 0)
                        self._scan += 1
                    self.outputAC(self._mcu, self._block, self._scan, value)
                    self._scan += 1
                if self._scan >= 64:
                    self._scan = 0
                    self._block += 1
                    if self._block >= (self._yblock+2): # 4 or 6
                        self._block = 0
                        self._mcu += 1
            self._huff = None

    def _restart(self):
        """Reset block position, DC predictors and bit buffer (scan start, RSTx)."""
        self._block = 0
        self._scan = 0
        self._old_DC_value = Counter() # missing keys read as 0
        self._bitpat = BitPattern()
        self._huff = None

    def _inputSOF(self, buf):
        """Read image size and luminance sampling from an SOF0 payload.

        Raises ValueError when the sampling byte of the first component is
        neither 0x22 nor 0x21.
        """
        buf = [ord(ch) for ch in buf]
        self.height = (buf[1]<<8) + buf[2]
        self.width = (buf[3]<<8) + buf[4]
        logging.info("SOF: width=%d height=%d" % (self.width, self.height))
        if buf[7] == 0x22:
            self._yblock = 4
        elif buf[7] == 0x21:
            self._yblock = 2
        else:
            s = ",".join(["%02X" % c for c in buf[5:]])
            logging.error(s)
            raise ValueError('SOF error')

    def _inputSOS(self, buf):
        """Log the SOS payload; its contents are not otherwise used."""
        buf = [ord(ch) for ch in buf]
        s = ",".join(["%02X" % c for c in buf])
        logging.info("SOS: "+ s)

    def _endSegment(self):
        """Handle the fully buffered marker segment and select the next state."""
        if self._mark == '\xc4': # DHT
            self._hd.inputDHT(self._buf)
        if self._mark == '\xc0': # SOF0
            self._inputSOF(self._buf)
        if self._mark == '\xda': # SOS
            self._inputSOS(self._buf)
            self._mcu = 0
            self._restart()
            self._seq = 7
        else:
            self._seq = 2

    def input(self, c):
        """Advance the decoder by one character `c` of the JPEG stream."""
        if self._seq == 0:
            if c == '\xff':
                self._seq += 1
        elif self._seq == 1:
            if c == '\xd8': # SOI
                self._seq += 1
                self.outputMARK(c)
            else:
                self._seq -= 1
        elif self._seq == 2:
            if c == '\xff':
                self._seq += 1
        elif self._seq == 3:
            self.outputMARK(c)
            self._mark = c
            self._seq += 1
        elif self._seq == 4:
            self._skip = ord(c) << 8
            self._seq += 1
        elif self._seq == 5:
            self._skip += ord(c)
            self._skip -= 2 # the length field counts its own two bytes
            self._buf = ""
            if self._skip > 0:
                self._seq += 1
            else:
                # Empty payload: finish now instead of swallowing the
                # first character that follows the segment.
                self._endSegment()
        elif self._seq == 6:
            self._buf += c
            self._skip -= 1
            if self._skip > 0:
                return
            self._endSegment()
        elif self._seq == 7:
            if c == '\xff':
                self._seq += 1
            else:
                self._inputScan(c)
        elif self._seq == 8:
            if c == '\x00': # stuffed 0xFF data byte
                self._inputScan('\xff')
                self._seq -= 1
            elif c in '\xd0\xd1\xd2\xd3\xd4\xd5\xd6\xd7': # RSTx
                self._restart()
                self._seq -= 1
            elif c == '\xd9': # EOI
                self.outputMARK(c)
                self._seq += 1
            else:
                self.outputMARK(c)
                self._seq = 0
        else:
            # state 9 (after EOI) or anything unexpected: ignore input
            pass


# Demo: decode every JPEG file named on the command line and print its
# markers and a hex dump derived from the luminance DC values.
if __name__ == "__main__":
    #logging.basicConfig(level=logging.INFO)

    # Decoder that prints luminance DC values and ignores AC coefficients.
    class DemoJpeg(BaseJpegDecode):
        def __init__(self):
            super(DemoJpeg, self).__init__()

        # Print DC values of the luminance blocks as two-digit hex numbers.
        # A line break is emitted after the last MCU of a row, a row being
        # taken as width/16 MCUs (Python 2 integer division).
        def outputDC(self, mcu, block, value):
            if self._yblock == 2:
                # Two luminance blocks per MCU: print each one, offset by 128.
                if block <= 1:
                    # The trailing comma keeps the output on the same line.
                    print "%02X" % (value+128),
                    if block == 1:
                        if (mcu % (self.width/16)) == (self.width/16)-1:
                            print ""
                # Blocks 2 and 3 (chroma) are not printed.
                return
            # Otherwise: sum the four luminance blocks (each offset by 512)
            # and print one number per MCU, the sum divided by 16.
            if block == 0:
                self._value = 0
            if block <= 3:
                self._value += (value+512)
                if block == 3:
                    print("%02X" % (self._value/16)),
                    if (mcu % (self.width/16)) == (self.width/16)-1:
                        print ""

        # AC coefficients are not used by the demo.
        def outputAC(self, mcu, block, scan, value):
            pass

        # Print every marker code reported by the decoder.
        def outputMARK(self, c):
            print("MARK: %02X" % ord(c))

    import argparse
    parser = argparse.ArgumentParser()
    parser.add_argument('infiles', nargs='*')
    args = parser.parse_args()

    # One decoder instance is reused for all files.
    jpeg = DemoJpeg()

    for filename in args.infiles:
        with open(filename, "rb") as f:
            data = f.read()
        print("%s %d" % (filename, len(data)))
        # clear() resets the marker parser before the next file is fed.
        jpeg.clear()
        # Feed the file one character at a time.
        for c in data:
            jpeg.input(c)