alpcentaur
/
basabuuka_prototyp

#!/usr/bin/env python3
import sysimport ioimport structfrom .cmapdb import CMapDB, CMapParser, FileUnicodeMap, CMapfrom .encodingdb import EncodingDB, name2unicodefrom .psparser import PSStackParserfrom .psparser import PSEOFfrom .psparser import LIT, KWD, handle_errorfrom .psparser import PSLiteral, literal_namefrom .pdftypes import (PDFException, resolve1, int_value, num_value, list_value, dict_value,    stream_value)from .fontmetrics import FONT_METRICSfrom .utils import apply_matrix_norm, nunpack, choplist

def get_widths(seq):    widths = {}    r = []    for v in seq:        if isinstance(v, list):            if r:                char1 = r[-1]                for (i,w) in enumerate(v):                    widths[char1+i] = w                r = []        elif isinstance(v, int):            r.append(v)            if len(r) == 3:                (char1,char2,w) = r                for i in range(char1, char2+1):                    widths[i] = w                r = []    return widths#assert get_widths([1]) == {}#assert get_widths([1,2,3]) == {1:3, 2:3}#assert get_widths([1,[2,3],6,[7,8]]) == {1:2,2:3, 6:7,7:8}
def get_widths2(seq):    widths = {}    r = []    for v in seq:        if isinstance(v, list):            if r:                char1 = r[-1]                for (i,(w,vx,vy)) in enumerate(choplist(3,v)):                    widths[char1+i] = (w,(vx,vy))                r = []        elif isinstance(v, int):            r.append(v)            if len(r) == 5:                (char1,char2,w,vx,vy) = r                for i in range(char1, char2+1):                    widths[i] = (w,(vx,vy))                r = []    return widths#assert get_widths2([1]) == {}#assert get_widths2([1,2,3,4,5]) == {1:(3,(4,5)), 2:(3,(4,5))}#assert get_widths2([1,[2,3,4,5],6,[7,8,9]]) == {1:(2,(3,4)), 6:(7,(8,9))}

class FontMetricsDB:
    @classmethod    def get_metrics(klass, fontname):        return FONT_METRICS[fontname]

class Type1FontHeaderParser(PSStackParser):
    KEYWORD_BEGIN = KWD('begin')    KEYWORD_END = KWD('end')    KEYWORD_DEF = KWD('def')    KEYWORD_PUT = KWD('put')    KEYWORD_DICT = KWD('dict')    KEYWORD_ARRAY = KWD('array')    KEYWORD_READONLY = KWD('readonly')    KEYWORD_FOR = KWD('for')    KEYWORD_FOR = KWD('for')
    def __init__(self, data):        PSStackParser.__init__(self, data)        self._cid2unicode = {}
    def get_encoding(self):        while 1:            try:                (cid,name) = self.nextobject()            except PSEOF:                break            try:                self._cid2unicode[cid] = name2unicode(name)            except KeyError:                pass        return self._cid2unicode        def do_keyword(self, pos, token):        if token is self.KEYWORD_PUT:            ((_,key),(_,value)) = self.pop(2)            if (isinstance(key, int) and                isinstance(value, PSLiteral)):                self.add_results((key, literal_name(value)))
    ##  CFFFont##  (Format specified in Adobe Technical Note: #5176##   "The Compact Font Format Specification")##NIBBLES = ('0','1','2','3','4','5','6','7','8','9','.','e','e-',None,'-')def getdict(data):    d = {}    fp = io.BytesIO(data)    stack = []    while 1:        c = fp.read(1)        if not c: break        b0 = ord(c)        if b0 <= 21:            d[b0] = stack            stack = []            continue        if b0 == 30:            s = ''            loop = True            while loop:                b = ord(fp.read(1))                for n in (b >> 4, b & 15):                    if n == 15:                        loop = False                    else:                        s += NIBBLES[n]            value = float(s)        elif 32 <= b0 and b0 <= 246:            value = b0-139        else:            b1 = ord(fp.read(1))            if 247 <= b0 and b0 <= 250:                value = ((b0-247)<<8)+b1+108            elif 251 <= b0 and b0 <= 254:                value = -((b0-251)<<8)-b1-108            else:                b2 = ord(fp.read(1))                if 128 <= b1: b1 -= 256                if b0 == 28:                    value = b1<<8 | b2                else:                    value = b1<<24 | b2<<16 | struct.unpack('>H', fp.read(2))[0]        stack.append(value)    return d
class CFFFont:
    STANDARD_STRINGS = (      '.notdef', 'space', 'exclam', 'quotedbl', 'numbersign',      'dollar', 'percent', 'ampersand', 'quoteright', 'parenleft',      'parenright', 'asterisk', 'plus', 'comma', 'hyphen', 'period',      'slash', 'zero', 'one', 'two', 'three', 'four', 'five', 'six',      'seven', 'eight', 'nine', 'colon', 'semicolon', 'less', 'equal',      'greater', 'question', 'at', 'A', 'B', 'C', 'D', 'E', 'F', 'G',      'H', 'I', 'J', 'K', 'L', 'M', 'N', 'O', 'P', 'Q', 'R', 'S', 'T',      'U', 'V', 'W', 'X', 'Y', 'Z', 'bracketleft', 'backslash',      'bracketright', 'asciicircum', 'underscore', 'quoteleft', 'a',      'b', 'c', 'd', 'e', 'f', 'g', 'h', 'i', 'j', 'k', 'l', 'm', 'n',      'o', 'p', 'q', 'r', 's', 't', 'u', 'v', 'w', 'x', 'y', 'z',      'braceleft', 'bar', 'braceright', 'asciitilde', 'exclamdown',      'cent', 'sterling', 'fraction', 'yen', 'florin', 'section',      'currency', 'quotesingle', 'quotedblleft', 'guillemotleft',      'guilsinglleft', 'guilsinglright', 'fi', 'fl', 'endash',      'dagger', 'daggerdbl', 'periodcentered', 'paragraph', 'bullet',      'quotesinglbase', 'quotedblbase', 'quotedblright',      'guillemotright', 'ellipsis', 'perthousand', 'questiondown',      'grave', 'acute', 'circumflex', 'tilde', 'macron', 'breve',      'dotaccent', 'dieresis', 'ring', 'cedilla', 'hungarumlaut',      'ogonek', 'caron', 'emdash', 'AE', 'ordfeminine', 'Lslash',      'Oslash', 'OE', 'ordmasculine', 'ae', 'dotlessi', 'lslash',      'oslash', 'oe', 'germandbls', 'onesuperior', 'logicalnot', 'mu',      'trademark', 'Eth', 'onehalf', 'plusminus', 'Thorn',      'onequarter', 'divide', 'brokenbar', 'degree', 'thorn',      'threequarters', 'twosuperior', 'registered', 'minus', 'eth',      'multiply', 'threesuperior', 'copyright', 'Aacute',      'Acircumflex', 'Adieresis', 'Agrave', 'Aring', 'Atilde',      'Ccedilla', 'Eacute', 'Ecircumflex', 'Edieresis', 'Egrave',      'Iacute', 'Icircumflex', 'Idieresis', 'Igrave', 'Ntilde',      'Oacute', 'Ocircumflex', 'Odieresis', 'Ograve', 'Otilde',      'Scaron', 'Uacute', 'Ucircumflex', 'Udieresis', 'Ugrave',      'Yacute', 'Ydieresis', 'Zcaron', 'aacute', 'acircumflex',      'adieresis', 'agrave', 'aring', 'atilde', 'ccedilla', 'eacute',      'ecircumflex', 'edieresis', 'egrave', 'iacute', 'icircumflex',      'idieresis', 'igrave', 'ntilde', 'oacute', 'ocircumflex',      'odieresis', 'ograve', 'otilde', 'scaron', 'uacute',      'ucircumflex', 'udieresis', 'ugrave', 'yacute', 'ydieresis',      'zcaron', 'exclamsmall', 'Hungarumlautsmall', 'dollaroldstyle',      'dollarsuperior', 'ampersandsmall', 'Acutesmall',      'parenleftsuperior', 'parenrightsuperior', 'twodotenleader',      'onedotenleader', 'zerooldstyle', 'oneoldstyle', 'twooldstyle',      'threeoldstyle', 'fouroldstyle', 'fiveoldstyle', 'sixoldstyle',      'sevenoldstyle', 'eightoldstyle', 'nineoldstyle',      'commasuperior', 'threequartersemdash', 'periodsuperior',      'questionsmall', 'asuperior', 'bsuperior', 'centsuperior',      'dsuperior', 'esuperior', 'isuperior', 'lsuperior', 'msuperior',      'nsuperior', 'osuperior', 'rsuperior', 'ssuperior', 'tsuperior',      'ff', 'ffi', 'ffl', 'parenleftinferior', 'parenrightinferior',      'Circumflexsmall', 'hyphensuperior', 'Gravesmall', 'Asmall',      'Bsmall', 'Csmall', 'Dsmall', 'Esmall', 'Fsmall', 'Gsmall',      'Hsmall', 'Ismall', 'Jsmall', 'Ksmall', 'Lsmall', 'Msmall',      'Nsmall', 'Osmall', 'Psmall', 'Qsmall', 'Rsmall', 'Ssmall',      'Tsmall', 'Usmall', 'Vsmall', 'Wsmall', 'Xsmall', 'Ysmall',      'Zsmall', 'colonmonetary', 'onefitted', 'rupiah', 'Tildesmall',      'exclamdownsmall', 'centoldstyle', 'Lslashsmall', 'Scaronsmall',      'Zcaronsmall', 'Dieresissmall', 'Brevesmall', 'Caronsmall',      'Dotaccentsmall', 'Macronsmall', 'figuredash', 'hypheninferior',      'Ogoneksmall', 'Ringsmall', 'Cedillasmall', 'questiondownsmall',      'oneeighth', 'threeeighths', 'fiveeighths', 'seveneighths',      'onethird', 'twothirds', 'zerosuperior', 'foursuperior',      'fivesuperior', 'sixsuperior', 'sevensuperior', 'eightsuperior',      'ninesuperior', 'zeroinferior', 'oneinferior', 'twoinferior',      'threeinferior', 'fourinferior', 'fiveinferior', 'sixinferior',      'seveninferior', 'eightinferior', 'nineinferior',      'centinferior', 'dollarinferior', 'periodinferior',      'commainferior', 'Agravesmall', 'Aacutesmall',      'Acircumflexsmall', 'Atildesmall', 'Adieresissmall',      'Aringsmall', 'AEsmall', 'Ccedillasmall', 'Egravesmall',      'Eacutesmall', 'Ecircumflexsmall', 'Edieresissmall',      'Igravesmall', 'Iacutesmall', 'Icircumflexsmall',      'Idieresissmall', 'Ethsmall', 'Ntildesmall', 'Ogravesmall',      'Oacutesmall', 'Ocircumflexsmall', 'Otildesmall',      'Odieresissmall', 'OEsmall', 'Oslashsmall', 'Ugravesmall',      'Uacutesmall', 'Ucircumflexsmall', 'Udieresissmall',      'Yacutesmall', 'Thornsmall', 'Ydieresissmall', '001.000',      '001.001', '001.002', '001.003', 'Black', 'Bold', 'Book',      'Light', 'Medium', 'Regular', 'Roman', 'Semibold',      )
    class INDEX:
        def __init__(self, fp):            self.fp = fp            self.offsets = []            (count, offsize) = struct.unpack(b'>HB', self.fp.read(3))            for i in range(count+1):                self.offsets.append(nunpack(self.fp.read(offsize)))            self.base = self.fp.tell()-1            self.fp.seek(self.base+self.offsets[-1])
        def __repr__(self):            return '<INDEX: size=%d>' % len(self)
        def __len__(self):            return len(self.offsets)-1
        def __getitem__(self, i):            self.fp.seek(self.base+self.offsets[i])            return self.fp.read(self.offsets[i+1]-self.offsets[i])
        def __iter__(self):            return iter( self[i] for i in range(len(self)) )
    def __init__(self, name, fp):        self.name = name        self.fp = fp        # Header        (_major,_minor,hdrsize,offsize) = struct.unpack(b'BBBB', self.fp.read(4))        self.fp.read(hdrsize-4)        # Name INDEX        self.name_index = self.INDEX(self.fp)        # Top DICT INDEX        self.dict_index = self.INDEX(self.fp)        # String INDEX        self.string_index = self.INDEX(self.fp)        # Global Subr INDEX        self.subr_index = self.INDEX(self.fp)        # Top DICT DATA        self.top_dict = getdict(self.dict_index[0])        (charset_pos,) = self.top_dict.get(15, [0])        (encoding_pos,) = self.top_dict.get(16, [0])        (charstring_pos,) = self.top_dict.get(17, [0])        # CharStrings        self.fp.seek(charstring_pos)        self.charstring = self.INDEX(self.fp)        self.nglyphs = len(self.charstring)        # Encodings        self.code2gid = {}        self.gid2code = {}        self.fp.seek(encoding_pos)        format = self.fp.read(1)        if format == b'\x00':            # Format 0            (n,) = struct.unpack(b'B', self.fp.read(1))            for (code,gid) in enumerate(struct.unpack(b'B'*n, self.fp.read(n))):                self.code2gid[code] = gid                self.gid2code[gid] = code        elif format == b'\x01':            # Format 1            (n,) = struct.unpack(b'B', self.fp.read(1))            code = 0            for i in range(n):                (first,nleft) = struct.unpack(b'BB', self.fp.read(2))                for gid in range(first,first+nleft+1):                    self.code2gid[code] = gid                    self.gid2code[gid] = code                    code += 1        else:            raise ValueError('unsupported encoding format: %r' % format)        # Charsets        self.name2gid = {}        self.gid2name = {}        self.fp.seek(charset_pos)        format = self.fp.read(1)        if format == '\x00':            # Format 0            n = self.nglyphs-1            for (gid,sid) in enumerate(struct.unpack(b'>'+b'H'*n, self.fp.read(2*n))):                gid += 1                name = self.getstr(sid)                self.name2gid[name] = gid                self.gid2name[gid] = name        elif format == '\x01':            # Format 1            (n,) = struct.unpack(b'B', self.fp.read(1))            sid = 0            for i in range(n):                (first,nleft) = struct.unpack(b'BB', self.fp.read(2))                for gid in range(first,first+nleft+1):                    name = self.getstr(sid)                    self.name2gid[name] = gid                    self.gid2name[gid] = name                    sid += 1        elif format == '\x02':            # Format 2            assert 0        else:            raise ValueError('unsupported charset format: %r' % format)        #print self.code2gid        #print self.name2gid        #assert 0
    def getstr(self, sid):        if sid < len(self.STANDARD_STRINGS):            return self.STANDARD_STRINGS[sid]        return self.string_index[sid-len(self.STANDARD_STRINGS)]

class TrueTypeFont:
    class CMapNotFound(Exception): pass
    def __init__(self, name, fp):        self.name = name        self.fp = fp        self.tables = {}        self.fonttype = fp.read(4)        (ntables, _1, _2, _3) = struct.unpack(b'>HHHH', fp.read(8))        for _ in range(ntables):            (name, tsum, offset, length) = struct.unpack(b'>4sLLL', fp.read(16))            self.tables[name] = (offset, length)
    def create_unicode_map(self):        if 'cmap' not in self.tables:            raise TrueTypeFont.CMapNotFound        (base_offset, length) = self.tables['cmap']        fp = self.fp        fp.seek(base_offset)        (version, nsubtables) = struct.unpack(b'>HH', fp.read(4))        subtables = []        for i in range(nsubtables):            subtables.append(struct.unpack(b'>HHL', fp.read(8)))        char2gid = {}        # Only supports subtable type 0, 2 and 4.        for (_1, _2, st_offset) in subtables:            fp.seek(base_offset+st_offset)            (fmttype, fmtlen, fmtlang) = struct.unpack(b'>HHH', fp.read(6))            if fmttype == 0:                char2gid.update(enumerate(struct.unpack(b'>256B', fp.read(256))))            elif fmttype == 2:                subheaderkeys = struct.unpack(b'>256H', fp.read(512))                firstbytes = [0]*8192                for (i,k) in enumerate(subheaderkeys):                    firstbytes[k/8] = i                nhdrs = max(subheaderkeys)/8 + 1                hdrs = []                for i in range(nhdrs):                    (firstcode,entcount,delta,offset) = struct.unpack(b'>HHhH', fp.read(8))                    hdrs.append((i,firstcode,entcount,delta,fp.tell()-2+offset))                for (i,firstcode,entcount,delta,pos) in hdrs:                    if not entcount: continue                    first = firstcode + (firstbytes[i] << 8)                    fp.seek(pos)                    for c in range(entcount):                        gid = struct.unpack(b'>H', fp.read(2))                        if gid:                            gid += delta                        char2gid[first+c] = gid            elif fmttype == 4:                (segcount, _1, _2, _3) = struct.unpack(b'>HHHH', fp.read(8))                segcount /= 2                ecs = struct.unpack(b'>%dH' % segcount, fp.read(2*segcount))                fp.read(2)                scs = struct.unpack(b'>%dH' % segcount, fp.read(2*segcount))                idds = struct.unpack(b'>%dh' % segcount, fp.read(2*segcount))                pos = fp.tell()                idrs = struct.unpack(b'>%dH' % segcount, fp.read(2*segcount))                for (ec,sc,idd,idr) in zip(ecs, scs, idds, idrs):                    if idr:                        fp.seek(pos+idr)                        for c in range(sc, ec+1):                            char2gid[c] = (struct.unpack(b'>H', fp.read(2))[0] + idd) & 0xffff                    else:                        for c in range(sc, ec+1):                            char2gid[c] = (c + idd) & 0xffff            else:                assert 0        # create unicode map        unicode_map = FileUnicodeMap()        for (char,gid) in char2gid.items():            unicode_map.add_cid2unichr(gid, char)        return unicode_map

##  Fonts##
class PDFFontError(PDFException): passclass PDFUnicodeNotDefined(PDFFontError): pass
LITERAL_STANDARD_ENCODING = LIT('StandardEncoding')LITERAL_TYPE1C = LIT('Type1C')

class PDFFont:
    def __init__(self, descriptor, widths, default_width=None):        self.descriptor = descriptor        self.widths = widths        self.fontname = resolve1(descriptor.get('FontName', 'unknown'))        if isinstance(self.fontname, PSLiteral):            self.fontname = literal_name(self.fontname)        self.flags = int_value(descriptor.get('Flags', 0))        self.ascent = num_value(descriptor.get('Ascent', 0))        self.descent = num_value(descriptor.get('Descent', 0))        self.italic_angle = num_value(descriptor.get('ItalicAngle', 0))        self.default_width = default_width or num_value(descriptor.get('MissingWidth', 0))        self.leading = num_value(descriptor.get('Leading', 0))        self.bbox = list_value(descriptor.get('FontBBox', (0,0,0,0)))        self.hscale = self.vscale = .001
    def __repr__(self):        return '<PDFFont>'
    def is_vertical(self):        return False
    def is_multibyte(self):        return False
    def decode(self, s):        if isinstance(s, str):            return list(map(ord, s))        else: # it's already bytes            return s
    def get_ascent(self):        return self.ascent * self.vscale    def get_descent(self):        return self.descent * self.vscale
    def get_width(self):        w = self.bbox[2]-self.bbox[0]        if w == 0:            w = -self.default_width        return w * self.hscale    def get_height(self):        h = self.bbox[3]-self.bbox[1]        if h == 0:            h = self.ascent - self.descent        return h * self.vscale
    def char_width(self, cid):        return self.widths.get(cid, self.default_width) * self.hscale
    def char_disp(self, cid):        return 0
    def string_width(self, s):        return sum( self.char_width(cid) for cid in self.decode(s) )

class PDFSimpleFont(PDFFont):
    def __init__(self, descriptor, widths, spec):        # Font encoding is specified either by a name of        # built-in encoding or a dictionary that describes        # the differences.        if 'Encoding' in spec:            encoding = resolve1(spec['Encoding'])        else:            encoding = LITERAL_STANDARD_ENCODING        if isinstance(encoding, dict):            name = literal_name(encoding.get('BaseEncoding', LITERAL_STANDARD_ENCODING))            diff = list_value(encoding.get('Differences', None))            self.cid2unicode = EncodingDB.get_encoding(name, diff)        else:            self.cid2unicode = EncodingDB.get_encoding(literal_name(encoding))        self.unicode_map = None        if 'ToUnicode' in spec:            strm = stream_value(spec['ToUnicode'])            self.unicode_map = FileUnicodeMap()            CMapParser(self.unicode_map, io.BytesIO(strm.get_data())).run()        PDFFont.__init__(self, descriptor, widths)
    def to_unichr(self, cid):        if self.unicode_map:            try:                return self.unicode_map.get_unichr(cid)            except KeyError:                pass        try:            return self.cid2unicode[cid]        except KeyError:            raise PDFUnicodeNotDefined(None, cid)
class PDFType1Font(PDFSimpleFont):
    def __init__(self, rsrcmgr, spec):        try:            self.basefont = literal_name(spec['BaseFont'])        except KeyError:            handle_error(PDFFontError, 'BaseFont is missing')            self.basefont = 'unknown'        try:            (descriptor, widths) = FontMetricsDB.get_metrics(self.basefont)        except KeyError:            descriptor = dict_value(spec.get('FontDescriptor', {}))            firstchar = int_value(spec.get('FirstChar', 0))            lastchar = int_value(spec.get('LastChar', 255))            widths = list_value(spec.get('Widths', [0]*256))            widths = dict( (i+firstchar,w) for (i,w) in enumerate(widths) )        PDFSimpleFont.__init__(self, descriptor, widths, spec)        if 'Encoding' not in spec and 'FontFile' in descriptor:            # try to recover the missing encoding info from the font file.            self.fontfile = stream_value(descriptor.get('FontFile'))            length1 = int_value(self.fontfile['Length1'])            data = self.fontfile.get_data()[:length1]            parser = Type1FontHeaderParser(io.BytesIO(data))            self.cid2unicode = parser.get_encoding()
    def __repr__(self):        return '<PDFType1Font: basefont=%r>' % self.basefont
class PDFTrueTypeFont(PDFType1Font):
    def __repr__(self):        return '<PDFTrueTypeFont: basefont=%r>' % self.basefont
class PDFType3Font(PDFSimpleFont):
    def __init__(self, rsrcmgr, spec):        firstchar = int_value(spec.get('FirstChar', 0))        lastchar = int_value(spec.get('LastChar', 0))        widths = list_value(spec.get('Widths', [0]*256))        widths = dict( (i+firstchar,w) for (i,w) in enumerate(widths))        if 'FontDescriptor' in spec:            descriptor = dict_value(spec['FontDescriptor'])        else:            descriptor = {'Ascent':0, 'Descent':0,                          'FontBBox':spec['FontBBox']}        PDFSimpleFont.__init__(self, descriptor, widths, spec)        self.matrix = tuple(list_value(spec.get('FontMatrix')))        (_,self.descent,_,self.ascent) = self.bbox        (self.hscale,self.vscale) = apply_matrix_norm(self.matrix, (1,1))
    def __repr__(self):        return '<PDFType3Font>'

class PDFCIDFont(PDFFont):
    def __init__(self, rsrcmgr, spec):        try:            self.basefont = literal_name(spec['BaseFont'])        except KeyError:            handle_error(PDFFontError, 'BaseFont is missing')            self.basefont = 'unknown'        self.cidsysteminfo = dict_value(spec.get('CIDSystemInfo', {}))        self.cidcoding = '%s-%s' % (self.cidsysteminfo.get('Registry', 'unknown'),                                    self.cidsysteminfo.get('Ordering', 'unknown'))        try:            name = literal_name(spec['Encoding'])        except KeyError:            handle_error(PDFFontError, 'Encoding is unspecified')            name = 'unknown'        try:            self.cmap = CMapDB.get_cmap(name)        except CMapDB.CMapNotFound as e:            handle_error(PDFFontError, str(e))            self.cmap = CMap()        try:            descriptor = dict_value(spec['FontDescriptor'])        except KeyError:            handle_error(PDFFontError, 'FontDescriptor is missing')            descriptor = {}        ttf = None        if 'FontFile2' in descriptor:            self.fontfile = stream_value(descriptor.get('FontFile2'))            ttf = TrueTypeFont(self.basefont,                               io.BytesIO(self.fontfile.get_data()))        self.unicode_map = None        if 'ToUnicode' in spec:            strm = stream_value(spec['ToUnicode'])            self.unicode_map = FileUnicodeMap()            CMapParser(self.unicode_map, io.BytesIO(strm.get_data())).run()        elif self.cidcoding == 'Adobe-Identity':            if ttf:                try:                    self.unicode_map = ttf.create_unicode_map()                except TrueTypeFont.CMapNotFound:                    pass        else:            try:                self.unicode_map = CMapDB.get_unicode_map(self.cidcoding, self.cmap.is_vertical())            except CMapDB.CMapNotFound as e:                pass
        self.vertical = self.cmap.is_vertical()        if self.vertical:            # writing mode: vertical            widths = get_widths2(list_value(spec.get('W2', [])))            self.disps = dict( (cid,(vx,vy)) for (cid,(_,(vx,vy))) in widths.items() )            (vy,w) = spec.get('DW2', [880, -1000])            self.default_disp = (None,vy)            widths = dict( (cid,w) for (cid,(w,_)) in widths.items() )            default_width = w        else:            # writing mode: horizontal            self.disps = {}            self.default_disp = 0            widths = get_widths(list_value(spec.get('W', [])))            default_width = spec.get('DW', 1000)        PDFFont.__init__(self, descriptor, widths, default_width=default_width)
    def __repr__(self):        return '<PDFCIDFont: basefont=%r, cidcoding=%r>' % (self.basefont, self.cidcoding)
    def is_vertical(self):        return self.vertical
    def is_multibyte(self):        return True
    def decode(self, bytes):        return self.cmap.decode(bytes)
    def char_disp(self, cid):        "Returns an integer for horizontal fonts, a tuple for vertical fonts."        return self.disps.get(cid, self.default_disp)
    def to_unichr(self, cid):        try:            if not self.unicode_map:                raise KeyError(cid)            return self.unicode_map.get_unichr(cid)        except KeyError:            raise PDFUnicodeNotDefined(self.cidcoding, cid)

def main(argv):    for fname in argv[1:]:        fp = io.open(fname, 'rb')        #font = TrueTypeFont(fname, fp)        font = CFFFont(fname, fp)        print(font)        fp.close()
if __name__ == '__main__':    sys.exit(main(sys.argv))