shithub: riscv

ref: 4fb65ae3e84f536a9b924082b7c59a30d5802e6b
dir: /sys/lib/python/encodings/palmos.py/

View raw version
""" Python Character Mapping Codec for PalmOS 3.5.

Written by Sjoerd Mullender (sjoerd@acm.org); based on iso8859_15.py.

"""#"

import codecs

### Codec APIs

class Codec(codecs.Codec):
    """Charmap codec for the PalmOS character set.

    Both directions delegate to the ``codecs`` charmap helpers, driven by
    the module-level ``encoding_map`` and ``decoding_map`` tables.  The
    class defines no instance state of its own.
    """

    def decode(self, input, errors='strict'):
        """Decode *input* through ``decoding_map``.

        *errors* is forwarded unchanged to ``codecs.charmap_decode`` and
        that function's result is returned as-is.
        """
        decoded = codecs.charmap_decode(input, errors, decoding_map)
        return decoded

    def encode(self, input, errors='strict'):
        """Encode *input* through ``encoding_map``.

        *errors* is forwarded unchanged to ``codecs.charmap_encode`` and
        that function's result is returned as-is.
        """
        encoded = codecs.charmap_encode(input, errors, encoding_map)
        return encoded

class IncrementalEncoder(codecs.IncrementalEncoder):
    """Incremental encoder that charmap-encodes each chunk independently."""

    def encode(self, input, final=False):
        """Return *input* encoded through ``encoding_map``.

        The error policy is taken from ``self.errors``.  *final* is accepted
        but not used.  Only the encoded data is returned; the second item
        of the ``codecs.charmap_encode`` result is dropped.
        """
        data, _consumed = codecs.charmap_encode(
            input, self.errors, encoding_map)
        return data

class IncrementalDecoder(codecs.IncrementalDecoder):
    """Incremental decoder that charmap-decodes each chunk independently."""

    def decode(self, input, final=False):
        """Return *input* decoded through ``decoding_map``.

        The error policy is taken from ``self.errors``.  *final* is accepted
        but not used.  Only the decoded text is returned; the second item
        of the ``codecs.charmap_decode`` result is dropped.
        """
        text, _consumed = codecs.charmap_decode(
            input, self.errors, decoding_map)
        return text

class StreamWriter(Codec, codecs.StreamWriter):
    """Stream writer for PalmOS text.

    Adds nothing of its own: it only combines ``Codec`` with
    ``codecs.StreamWriter``.
    """

class StreamReader(Codec, codecs.StreamReader):
    """Stream reader for PalmOS text.

    Adds nothing of its own: it only combines ``Codec`` with
    ``codecs.StreamReader``.
    """

### encodings module API

def getregentry():
    """Return the ``codecs.CodecInfo`` record for the 'palmos' codec.

    The stateless ``encode`` and ``decode`` entries are bound methods of two
    separate ``Codec`` instances; the incremental and stream entries are
    the classes themselves, not instances.
    """
    # Two distinct Codec objects are created, one per direction.
    stateless_encode = Codec().encode
    stateless_decode = Codec().decode
    return codecs.CodecInfo(
        encode=stateless_encode,
        decode=stateless_decode,
        streamreader=StreamReader,
        streamwriter=StreamWriter,
        incrementalencoder=IncrementalEncoder,
        incrementaldecoder=IncrementalDecoder,
        name='palmos',
    )

### Decoding Map

# Start from the identity table: each byte value 0x00-0xff maps to the
# code point with the same number.
decoding_map = codecs.make_identity_dict(range(256))

# The PalmOS character set is mostly iso-8859-1 with some differences.
# Each pair below is (PalmOS byte, Unicode code point) and overrides the
# identity entry for that byte.
decoding_map.update([
    (0x80, 0x20ac),  # EURO SIGN
    (0x82, 0x201a),  # SINGLE LOW-9 QUOTATION MARK
    (0x83, 0x0192),  # LATIN SMALL LETTER F WITH HOOK
    (0x84, 0x201e),  # DOUBLE LOW-9 QUOTATION MARK
    (0x85, 0x2026),  # HORIZONTAL ELLIPSIS
    (0x86, 0x2020),  # DAGGER
    (0x87, 0x2021),  # DOUBLE DAGGER
    (0x88, 0x02c6),  # MODIFIER LETTER CIRCUMFLEX ACCENT
    (0x89, 0x2030),  # PER MILLE SIGN
    (0x8a, 0x0160),  # LATIN CAPITAL LETTER S WITH CARON
    (0x8b, 0x2039),  # SINGLE LEFT-POINTING ANGLE QUOTATION MARK
    (0x8c, 0x0152),  # LATIN CAPITAL LIGATURE OE
    (0x8d, 0x2666),  # BLACK DIAMOND SUIT
    (0x8e, 0x2663),  # BLACK CLUB SUIT
    (0x8f, 0x2665),  # BLACK HEART SUIT
    (0x90, 0x2660),  # BLACK SPADE SUIT
    (0x91, 0x2018),  # LEFT SINGLE QUOTATION MARK
    (0x92, 0x2019),  # RIGHT SINGLE QUOTATION MARK
    (0x93, 0x201c),  # LEFT DOUBLE QUOTATION MARK
    (0x94, 0x201d),  # RIGHT DOUBLE QUOTATION MARK
    (0x95, 0x2022),  # BULLET
    (0x96, 0x2013),  # EN DASH
    (0x97, 0x2014),  # EM DASH
    (0x98, 0x02dc),  # SMALL TILDE
    (0x99, 0x2122),  # TRADE MARK SIGN
    (0x9a, 0x0161),  # LATIN SMALL LETTER S WITH CARON
    (0x9c, 0x0153),  # LATIN SMALL LIGATURE OE
    (0x9f, 0x0178),  # LATIN CAPITAL LETTER Y WITH DIAERESIS
])

### Encoding Map

# Derived from the finished decoding table, so it must be built last.
encoding_map = codecs.make_encoding_map(decoding_map)