mirror of
https://github.com/python/cpython.git
synced 2025-07-27 13:14:41 +00:00

of tuple) that provides incremental decoders and encoders (a way to use stateful codecs without the stream API). Functions codecs.getincrementaldecoder() and codecs.getincrementalencoder() have been added.
83 lines
2.9 KiB
Python
83 lines
2.9 KiB
Python
""" Python Character Mapping Codec for PalmOS 3.5.
|
|
|
|
Written by Sjoerd Mullender (sjoerd@acm.org); based on iso8859_15.py.
|
|
|
|
"""#"
|
|
|
|
import codecs
|
|
|
|
### Codec APIs
|
|
|
|
class Codec(codecs.Codec):
    """Stateless PalmOS charmap codec backed by the module-level tables."""

    def encode(self, input, errors='strict'):
        """Encode *input* through the module-level ``encoding_map``.

        *errors* is forwarded as the error-handling scheme.  The value
        returned by ``codecs.charmap_encode`` is passed back unchanged.
        """
        table = encoding_map
        return codecs.charmap_encode(input, errors, table)

    def decode(self, input, errors='strict'):
        """Decode *input* through the module-level ``decoding_map``.

        *errors* is forwarded as the error-handling scheme.  The value
        returned by ``codecs.charmap_decode`` is passed back unchanged.
        """
        table = decoding_map
        return codecs.charmap_decode(input, errors, table)
|
|
|
|
class IncrementalEncoder(codecs.IncrementalEncoder):
    """Incremental encoder for PalmOS text."""

    def encode(self, input, final=False):
        """Encode one chunk of *input* using ``encoding_map``.

        Only ``self.errors`` is read from the instance; *final* is accepted
        for interface compatibility and is not consulted.  Returns the
        first element of the ``codecs.charmap_encode`` result.
        """
        result = codecs.charmap_encode(input, self.errors, encoding_map)
        return result[0]
|
|
|
|
class IncrementalDecoder(codecs.IncrementalDecoder):
    """Incremental decoder for PalmOS-encoded bytes."""

    def decode(self, input, final=False):
        """Decode one chunk of *input* using ``decoding_map``.

        Only ``self.errors`` is read from the instance; *final* is accepted
        for interface compatibility and is not consulted.  Returns the
        first element of the ``codecs.charmap_decode`` result.
        """
        result = codecs.charmap_decode(input, self.errors, decoding_map)
        return result[0]
|
|
|
|
class StreamWriter(Codec, codecs.StreamWriter):
    """Stream writer combining ``Codec`` with ``codecs.StreamWriter``.

    Adds no members of its own; everything comes from the two bases.
    """
|
|
|
|
class StreamReader(Codec, codecs.StreamReader):
    """Stream reader combining ``Codec`` with ``codecs.StreamReader``.

    Adds no members of its own; everything comes from the two bases.
    """
|
|
|
|
### encodings module API
|
|
|
|
def getregentry():
    """Return the ``codecs.CodecInfo`` record for this codec.

    The record is named ``'palmos'`` and exposes the stateless encode and
    decode functions together with the incremental and stream classes
    defined in this module.
    """
    # Bound methods taken from two separate throwaway Codec instances.
    stateless_encode = Codec().encode
    stateless_decode = Codec().decode
    return codecs.CodecInfo(
        name='palmos',
        encode=stateless_encode,
        decode=stateless_decode,
        incrementalencoder=IncrementalEncoder,
        incrementaldecoder=IncrementalDecoder,
        streamreader=StreamReader,
        streamwriter=StreamWriter,
    )
|
|
|
|
### Decoding Map
|
|
|
|
# Begin with every byte value 0..255 mapped to the same code point.
decoding_map = codecs.make_identity_dict(range(256))

# The PalmOS character set is mostly iso-8859-1 with some differences.
# Each (byte, code point) pair below overrides one entry in the 0x80-0x9f
# range.  Bytes 0x81, 0x9b, 0x9d and 0x9e are not listed and therefore keep
# their identity mapping.
decoding_map.update([
    (0x0080, 0x20ac),  # EURO SIGN
    (0x0082, 0x201a),  # SINGLE LOW-9 QUOTATION MARK
    (0x0083, 0x0192),  # LATIN SMALL LETTER F WITH HOOK
    (0x0084, 0x201e),  # DOUBLE LOW-9 QUOTATION MARK
    (0x0085, 0x2026),  # HORIZONTAL ELLIPSIS
    (0x0086, 0x2020),  # DAGGER
    (0x0087, 0x2021),  # DOUBLE DAGGER
    (0x0088, 0x02c6),  # MODIFIER LETTER CIRCUMFLEX ACCENT
    (0x0089, 0x2030),  # PER MILLE SIGN
    (0x008a, 0x0160),  # LATIN CAPITAL LETTER S WITH CARON
    (0x008b, 0x2039),  # SINGLE LEFT-POINTING ANGLE QUOTATION MARK
    (0x008c, 0x0152),  # LATIN CAPITAL LIGATURE OE
    (0x008d, 0x2666),  # BLACK DIAMOND SUIT
    (0x008e, 0x2663),  # BLACK CLUB SUIT
    (0x008f, 0x2665),  # BLACK HEART SUIT
    (0x0090, 0x2660),  # BLACK SPADE SUIT
    (0x0091, 0x2018),  # LEFT SINGLE QUOTATION MARK
    (0x0092, 0x2019),  # RIGHT SINGLE QUOTATION MARK
    (0x0093, 0x201c),  # LEFT DOUBLE QUOTATION MARK
    (0x0094, 0x201d),  # RIGHT DOUBLE QUOTATION MARK
    (0x0095, 0x2022),  # BULLET
    (0x0096, 0x2013),  # EN DASH
    (0x0097, 0x2014),  # EM DASH
    (0x0098, 0x02dc),  # SMALL TILDE
    (0x0099, 0x2122),  # TRADE MARK SIGN
    (0x009a, 0x0161),  # LATIN SMALL LETTER S WITH CARON
    (0x009c, 0x0153),  # LATIN SMALL LIGATURE OE
    (0x009f, 0x0178),  # LATIN CAPITAL LETTER Y WITH DIAERESIS
])

### Encoding Map

# Inverse table (code point -> byte value) derived from the decoding map.
encoding_map = codecs.make_encoding_map(decoding_map)
|