mirror of
				https://github.com/python/cpython.git
				synced 2025-10-24 23:46:23 +00:00 
			
		
		
		
	 716cf91839
			
		
	
	
		716cf91839
		
	
	
	
	
		
			
			codec files to codecs.py and added logic so that multi mappings in the decoding maps now result in mappings to None (undefined mapping) in the encoding maps.
		
			
				
	
	
		
			82 lines
		
	
	
	
		
			2.4 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			82 lines
		
	
	
	
		
			2.4 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
| """ Python Character Mapping Codec generated from 'CP1254.TXT' with gencodec.py.
 | |
| 
 | |
| Written by Marc-Andre Lemburg (mal@lemburg.com).
 | |
| 
 | |
| (c) Copyright CNRI, All Rights Reserved. NO WARRANTY.
 | |
| (c) Copyright 2000 Guido van Rossum.
 | |
| 
 | |
| """#"
 | |
| 
 | |
| import codecs
 | |
| 
 | |
| ### Codec APIs
 | |
| 
 | |
class Codec(codecs.Codec):
    """Charmap codec driven by this module's two mapping tables."""

    def encode(self, input, errors='strict'):
        """Encode *input* through the module-level ``encoding_map``.

        The work is delegated to ``codecs.charmap_encode`` and its result
        is returned unchanged.  *errors* is passed through as the
        error-handling scheme and defaults to ``'strict'``.
        """
        table = encoding_map
        return codecs.charmap_encode(input, errors, table)

    def decode(self, input, errors='strict'):
        """Decode *input* through the module-level ``decoding_map``.

        The work is delegated to ``codecs.charmap_decode`` and its result
        is returned unchanged.  *errors* is passed through as the
        error-handling scheme and defaults to ``'strict'``.
        """
        table = decoding_map
        return codecs.charmap_decode(input, errors, table)
 | |
| 
 | |
class StreamWriter(Codec, codecs.StreamWriter):
    """Stream writer built from this module's ``Codec`` and
    ``codecs.StreamWriter``.

    ``Codec`` is listed first among the bases, so its methods come first
    in the method resolution order.  The class adds no members of its own.
    """
 | |
|         
 | |
class StreamReader(Codec, codecs.StreamReader):
    """Stream reader built from this module's ``Codec`` and
    ``codecs.StreamReader``.

    ``Codec`` is listed first among the bases, so its methods come first
    in the method resolution order.  The class adds no members of its own.
    """
 | |
| 
 | |
| ### encodings module API
 | |
| 
 | |
def getregentry():
    """Return this module's codec registry entry.

    The entry is the 4-tuple ``(encode, decode, StreamReader,
    StreamWriter)``.  The encode and decode callables are bound methods
    taken from two separately created ``Codec`` instances; the reader and
    writer are returned as classes, not instances.
    """
    encoder = Codec().encode
    decoder = Codec().decode
    return (encoder, decoder, StreamReader, StreamWriter)
 | |
| 
 | |
| ### Decoding Map
 | |
| 
 | |
# Begin with the identity mapping for every byte value 0x00-0xff, then
# override only the positions listed below.  A value of None marks a byte
# as undefined.
decoding_map = codecs.make_identity_dict(range(256))
decoding_map.update({
    # 0x80-0x9f
    0x80: 0x20ac,  # EURO SIGN
    0x81: None,    # UNDEFINED
    0x82: 0x201a,  # SINGLE LOW-9 QUOTATION MARK
    0x83: 0x0192,  # LATIN SMALL LETTER F WITH HOOK
    0x84: 0x201e,  # DOUBLE LOW-9 QUOTATION MARK
    0x85: 0x2026,  # HORIZONTAL ELLIPSIS
    0x86: 0x2020,  # DAGGER
    0x87: 0x2021,  # DOUBLE DAGGER
    0x88: 0x02c6,  # MODIFIER LETTER CIRCUMFLEX ACCENT
    0x89: 0x2030,  # PER MILLE SIGN
    0x8a: 0x0160,  # LATIN CAPITAL LETTER S WITH CARON
    0x8b: 0x2039,  # SINGLE LEFT-POINTING ANGLE QUOTATION MARK
    0x8c: 0x0152,  # LATIN CAPITAL LIGATURE OE
    0x8d: None,    # UNDEFINED
    0x8e: None,    # UNDEFINED
    0x8f: None,    # UNDEFINED
    0x90: None,    # UNDEFINED
    0x91: 0x2018,  # LEFT SINGLE QUOTATION MARK
    0x92: 0x2019,  # RIGHT SINGLE QUOTATION MARK
    0x93: 0x201c,  # LEFT DOUBLE QUOTATION MARK
    0x94: 0x201d,  # RIGHT DOUBLE QUOTATION MARK
    0x95: 0x2022,  # BULLET
    0x96: 0x2013,  # EN DASH
    0x97: 0x2014,  # EM DASH
    0x98: 0x02dc,  # SMALL TILDE
    0x99: 0x2122,  # TRADE MARK SIGN
    0x9a: 0x0161,  # LATIN SMALL LETTER S WITH CARON
    0x9b: 0x203a,  # SINGLE RIGHT-POINTING ANGLE QUOTATION MARK
    0x9c: 0x0153,  # LATIN SMALL LIGATURE OE
    0x9d: None,    # UNDEFINED
    0x9e: None,    # UNDEFINED
    0x9f: 0x0178,  # LATIN CAPITAL LETTER Y WITH DIAERESIS
    # 0xd0-0xfe: the six remaining overrides
    0xd0: 0x011e,  # LATIN CAPITAL LETTER G WITH BREVE
    0xdd: 0x0130,  # LATIN CAPITAL LETTER I WITH DOT ABOVE
    0xde: 0x015e,  # LATIN CAPITAL LETTER S WITH CEDILLA
    0xf0: 0x011f,  # LATIN SMALL LETTER G WITH BREVE
    0xfd: 0x0131,  # LATIN SMALL LETTER DOTLESS I
    0xfe: 0x015f,  # LATIN SMALL LETTER S WITH CEDILLA
})

### Encoding Map

# The reverse table is derived from decoding_map rather than written out
# by hand, so the two directions cannot drift apart.
encoding_map = codecs.make_encoding_map(decoding_map)
 |