cp1253.py

来自「mallet是自然语言处理、机器学习领域的一个开源项目。」· Python 代码 · 共 152 行

PY
152
字号
""" Python Character Mapping Codec generated from 'CP1253.TXT' with gencodec.py.Written by Marc-Andre Lemburg (mal@lemburg.com).(c) Copyright CNRI, All Rights Reserved. NO WARRANTY.(c) Copyright 2000 Guido van Rossum."""#"import codecs### Codec APIsclass Codec(codecs.Codec):    def encode(self,input,errors='strict'):        return codecs.charmap_encode(input,errors,encoding_map)            def decode(self,input,errors='strict'):        return codecs.charmap_decode(input,errors,decoding_map)class StreamWriter(Codec,codecs.StreamWriter):    pass        class StreamReader(Codec,codecs.StreamReader):    pass### encodings module APIdef getregentry():    return (Codec().encode,Codec().decode,StreamReader,StreamWriter)### Decoding Mapdecoding_map = codecs.make_identity_dict(range(256))decoding_map.update({	0x0080: 0x20ac,	# EURO SIGN	0x0081: None,	# UNDEFINED	0x0082: 0x201a,	# SINGLE LOW-9 QUOTATION MARK	0x0083: 0x0192,	# LATIN SMALL LETTER F WITH HOOK	0x0084: 0x201e,	# DOUBLE LOW-9 QUOTATION MARK	0x0085: 0x2026,	# HORIZONTAL ELLIPSIS	0x0086: 0x2020,	# DAGGER	0x0087: 0x2021,	# DOUBLE DAGGER	0x0088: None,	# UNDEFINED	0x0089: 0x2030,	# PER MILLE SIGN	0x008a: None,	# UNDEFINED	0x008b: 0x2039,	# SINGLE LEFT-POINTING ANGLE QUOTATION MARK	0x008c: None,	# UNDEFINED	0x008d: None,	# UNDEFINED	0x008e: None,	# UNDEFINED	0x008f: None,	# UNDEFINED	0x0090: None,	# UNDEFINED	0x0091: 0x2018,	# LEFT SINGLE QUOTATION MARK	0x0092: 0x2019,	# RIGHT SINGLE QUOTATION MARK	0x0093: 0x201c,	# LEFT DOUBLE QUOTATION MARK	0x0094: 0x201d,	# RIGHT DOUBLE QUOTATION MARK	0x0095: 0x2022,	# BULLET	0x0096: 0x2013,	# EN DASH	0x0097: 0x2014,	# EM DASH	0x0098: None,	# UNDEFINED	0x0099: 0x2122,	# TRADE MARK SIGN	0x009a: None,	# UNDEFINED	0x009b: 0x203a,	# SINGLE RIGHT-POINTING ANGLE QUOTATION MARK	0x009c: None,	# UNDEFINED	0x009d: None,	# UNDEFINED	0x009e: None,	# UNDEFINED	0x009f: None,	# UNDEFINED	0x00a1: 0x0385,	# GREEK DIALYTIKA TONOS	0x00a2: 0x0386,	# GREEK CAPITAL LETTER ALPHA WITH TONOS	0x00aa: None,	# UNDEFINED	0x00af: 0x2015,	# HORIZONTAL BAR	0x00b4: 0x0384,	# GREEK TONOS	0x00b8: 0x0388,	# GREEK CAPITAL LETTER EPSILON WITH TONOS	0x00b9: 0x0389,	# GREEK CAPITAL LETTER ETA WITH TONOS	0x00ba: 0x038a,	# GREEK CAPITAL LETTER IOTA WITH TONOS	0x00bc: 0x038c,	# GREEK CAPITAL LETTER OMICRON WITH TONOS	0x00be: 0x038e,	# GREEK CAPITAL LETTER UPSILON WITH TONOS	0x00bf: 0x038f,	# GREEK CAPITAL LETTER OMEGA WITH TONOS	0x00c0: 0x0390,	# GREEK SMALL LETTER IOTA WITH DIALYTIKA AND TONOS	0x00c1: 0x0391,	# GREEK CAPITAL LETTER ALPHA	0x00c2: 0x0392,	# GREEK CAPITAL LETTER BETA	0x00c3: 0x0393,	# GREEK CAPITAL LETTER GAMMA	0x00c4: 0x0394,	# GREEK CAPITAL LETTER DELTA	0x00c5: 0x0395,	# GREEK CAPITAL LETTER EPSILON	0x00c6: 0x0396,	# GREEK CAPITAL LETTER ZETA	0x00c7: 0x0397,	# GREEK CAPITAL LETTER ETA	0x00c8: 0x0398,	# GREEK CAPITAL LETTER THETA	0x00c9: 0x0399,	# GREEK CAPITAL LETTER IOTA	0x00ca: 0x039a,	# GREEK CAPITAL LETTER KAPPA	0x00cb: 0x039b,	# GREEK CAPITAL LETTER LAMDA	0x00cc: 0x039c,	# GREEK CAPITAL LETTER MU	0x00cd: 0x039d,	# GREEK CAPITAL LETTER NU	0x00ce: 0x039e,	# GREEK CAPITAL LETTER XI	0x00cf: 0x039f,	# GREEK CAPITAL LETTER OMICRON	0x00d0: 0x03a0,	# GREEK CAPITAL LETTER PI	0x00d1: 0x03a1,	# GREEK CAPITAL LETTER RHO	0x00d2: None,	# UNDEFINED	0x00d3: 0x03a3,	# GREEK CAPITAL LETTER SIGMA	0x00d4: 0x03a4,	# GREEK CAPITAL LETTER TAU	0x00d5: 0x03a5,	# GREEK CAPITAL LETTER UPSILON	0x00d6: 0x03a6,	# GREEK CAPITAL LETTER PHI	0x00d7: 0x03a7,	# GREEK CAPITAL LETTER CHI	0x00d8: 0x03a8,	# GREEK CAPITAL LETTER PSI	0x00d9: 0x03a9,	# GREEK CAPITAL LETTER OMEGA	0x00da: 0x03aa,	# GREEK CAPITAL LETTER IOTA WITH DIALYTIKA	0x00db: 0x03ab,	# GREEK CAPITAL LETTER UPSILON WITH DIALYTIKA	0x00dc: 0x03ac,	# GREEK SMALL LETTER ALPHA WITH TONOS	0x00dd: 0x03ad,	# GREEK SMALL LETTER EPSILON WITH TONOS	0x00de: 0x03ae,	# GREEK SMALL LETTER ETA WITH TONOS	0x00df: 0x03af,	# GREEK SMALL LETTER IOTA WITH TONOS	0x00e0: 0x03b0,	# GREEK SMALL LETTER UPSILON WITH DIALYTIKA AND TONOS	0x00e1: 0x03b1,	# GREEK SMALL LETTER ALPHA	0x00e2: 0x03b2,	# GREEK SMALL LETTER BETA	0x00e3: 0x03b3,	# GREEK SMALL LETTER GAMMA	0x00e4: 0x03b4,	# GREEK SMALL LETTER DELTA	0x00e5: 0x03b5,	# GREEK SMALL LETTER EPSILON	0x00e6: 0x03b6,	# GREEK SMALL LETTER ZETA	0x00e7: 0x03b7,	# GREEK SMALL LETTER ETA	0x00e8: 0x03b8,	# GREEK SMALL LETTER THETA	0x00e9: 0x03b9,	# GREEK SMALL LETTER IOTA	0x00ea: 0x03ba,	# GREEK SMALL LETTER KAPPA	0x00eb: 0x03bb,	# GREEK SMALL LETTER LAMDA	0x00ec: 0x03bc,	# GREEK SMALL LETTER MU	0x00ed: 0x03bd,	# GREEK SMALL LETTER NU	0x00ee: 0x03be,	# GREEK SMALL LETTER XI	0x00ef: 0x03bf,	# GREEK SMALL LETTER OMICRON	0x00f0: 0x03c0,	# GREEK SMALL LETTER PI	0x00f1: 0x03c1,	# GREEK SMALL LETTER RHO	0x00f2: 0x03c2,	# GREEK SMALL LETTER FINAL SIGMA	0x00f3: 0x03c3,	# GREEK SMALL LETTER SIGMA	0x00f4: 0x03c4,	# GREEK SMALL LETTER TAU	0x00f5: 0x03c5,	# GREEK SMALL LETTER UPSILON	0x00f6: 0x03c6,	# GREEK SMALL LETTER PHI	0x00f7: 0x03c7,	# GREEK SMALL LETTER CHI	0x00f8: 0x03c8,	# GREEK SMALL LETTER PSI	0x00f9: 0x03c9,	# GREEK SMALL LETTER OMEGA	0x00fa: 0x03ca,	# GREEK SMALL LETTER IOTA WITH DIALYTIKA	0x00fb: 0x03cb,	# GREEK SMALL LETTER UPSILON WITH DIALYTIKA	0x00fc: 0x03cc,	# GREEK SMALL LETTER OMICRON WITH TONOS	0x00fd: 0x03cd,	# GREEK SMALL LETTER UPSILON WITH TONOS	0x00fe: 0x03ce,	# GREEK SMALL LETTER OMEGA WITH TONOS	0x00ff: None,	# UNDEFINED})### Encoding Mapencoding_map = codecs.make_encoding_map(decoding_map)

⌨️ 快捷键说明

复制代码Ctrl + C
搜索代码Ctrl + F
全屏模式F11
增大字号Ctrl + =
减小字号Ctrl + -
显示快捷键?