⭐ 欢迎来到虫虫下载站! | 📦 资源下载 📁 资源专辑 ℹ️ 关于我们
⭐ 虫虫下载站

📄 eucgb2312_cn.py

📁 python 中文显示
💻 PY
字号:
# Chen Chien-Hsun, modified from Tamito KAJIYAMA's original code. 

import codecs

from encodings.chinesecn import euc_gb23122utf, utf2euc_gb2312

class Codec(codecs.Codec):
    # Unicode to character buffer
    def encode(self, data, errors='strict',
               supported_errors=('strict', 'ignore', 'replace')):
        if errors not in supported_errors:
            raise UnicodeError, "unknown error handling"
        m = utf2euc_gb2312.mapping
        s = ''
        for c in data:
            if c < u'\u0080':
                s = s + c.encode("ascii")
            else:
                if m.has_key(c):
                    s = s + m[c]
                elif errors == 'replace':
                    s = s + '\x21\x21' # GB2312 IDEOGRAPHIC SPACE
                elif errors == 'strict':
                    raise UnicodeError, "cannot map \\u%04x to GB2312" % ord(c)
        return (s, len(s))
    # character buffer to Unicode
    def decode(self, data, errors='strict',
               supported_errors=('strict', 'ignore', 'replace')):
        if errors not in supported_errors:
            raise UnicodeError, "unknown error handling"
        m = euc_gb23122utf.mapping
        s = u''
        data = str(data) # character buffer compatible object
        size = len(data)
        p = 0
        while p < size:
            if data[p] < "\x80":
                s = s + unicode(data[p], "ascii")
                p = p + 1
            else:
                c = data[p:p+2]
                p = p + 2
                if m.has_key(c):
                    s = s + m[c]
                elif errors == 'replace':
                    s = s + u'\uFFFD' # REPLACEMENT CHARACTER
                elif errors == 'strict':
                    raise UnicodeError, "cannot map GB2312 \\x%02x%02x to Unicode" % (ord(c[0]), ord(c[1]))
        return (s, p)

class StreamWriter(Codec, codecs.StreamWriter):
    pass

class StreamReader(Codec, codecs.StreamReader):
    def __init__(self, stream, errors='strict'):
        codecs.StreamReader.__init__(self, stream, errors)
        self.data = ''
    def read(self, size=-1):
        if size < 0:
            data = self.data + self.stream.read()
            self.data = ''
        else:
            data = self.data + self.stream.read(size - len(self.data))
            size = len(data)
            p = 0
            while p < size:
                if data[p] < "\x80":
                    p = p + 1
                elif p + 2 <= size:
                    p = p + 2
                else:
                    break
            data, self.data = data[:p], data[p:]
        return self.decode(data)[0]
    def readline(self, size=None):
        if size is None:
            data = self.data + self.stream.readline()
        else:
            data = self.data + self.stream.readline(size - len(self.data))
        self.data = ''
        return self.decode(data)[0]
    def reset(self):
        self.data = ''

### encodings module API

def getregentry():

    return (Codec().encode,Codec().decode,StreamReader,StreamWriter)

⌨️ 快捷键说明

复制代码 Ctrl + C
搜索代码 Ctrl + F
全屏模式 F11
切换主题 Ctrl + Shift + D
显示快捷键 ?
增大字号 Ctrl + =
减小字号 Ctrl + -