beautifulsupe.py

来自「bittorrent source by python. please enjoy」· Python 代码 · 共 133 行

133 行

# A very very minimal BeautifulSoup imitation.
#
# BS uses SGMLlib to parse, which converts everything to lower case.
# This uses real xml parsing to mimic the parts of BS we use.

import xml.dom.minidom


def _getText(node):
    """Return the data of every direct text-node child of ``node``.

    Only children whose ``nodeType`` is ``TEXT_NODE`` contribute; text nested
    inside child elements is not collected.  Each entry is converted with
    ``str()``.
    """
    return [str(child.data)
            for child in node.childNodes
            if child.nodeType == child.TEXT_NODE]


def _getNodesAsTags(root):
    """Return a ``Tag`` for every direct element child of ``root``, in order."""
    return [Tag(child)
            for child in root.childNodes
            if child.nodeType == child.ELEMENT_NODE]


def _firstText(tag):
    """Return the first text chunk in ``tag.contents``, or ``''`` if none.

    ``Tag.contents`` lists child tags before text chunks, so indexing
    ``contents[0]`` directly is only safe for elements that hold text and
    nothing else.
    """
    for item in tag.contents:
        if not isinstance(item, Tag):
            return item
    return ''


class Tag(object):
    """Wrapper around a DOM node exposing a small BeautifulSoup-like API.

    Attributes:
        node:     the wrapped DOM node.
        name:     the node's ``nodeName``.
        contents: child elements (as ``Tag`` objects) followed by the node's
                  direct text chunks (as strings).
        text:     the direct text chunks joined into one string.
    """

    def __init__(self, node):
        self.node = node
        self.name = node.nodeName
        text = _getText(node)
        # Child tags come first, then the text chunks.
        self.contents = _getNodesAsTags(node) + text
        self.text = ''.join(text)

    def child_elements(self):
        """Return the ``Tag`` entries of ``contents`` (text chunks omitted)."""
        return [item for item in self.contents if isinstance(item, Tag)]

    def get(self, tagname):
        """Return the text of the first child tag named ``tagname``.

        Returns ``None`` when there is no such child.
        """
        got = self.first(tagname)
        if got is None:
            return None
        return got.text

    def first(self, tagname):
        """Return the first direct child ``Tag`` named ``tagname``, or ``None``."""
        for item in self.contents:
            if isinstance(item, Tag) and item.name == tagname:
                return item
        return None


class BeautifulSupe(object):
    """Parse an XML document and offer simple tag lookups over it."""

    def __init__(self, data):
        """Parse ``data`` (text or bytes) after stripping NUL characters
        from both ends.

        Whatever ``xml.dom.minidom.parseString`` raises for malformed input
        propagates to the caller.
        """
        # please don't give us your null terminators
        # (strip() needs an argument of the same type as the data itself)
        nul = b'\0' if isinstance(data, bytes) else chr(0)
        self.dom = xml.dom.minidom.parseString(data.strip(nul))

    def first(self, tagname, root=None):
        """Return the first node named ``tagname`` wrapped in a ``Tag``.

        With ``root`` omitted the whole document is searched; otherwise only
        the direct children of ``root`` (a DOM node) are examined.  Returns
        ``None`` when nothing matches.
        """
        found = None
        if root is None:
            elements = self.dom.getElementsByTagName(tagname)
            if elements:
                found = elements[0]
        else:
            for node in root.childNodes:
                if node.nodeName == tagname:
                    found = node
                    break
        if found is None:
            return None
        return Tag(found)

    def fetch(self, tagname, restraints=None):
        """Return a ``Tag`` for every ``tagname`` element meeting ``restraints``.

        ``restraints`` maps a child tag name to a required text prefix.  An
        element matches when, for every entry, it has a direct child with
        that name whose first text chunk starts with the prefix.  A child
        with no direct text is treated as having empty text, so it only
        satisfies an empty prefix.  With no restraints every ``tagname``
        element in the document is returned.
        """
        if restraints is None:
            restraints = {}

        matches = []
        for node in self.dom.getElementsByTagName(tagname):
            if self._meets(node, restraints):
                matches.append(Tag(node))
        return matches

    def _meets(self, node, restraints):
        """Return True when ``node`` satisfies every entry of ``restraints``."""
        for childname in restraints:
            child = self.first(childname, node)
            if child is None:
                return False
            if not _firstText(child).startswith(restraints[childname]):
                return False
        return True

    def scour(self, prefix, suffix=None, node=None):
        """Return a ``Tag`` for every descendant whose name fits the pattern.

        A node fits when its ``nodeName`` starts with ``prefix`` and, if
        ``suffix`` is given and non-empty, also ends with ``suffix``.  The
        search walks all descendants of ``node`` depth-first (``node`` itself
        is not tested) and defaults to the document element.
        """
        if node is None:
            node = self.dom.documentElement

        matches = []
        for child in node.childNodes:
            name = child.nodeName
            if name.startswith(prefix) and (not suffix or name.endswith(suffix)):
                matches.append(Tag(child))
            matches += self.scour(prefix, suffix, child)
        return matches

beautifulsupe.py - 源码说明

本页面展示了「bittorrent source by python. please enjoy」中的 beautifulsupe.py 源码文件，采用 Python 编程语言编写，共 133 行代码。您可以在线阅读完整代码内容，也可以返回资源详情页下载完整源码包进行本地学习和开发。

虫虫下载站收录了大量与bittorrent相关的技术资源，包括源代码、技术文档、电路图等，是电子工程师和嵌入式开发者的专业学习平台。

⌨️ 快捷键说明

复制代码Ctrl + C

搜索代码Ctrl + F

全屏模式F11

增大字号Ctrl + =

减小字号Ctrl + -

显示快捷键?