pop3graph.py

来自「用python实现的邮件过滤器」· Python 代码 · 共 92 行

92 行

#!/usr/bin/env python"""Analyse the pop3proxy's caches and produce a graph of how accurateclassifier has been over time.  Only really meaningful if you startedwith an empty database."""from __future__ import divisionimport sysimport getoptfrom spambayes import  mboxutilsfrom spambayes.FileCorpus import FileCorpus, FileMessageFactory, GzipFileMessageFactoryfrom spambayes.Options import optionsdef usage():    print __doc__def main(argv):    opts, args = getopt.getopt(argv, "h", ["help"])    for opt, arg in opts:        if opt in ("-h", "--help"):            usage()            return    # Create the corpuses and the factory that reads the messages.    if options["pop3proxy", "cache_use_gzip"]:        messageFactory = GzipFileMessageFactory()    else:        messageFactory = FileMessageFactory()    sc = get_pathname_option("Storage", "spam_cache")    hc = get_pathname_option("Storage", "ham_cache")    spamCorpus = FileCorpus(messageFactory, sc)    hamCorpus = FileCorpus(messageFactory, hc)    # Read in all the trained messages.    allTrained = {}    for corpus, disposition in [(spamCorpus, 'Yes'), (hamCorpus, 'No')]:        for m in corpus:            message = mboxutils.get_message(m.getSubstance())            message._pop3CacheDisposition = disposition            allTrained[m.key()] = message    # Sort the messages into the order they arrived, then work out a scaling    # factor for the graph - 'limit' is the widest it can be in characters.    keys = allTrained.keys()    keys.sort()    limit = 70    if len(keys) < limit:        scale = 1    else:        scale = len(keys) // (limit//2)    # Build the data - an array of cumulative success indexed by count.    count = successful = 0    successByCount = []    for key in keys:        message = allTrained[key]        disposition = message[options["Headers",                                      "classification_header_name"]]        if (message._pop3CacheDisposition == disposition):            successful += 1        count += 1        if count % scale == (scale-1):            successByCount.append(successful // scale)    # Build the graph, as a list of rows of characters.    size = count // scale    graph = [[" " for i in range(size+3)] for j in range(size)]    for c in range(size):        graph[c][1] = "|"        graph[c][c+3] = "."        graph[successByCount[c]][c+3] = "*"    graph.reverse()    # Print the graph.    print "\n   Success of the classifier over time:\n"    print "   . - Number of messages over time"    print "   * - Number of correctly classified messages over time\n\n"    for row in range(size):        line = ''.join(graph[row])        if row == 0:            print line + " %d" % count        elif row == (count - successful) // scale:            print line + " %d" % successful        else:            print line    print " " + "_" * (size+2)if __name__ == '__main__':    main(sys.argv[1:])

pop3graph.py - 源码说明

本页面展示了「用python实现的邮件过滤器」中的 pop3graph.py 源码文件，采用 Python 编程语言编写，共 92 行代码。您可以在线阅读完整代码内容，也可以返回资源详情页下载完整源码包进行本地学习和开发。

虫虫下载站收录了大量与python相关的技术资源，包括源代码、技术文档、电路图等，是电子工程师和嵌入式开发者的专业学习平台。

⌨️ 快捷键说明

复制代码Ctrl + C

搜索代码Ctrl + F

全屏模式F11

增大字号Ctrl + =

减小字号Ctrl + -

显示快捷键?