📄 printstats.py
字号:
"""printstats.py - Print project statistics and informationby reading the user's crawls database.Created by Anand B Pillai <abpillai at gmail dot com> May 30 2008Copyright (C) 2008 Anand B Pillai."""import sysimport osimport timetry: import sqlite3except ImportError: sys.exit('sqlite3 module not found!')conn = sqlite3.connect(os.path.expanduser("~/.harvestman/db/crawls.db"))c1 = conn.cursor()cur = c1.execute("select * from projects order by id")for member in c1: # project id is first member proj_id = member[0] print 'Project #%d crawled at [%s] with URL {%s}, saved to name "<%s>"...' % (proj_id, time.ctime(float(member[1])), member[3], member[2]) c2 = conn.cursor() c2.execute("select * from project_stats where project_id=%d" % proj_id) data = c2.fetchall() if len(data)==0: continue data = data[0] print 'Statistics' print '----------' print ' Total # of URLs=>',data[1] print ' Processed URLs=>',data[2] print ' Filtered URLs=>',data[3] print ' Failed URLs=>',data[4] print ' Broken URLs=>',data[5] print ' URLs found in Cache=>',data[6] print ' # of domains=>',data[7] print ' # of directories=>',data[8] print ' # of files=>',data[9] print ' Data downloaded=>',data[10],'bytes.' print ' Duration=>',data[11],'seconds.' c2.close()c1.close()conn.close()
⌨️ 快捷键说明
复制代码
Ctrl + C
搜索代码
Ctrl + F
全屏模式
F11
切换主题
Ctrl + Shift + D
显示快捷键
?
增大字号
Ctrl + =
减小字号
Ctrl + -