📄 topics.py
字号:
#! /usr/bin/python# usage: python topics.py <beta file> <vocab file> <num words>## <beta file> is output from the lda-c code# <vocab file> is a list of words, one per line# <num words> is the number of words to print from each topicimport sysdef print_topics(beta_file, vocab_file, nwords = 25): # get the vocabulary vocab = file(vocab_file, 'r').readlines() # vocab = map(lambda x: x.split()[0], vocab) vocab = map(lambda x: x.strip(), vocab) # for each line in the beta file indices = range(len(vocab)) topic_no = 0 for topic in file(beta_file, 'r'): print 'topic %03d' % topic_no topic = map(float, topic.split()) indices.sort(lambda x,y: -cmp(topic[x], topic[y])) for i in range(nwords): print ' %s' % vocab[indices[i]] topic_no = topic_no + 1 print '\n'if (__name__ == '__main__'): if (len(sys.argv) != 4): print 'usage: python topics.py <beta-file> <vocab-file> <num words>\n' sys.exit(1) beta_file = sys.argv[1] vocab_file = sys.argv[2] nwords = int(sys.argv[3]) print_topics(beta_file, vocab_file, nwords)
⌨️ 快捷键说明
复制代码
Ctrl + C
搜索代码
Ctrl + F
全屏模式
F11
切换主题
Ctrl + Shift + D
显示快捷键
?
增大字号
Ctrl + =
减小字号
Ctrl + -