# Patch summary (explanatory preamble; text before the "diff --git" header is
# not part of any hunk).
#
# Target: test/extract_tags.py, one hunk (@@ -5,29 +5,26 @@).
#
# What the patched region of the script does, as visible in the hunk:
#   * builds an OptionParser with the USAGE string and a "-k" option stored
#     as "topK";
#   * if no positional argument is given, prints USAGE and exits with
#     status 1;
#   * takes args[0] as the input file name;
#   * uses topK = 10 when -k is absent, otherwise int(opt.topK);
#   * reads the whole file in 'rb' mode, passes the content to
#     jieba.analyse.extract_tags(content, topK=topK) and prints the tags
#     joined with ",".
#
# What the patch changes (formatting only, apart from the None comparison):
#   * adds spaces around "=" in the USAGE and topK assignments and after
#     commas in the add_option(), open() and extract_tags() calls;
#   * "len(args) <1" becomes "len(args) < 1";
#   * "opt.topK==None" becomes "opt.topK is None";
#   * the print/sys.exit lines and the "topK = int(opt.topK)" line are
#     removed and re-added with identical tokens, so presumably only their
#     indentation changes;
#   * the "content = ..." line moves relative to a neighbouring blank line and
#     trailing blank lines at the end of the file are dropped.
#
# NOTE(review): the line breaks of this patch have been collapsed into a
#   single line, so the original indentation and blank lines cannot be read
#   back from it; the line structure presumably has to be restored from the
#   original commit before the patch can be applied.
# NOTE(review): "import jieba" directly after the hunk range looks like the
#   hunk's section heading rather than a context line -- confirm against the
#   target file.
# NOTE(review): "print USAGE" / "print ..." use the Python 2 print statement.
# NOTE(review): sys.exit is used but no "import sys" appears in this hunk;
#   presumably it is imported above line 5 -- verify.
# NOTE(review): open(file_name, 'rb').read() never closes the file handle
#   explicitly; a "with" block would be the usual follow-up.
diff --git a/test/extract_tags.py b/test/extract_tags.py index 58e7de3..3298749 100644 --- a/test/extract_tags.py +++ b/test/extract_tags.py @@ -5,29 +5,26 @@ import jieba import jieba.analyse from optparse import OptionParser -USAGE ="usage: python extract_tags.py [file name] -k [top k]" +USAGE = "usage: python extract_tags.py [file name] -k [top k]" parser = OptionParser(USAGE) -parser.add_option("-k",dest="topK") +parser.add_option("-k", dest="topK") opt, args = parser.parse_args() -if len(args) <1: - print USAGE - sys.exit(1) +if len(args) < 1: + print USAGE + sys.exit(1) file_name = args[0] -if opt.topK==None: - topK=10 +if opt.topK is None: + topK = 10 else: - topK = int(opt.topK) + topK = int(opt.topK) +content = open(file_name, 'rb').read() -content = open(file_name,'rb').read() - -tags = jieba.analyse.extract_tags(content,topK=topK) +tags = jieba.analyse.extract_tags(content, topK=topK) print ",".join(tags) - -