From cc81135429e63fa11c2e4bac401d911a338bf024 Mon Sep 17 00:00:00 2001 From: gwdwyy Date: Tue, 20 Aug 2013 20:08:03 +0800 Subject: [PATCH] sed -i 's/not \(.*\) in/\1 not in/g' ... --- jieba/__init__.py | 12 ++++++------ jieba/posseg/__init__.py | 4 ++-- 2 files changed, 8 insertions(+), 8 deletions(-) diff --git a/jieba/__init__.py b/jieba/__init__.py index 307f8b8..36bdc2a 100644 --- a/jieba/__init__.py +++ b/jieba/__init__.py @@ -38,7 +38,7 @@ def gen_trie(f_name): ltotal+=freq p = trie for c in word: - if not c in p: + if c not in p: p[c] ={} p = p[c] p['']='' #ending flag @@ -150,7 +150,7 @@ def get_DAG(sentence): if c in p: p = p[c] if '' in p: - if not i in DAG: + if i not in DAG: DAG[i]=[] DAG[i].append(j) j+=1 @@ -163,7 +163,7 @@ def get_DAG(sentence): i+=1 j=i for i in xrange(len(sentence)): - if not i in DAG: + if i not in DAG: DAG[i] =[i] return DAG @@ -186,7 +186,7 @@ def __cut_DAG(sentence): yield buf buf=u'' else: - if not (buf in FREQ): + if (buf not in FREQ): regognized = finalseg.cut(buf) for t in regognized: yield t @@ -201,7 +201,7 @@ def __cut_DAG(sentence): if len(buf)==1: yield buf else: - if not (buf in FREQ): + if (buf not in FREQ): regognized = finalseg.cut(buf) for t in regognized: yield t @@ -281,7 +281,7 @@ def add_word(word, freq, tag=None): user_word_tag_tab[word] = tag.strip() p = trie for c in word: - if not c in p: + if c not in p: p[c] = {} p = p[c] p[''] = '' # ending flag diff --git a/jieba/posseg/__init__.py b/jieba/posseg/__init__.py index 40d0427..31013f2 100644 --- a/jieba/posseg/__init__.py +++ b/jieba/posseg/__init__.py @@ -136,7 +136,7 @@ def __cut_DAG(sentence): yield pair(buf,word_tag_tab.get(buf,'x')) buf=u'' else: - if not (buf in jieba.FREQ): + if (buf not in jieba.FREQ): regognized = __cut_detail(buf) for t in regognized: yield t @@ -151,7 +151,7 @@ def __cut_DAG(sentence): if len(buf)==1: yield pair(buf,word_tag_tab.get(buf,'x')) else: - if not (buf in jieba.FREQ): + if (buf not in jieba.FREQ): regognized = __cut_detail(buf) for t in regognized: yield t