Lowercase input before checking the dictionaries
This commit is contained in:
parent
6480991bbb
commit
a542bbc229
@ -198,3 +198,8 @@ here is the query result
|
||||
|
||||
|
||||
have fun.
|
||||
|
||||
常见问题:
|
||||
|
||||
1.自定义词典为什么没有生效?
|
||||
请确保你的扩展词典的文本格式为UTF8编码
|
4
pom.xml
4
pom.xml
@ -6,7 +6,7 @@
|
||||
<modelVersion>4.0.0</modelVersion>
|
||||
<groupId>org.elasticsearch</groupId>
|
||||
<artifactId>elasticsearch-analysis-ik</artifactId>
|
||||
<version>1.2.3</version>
|
||||
<version>1.2.4</version>
|
||||
<packaging>jar</packaging>
|
||||
<description>IK Analyzer for ElasticSearch</description>
|
||||
<inceptionYear>2009</inceptionYear>
|
||||
@ -31,7 +31,7 @@
|
||||
</parent>
|
||||
|
||||
<properties>
|
||||
<elasticsearch.version>0.90.6</elasticsearch.version>
|
||||
<elasticsearch.version>0.90.2</elasticsearch.version>
|
||||
</properties>
|
||||
|
||||
<repositories>
|
||||
|
@ -25,14 +25,14 @@
|
||||
*/
|
||||
package org.wltea.analyzer.dic;
|
||||
|
||||
import java.io.*;
|
||||
import java.util.Collection;
|
||||
import java.util.List;
|
||||
|
||||
import org.elasticsearch.common.logging.ESLogger;
|
||||
import org.elasticsearch.common.logging.Loggers;
|
||||
import org.wltea.analyzer.cfg.Configuration;
|
||||
|
||||
import java.io.*;
|
||||
import java.util.Collection;
|
||||
import java.util.List;
|
||||
|
||||
/**
|
||||
* 词典管理类,单子模式
|
||||
*/
|
||||
@ -152,7 +152,7 @@ public class Dictionary {
|
||||
* @return Hit 匹配结果描述
|
||||
*/
|
||||
public Hit matchInMainDict(char[] charArray , int begin, int length){
|
||||
return singleton._MainDict.match(charArray, begin, length);
|
||||
return singleton._MainDict.match(String.valueOf(charArray).trim().toLowerCase().toCharArray(), begin, length);
|
||||
}
|
||||
|
||||
/**
|
||||
@ -160,7 +160,7 @@ public class Dictionary {
|
||||
* @return Hit 匹配结果描述
|
||||
*/
|
||||
public Hit matchInQuantifierDict(char[] charArray , int begin, int length){
|
||||
return singleton._QuantifierDict.match(charArray, begin, length);
|
||||
return singleton._QuantifierDict.match(String.valueOf(charArray).trim().toLowerCase().toCharArray(), begin, length);
|
||||
}
|
||||
|
||||
|
||||
@ -179,7 +179,7 @@ public class Dictionary {
|
||||
* @return boolean
|
||||
*/
|
||||
public boolean isStopWord(char[] charArray , int begin, int length){
|
||||
return singleton._StopWords.match(charArray, begin, length).isMatch();
|
||||
return singleton._StopWords.match(String.valueOf(charArray).trim().toLowerCase().toCharArray(), begin, length).isMatch();
|
||||
}
|
||||
|
||||
/**
|
||||
@ -253,7 +253,7 @@ public class Dictionary {
|
||||
String theWord = null;
|
||||
do {
|
||||
theWord = br.readLine();
|
||||
if (theWord != null && !"".equals(theWord.trim())) {
|
||||
if (theWord != null && !"".equals(theWord.trim())) {
|
||||
//加载扩展词典数据到主内存词典中
|
||||
_MainDict.fillSegment(theWord.trim().toLowerCase().toCharArray());
|
||||
}
|
||||
|
Loading…
x
Reference in New Issue
Block a user