文件名称:siuying_segment
介绍说明--下载内容来自于网络,使用问题请自行百度
以「我是中國人」為例,ChineseTokenizer 會將之分割為五個中文字:「我、是、中、國、人」,CJKTokenizer 則會將之分割為「我是、是中、中國、國人」四個由兩個字組成的詞。前者的問題是沒有考慮中文詞語的邊界,例如搜尋「國中」時同樣會搜尋到「我是中國人」。後者的問題則是製作了大量沒有意義的詞,如「是中」「國人」,讓索引不必要地增大、降低搜尋效率。
(系统自动生成,下载前可以参看下载内容)
下载文件列表
build.xml
src/org/apache/lucene/analysis/cjk/CJKAnalyzer.java
src/org/apache/lucene/analysis/cjk/CJKTokenizer.java
src/org/apache/lucene/analysis/cjk
src/org/apache/lucene/analysis/cn/ChineseAnalyzer.java
src/org/apache/lucene/analysis/cn/ChineseFilter.java
src/org/apache/lucene/analysis/cn/ChineseTokenizer.java
src/org/apache/lucene/analysis/cn
src/org/apache/lucene/analysis/cw/bothlexu8.txt
src/org/apache/lucene/analysis/cw/CharStream.java
src/org/apache/lucene/analysis/cw/CStandardTokenizer.java
src/org/apache/lucene/analysis/cw/CStandardTokenizer.jj
src/org/apache/lucene/analysis/cw/CStandardTokenizerConstants.java
src/org/apache/lucene/analysis/cw/CStandardTokenizerTokenManager.java
src/org/apache/lucene/analysis/cw/CWordAnalyzer.java
src/org/apache/lucene/analysis/cw/CWordFilter.java
src/org/apache/lucene/analysis/cw/CWordFilter.java~
src/org/apache/lucene/analysis/cw/CWordTokenizer.java
src/org/apache/lucene/analysis/cw/CWordTokenizer.java~
src/org/apache/lucene/analysis/cw/data/sforeign_u8.txt
src/org/apache/lucene/analysis/cw/data/snotname_u8.txt
src/org/apache/lucene/analysis/cw/data/snumbers_u8.txt
src/org/apache/lucene/analysis/cw/data/ssurname_u8.txt
src/org/apache/lucene/analysis/cw/data/tforeign_u8.txt
src/org/apache/lucene/analysis/cw/data/tnotname_u8.txt
src/org/apache/lucene/analysis/cw/data/tnumbers_u8.txt
src/org/apache/lucene/analysis/cw/data/tsurname_u8.txt
src/org/apache/lucene/analysis/cw/data
src/org/apache/lucene/analysis/cw/ParseException.java
src/org/apache/lucene/analysis/cw/Segmenter.jav.old
src/org/apache/lucene/analysis/cw/segmenter.java
src/org/apache/lucene/analysis/cw/segmenter.java~
src/org/apache/lucene/analysis/cw/SegmenterUtils.java
src/org/apache/lucene/analysis/cw/SegmenterUtils.java~
src/org/apache/lucene/analysis/cw/simplexu8.txt
src/org/apache/lucene/analysis/cw/test/SegmenterUtilsTest.java
src/org/apache/lucene/analysis/cw/test/SegmenterUtilsTest.java~
src/org/apache/lucene/analysis/cw/test
src/org/apache/lucene/analysis/cw/Token.java
src/org/apache/lucene/analysis/cw/TokenMgrError.java
src/org/apache/lucene/analysis/cw/tradlexu8.txt
src/org/apache/lucene/analysis/cw
src/org/apache/lucene/analysis
src/org/apache/lucene/demo/DeleteFiles.java
src/org/apache/lucene/demo/FileDocument.java
src/org/apache/lucene/demo/IndexCJKFiles.java
src/org/apache/lucene/demo/IndexFiles.java
src/org/apache/lucene/demo/SearchCJKFiles.java
src/org/apache/lucene/demo/SearchFiles.java
src/org/apache/lucene/demo
src/org/apache/lucene
src/org/apache
src/org
src
www.dssz.com.txt
src/org/apache/lucene/analysis/cjk/CJKAnalyzer.java
src/org/apache/lucene/analysis/cjk/CJKTokenizer.java
src/org/apache/lucene/analysis/cjk
src/org/apache/lucene/analysis/cn/ChineseAnalyzer.java
src/org/apache/lucene/analysis/cn/ChineseFilter.java
src/org/apache/lucene/analysis/cn/ChineseTokenizer.java
src/org/apache/lucene/analysis/cn
src/org/apache/lucene/analysis/cw/bothlexu8.txt
src/org/apache/lucene/analysis/cw/CharStream.java
src/org/apache/lucene/analysis/cw/CStandardTokenizer.java
src/org/apache/lucene/analysis/cw/CStandardTokenizer.jj
src/org/apache/lucene/analysis/cw/CStandardTokenizerConstants.java
src/org/apache/lucene/analysis/cw/CStandardTokenizerTokenManager.java
src/org/apache/lucene/analysis/cw/CWordAnalyzer.java
src/org/apache/lucene/analysis/cw/CWordFilter.java
src/org/apache/lucene/analysis/cw/CWordFilter.java~
src/org/apache/lucene/analysis/cw/CWordTokenizer.java
src/org/apache/lucene/analysis/cw/CWordTokenizer.java~
src/org/apache/lucene/analysis/cw/data/sforeign_u8.txt
src/org/apache/lucene/analysis/cw/data/snotname_u8.txt
src/org/apache/lucene/analysis/cw/data/snumbers_u8.txt
src/org/apache/lucene/analysis/cw/data/ssurname_u8.txt
src/org/apache/lucene/analysis/cw/data/tforeign_u8.txt
src/org/apache/lucene/analysis/cw/data/tnotname_u8.txt
src/org/apache/lucene/analysis/cw/data/tnumbers_u8.txt
src/org/apache/lucene/analysis/cw/data/tsurname_u8.txt
src/org/apache/lucene/analysis/cw/data
src/org/apache/lucene/analysis/cw/ParseException.java
src/org/apache/lucene/analysis/cw/Segmenter.jav.old
src/org/apache/lucene/analysis/cw/segmenter.java
src/org/apache/lucene/analysis/cw/segmenter.java~
src/org/apache/lucene/analysis/cw/SegmenterUtils.java
src/org/apache/lucene/analysis/cw/SegmenterUtils.java~
src/org/apache/lucene/analysis/cw/simplexu8.txt
src/org/apache/lucene/analysis/cw/test/SegmenterUtilsTest.java
src/org/apache/lucene/analysis/cw/test/SegmenterUtilsTest.java~
src/org/apache/lucene/analysis/cw/test
src/org/apache/lucene/analysis/cw/Token.java
src/org/apache/lucene/analysis/cw/TokenMgrError.java
src/org/apache/lucene/analysis/cw/tradlexu8.txt
src/org/apache/lucene/analysis/cw
src/org/apache/lucene/analysis
src/org/apache/lucene/demo/DeleteFiles.java
src/org/apache/lucene/demo/FileDocument.java
src/org/apache/lucene/demo/IndexCJKFiles.java
src/org/apache/lucene/demo/IndexFiles.java
src/org/apache/lucene/demo/SearchCJKFiles.java
src/org/apache/lucene/demo/SearchFiles.java
src/org/apache/lucene/demo
src/org/apache/lucene
src/org/apache
src/org
src
www.dssz.com.txt
本网站为编程资源及源代码搜集、介绍的搜索网站,版权归原作者所有! 粤ICP备11031372号
1999-2046 搜珍网 All Rights Reserved.