?? testrussiananalyzer.java

?? Lucene a java open-source SearchEngine Framework
?? JAVA
字號:
package org.apache.lucene.analysis.ru;

/**
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

import junit.framework.TestCase;

import java.io.*;

import org.apache.lucene.analysis.TokenStream;
import org.apache.lucene.analysis.Token;

/**
 * Test case for RussianAnalyzer.
 *
 * Each test runs a text file through a {@link RussianAnalyzer} built for one
 * charset table and compares the resulting terms, in order, against the terms
 * that a {@link RussianLetterTokenizer} reads from a matching sample file.
 * Both files are resolved relative to the directory named by the
 * <code>dataDir</code> system property (default <code>./bin</code>).
 *
 * @version   $Id: TestRussianAnalyzer.java 564236 2007-08-09 15:21:19Z gsingers $
 */
public class TestRussianAnalyzer extends TestCase
{
    /** Root directory under which the test and sample files are looked up. */
    private File dataDir;

    /**
     * Resolves the data directory from the <code>dataDir</code> system
     * property, falling back to <code>./bin</code>.
     */
    protected void setUp() throws Exception
    {
        super.setUp();
        dataDir = new File(System.getProperty("dataDir", "./bin"));
    }

    /**
     * Compares analyzer output with the sample for the Unicode charset table.
     *
     * @throws IOException if a data file cannot be opened or read
     */
    public void testUnicode() throws IOException
    {
        RussianAnalyzer ra = new RussianAnalyzer(RussianCharsets.UnicodeRussian);

        InputStreamReader inWords =
            openDataFile("/org/apache/lucene/analysis/ru/testUnicode.txt", "Unicode");
        try
        {
            InputStreamReader sampleUnicode =
                openDataFile("/org/apache/lucene/analysis/ru/resUnicode.htm", "Unicode");
            try
            {
                TokenStream in = ra.tokenStream("all", inWords);
                RussianLetterTokenizer sample =
                    new RussianLetterTokenizer(
                        sampleUnicode,
                        RussianCharsets.UnicodeRussian);

                assertSameTerms("Unicode", in, sample);
            }
            finally
            {
                sampleUnicode.close();
            }
        }
        finally
        {
            inWords.close();
        }
    }

    /**
     * Compares analyzer output with the sample for the KOI8 charset table.
     * The files are decoded as iso-8859-1, exactly as the original test did.
     *
     * @throws IOException if a data file cannot be opened or read
     */
    public void testKOI8() throws IOException
    {
        RussianAnalyzer ra = new RussianAnalyzer(RussianCharsets.KOI8);

        InputStreamReader inWordsKOI8 =
            openDataFile("/org/apache/lucene/analysis/ru/testKOI8.txt", "iso-8859-1");
        try
        {
            InputStreamReader sampleKOI8 =
                openDataFile("/org/apache/lucene/analysis/ru/resKOI8.htm", "iso-8859-1");
            try
            {
                TokenStream in = ra.tokenStream("all", inWordsKOI8);
                RussianLetterTokenizer sample =
                    new RussianLetterTokenizer(
                        sampleKOI8,
                        RussianCharsets.KOI8);

                assertSameTerms("KOI8", in, sample);
            }
            finally
            {
                sampleKOI8.close();
            }
        }
        finally
        {
            inWordsKOI8.close();
        }
    }

    /**
     * Compares analyzer output with the sample for the CP1251 charset table.
     * The files are decoded as iso-8859-1, exactly as the original test did.
     *
     * @throws IOException if a data file cannot be opened or read
     */
    public void test1251() throws IOException
    {
        InputStreamReader inWords1251 =
            openDataFile("/org/apache/lucene/analysis/ru/test1251.txt", "iso-8859-1");
        try
        {
            InputStreamReader sample1251 =
                openDataFile("/org/apache/lucene/analysis/ru/res1251.htm", "iso-8859-1");
            try
            {
                RussianAnalyzer ra = new RussianAnalyzer(RussianCharsets.CP1251);
                TokenStream in = ra.tokenStream("", inWords1251);
                RussianLetterTokenizer sample =
                    new RussianLetterTokenizer(
                        sample1251,
                        RussianCharsets.CP1251);

                assertSameTerms("1251", in, sample);
            }
            finally
            {
                sample1251.close();
            }
        }
        finally
        {
            inWords1251.close();
        }
    }

    /**
     * Opens a file below {@link #dataDir} as a character stream.
     *
     * @param relativePath path of the file relative to the data directory
     * @param encoding     charset name used to decode the file
     * @return an open reader; the caller is responsible for closing it
     * @throws IOException if the file cannot be opened or the encoding is
     *                     not supported
     */
    private InputStreamReader openDataFile(String relativePath, String encoding)
        throws IOException
    {
        FileInputStream stream = new FileInputStream(new File(dataDir, relativePath));
        try
        {
            return new InputStreamReader(stream, encoding);
        }
        catch (UnsupportedEncodingException e)
        {
            // The reader was never created, so nobody else will close the stream.
            stream.close();
            throw e;
        }
    }

    /**
     * Asserts that every term produced by <code>actual</code> equals the term
     * at the same position in <code>expected</code>.
     *
     * The loop is driven by <code>actual</code>: if <code>expected</code> runs
     * out first, the missing term is compared as <code>null</code> and the
     * assertion fails. Terms left over in <code>expected</code> after
     * <code>actual</code> is exhausted are not checked (same as the original
     * test).
     *
     * @param label    message passed to the assertion, identifying the charset
     * @param actual   token stream under test
     * @param expected token stream providing the reference terms
     * @throws IOException if either stream fails while reading
     */
    private static void assertSameTerms(String label, TokenStream actual, TokenStream expected)
        throws IOException
    {
        for (Token token = actual.next(); token != null; token = actual.next())
        {
            Token sampleToken = expected.next();
            String expectedText = (sampleToken == null) ? null : sampleToken.termText();
            assertEquals(label, token.termText(), expectedText);
        }
    }
}
?? 文件大小 5390 K
?? 上傳用戶 rickie936
?? 所屬分類 Java編程
??? 相關標簽

#SearchEngine #open-source #Framework #Lucene
?? 快捷鍵說明

復制代碼 Ctrl + C
搜索代碼 Ctrl + F
全屏模式 F11
切換主題 Ctrl + Shift + D
顯示快捷鍵 ?
增大字號 Ctrl + =
減小字號 Ctrl + -
亚洲欧美第一页_禁久久精品乱码_粉嫩av一区二区三区免费野_久草精品视频

?? testrussiananalyzer.java

?? 快捷鍵說明