当前位置: 首页>>代码示例>>Java>>正文


Java ClassicAnalyzer类代码示例

本文整理汇总了Java中org.apache.lucene.analysis.standard.ClassicAnalyzer的典型用法代码示例。如果您正苦于以下问题：Java ClassicAnalyzer类的具体用法？Java ClassicAnalyzer怎么用？Java ClassicAnalyzer使用的例子？那么，这里精选的类代码示例或许可以为您提供帮助。


ClassicAnalyzer类属于org.apache.lucene.analysis.standard包，在下文中一共展示了ClassicAnalyzer类的15个代码示例，这些例子默认根据受欢迎程度排序。您可以为喜欢或者感觉有用的代码点赞，您的评价将有助于系统推荐出更棒的Java代码示例。

示例1: testMaxTermLength2

import org.apache.lucene.analysis.standard.ClassicAnalyzer; //导入依赖的package包/类
/**
 * Analyzes the same input twice on one analyzer instance: once with the
 * default settings and once after the maximum token length is lowered to 5.
 */
public void testMaxTermLength2() throws Exception {
  final String input = "ab cd toolong xy z";
  final ClassicAnalyzer analyzer = new ClassicAnalyzer();

  // Before the limit is changed, every word in the input is expected back.
  final String[] allWords = {"ab", "cd", "toolong", "xy", "z"};
  assertAnalyzesTo(analyzer, input, allWords);

  // After the limit drops to 5, the 7-character "toolong" is no longer expected.
  analyzer.setMaxTokenLength(5);
  final String[] shortWords = {"ab", "cd", "xy", "z"};
  // Presumably position increments (confirm against assertAnalyzesTo): the 2
  // sits on "xy", the first token after the dropped word.
  final int[] increments = {1, 1, 2, 1};
  assertAnalyzesTo(analyzer, input, shortWords, increments);
}
 
开发者ID:europeana,项目名称:search,代码行数:8,代码来源:TestClassicAnalyzer.java

示例2: testLucene1140

import org.apache.lucene.analysis.standard.ClassicAnalyzer; //导入依赖的package包/类
/**
 * Analyzes a host name with a trailing dot and fails the test explicitly if
 * a {@link NullPointerException} is raised while doing so.
 */
public void testLucene1140() throws Exception {
  final String[] expectedTerms = {"www.nutch.org"};
  // Presumably the expected token types (confirm against assertAnalyzesTo).
  final String[] expectedTypes = {"<HOST>"};
  try {
    assertAnalyzesTo(new ClassicAnalyzer(), "www.nutch.org.", expectedTerms, expectedTypes);
  } catch (NullPointerException npe) {
    // Turn the NPE into a regular test failure with a descriptive message.
    fail("Should not throw an NPE and it did");
  }
}
 
开发者ID:europeana,项目名称:search,代码行数:10,代码来源:TestClassicAnalyzer.java

示例3: testMaxTermLength2

import org.apache.lucene.analysis.standard.ClassicAnalyzer; //导入依赖的package包/类
/**
 * Runs one input through a single analyzer twice, first with the default
 * maximum token length and then with the maximum lowered to 5.
 */
public void testMaxTermLength2() throws Exception {
  final String text = "ab cd toolong xy z";
  final ClassicAnalyzer classic = new ClassicAnalyzer(TEST_VERSION_CURRENT);

  // Default limit: all five words are expected as tokens.
  final String[] everyWord = {"ab", "cd", "toolong", "xy", "z"};
  assertAnalyzesTo(classic, text, everyWord);

  classic.setMaxTokenLength(5);

  // Limit of 5: "toolong" (7 characters) is expected to be missing.
  final String[] withoutLongWord = {"ab", "cd", "xy", "z"};
  // Presumably position increments (confirm against assertAnalyzesTo); the 2
  // belongs to "xy", the token following the missing word.
  final int[] gaps = {1, 1, 2, 1};
  assertAnalyzesTo(classic, text, withoutLongWord, gaps);
}
 
开发者ID:pkarmstr,项目名称:NYBC,代码行数:8,代码来源:TestClassicAnalyzer.java

示例4: testLucene1140

import org.apache.lucene.analysis.standard.ClassicAnalyzer; //导入依赖的package包/类
/**
 * Feeds a dot-terminated host name to the analyzer; a
 * {@link NullPointerException} during analysis is reported as a test failure.
 */
public void testLucene1140() throws Exception {
  final String[] terms = {"www.nutch.org"};
  // Presumably the expected token types (confirm against assertAnalyzesTo).
  final String[] types = {"<HOST>"};
  try {
    final ClassicAnalyzer classic = new ClassicAnalyzer(TEST_VERSION_CURRENT);
    assertAnalyzesTo(classic, "www.nutch.org.", terms, types);
  } catch (NullPointerException npe) {
    // Report the NPE as an ordinary failure rather than letting it propagate.
    fail("Should not throw an NPE and it did");
  }
}
 
开发者ID:pkarmstr,项目名称:NYBC,代码行数:10,代码来源:TestClassicAnalyzer.java

示例5: testMaxTermLength

import org.apache.lucene.analysis.standard.ClassicAnalyzer; //导入依赖的package包/类
/**
 * With the maximum token length set to 5, the 7-character word "toolong" is
 * expected to be absent from the analyzed output.
 */
public void testMaxTermLength() throws Exception {
  final ClassicAnalyzer analyzer = new ClassicAnalyzer();
  analyzer.setMaxTokenLength(5);

  final String[] expected = {"ab", "cd", "xy", "z"};
  assertAnalyzesTo(analyzer, "ab cd toolong xy z", expected);
}
 
开发者ID:europeana,项目名称:search,代码行数:6,代码来源:TestClassicAnalyzer.java

示例6: testJava14BWCompatibility

import org.apache.lucene.analysis.standard.ClassicAnalyzer; //导入依赖的package包/类
/**
 * Analyzes two words joined by the character U+02C6 with an analyzer created
 * for {@code Version.LUCENE_3_0}; two separate "test" tokens are expected.
 */
public void testJava14BWCompatibility() throws Exception {
  final String[] expected = {"test", "test"};
  assertAnalyzesTo(new ClassicAnalyzer(Version.LUCENE_3_0), "test\u02C6test", expected);
}
 
开发者ID:europeana,项目名称:search,代码行数:5,代码来源:TestClassicAnalyzer.java

示例7: testWickedLongTerm

import org.apache.lucene.analysis.standard.ClassicAnalyzer; //导入依赖的package包/类
/**
 * Make sure we skip wicked long terms.
 *
 * <p>The test runs in two phases against the same in-memory directory:
 * <ol>
 *   <li>Index a document whose text contains a word one character longer than
 *       {@link IndexWriter#MAX_TERM_LENGTH}, plus a second ordinary document,
 *       then check that the ordinary terms, the position of the term following
 *       the long word, and the document count are as expected.</li>
 *   <li>Re-open a writer with the analyzer's maximum token length raised to
 *       100000 and index a word of exactly {@code MAX_TERM_LENGTH} characters,
 *       then check that this word can be looked up.</li>
 * </ol>
 *
 * @throws IOException if reading from or writing to the index fails
 */
public void testWickedLongTerm() throws IOException {
  RAMDirectory dir = new RAMDirectory();
  IndexWriter writer = new IndexWriter(dir, new IndexWriterConfig(TEST_VERSION_CURRENT, new ClassicAnalyzer()));

  // A run of 'x' characters exactly MAX_TERM_LENGTH long.
  char[] chars = new char[IndexWriter.MAX_TERM_LENGTH];
  Arrays.fill(chars, 'x');
  Document doc = new Document();
  final String bigTerm = new String(chars);

  // This produces a too-long term: the extra leading "x" makes the word
  // one character longer than MAX_TERM_LENGTH.
  String contents = "abc xyz x" + bigTerm + " another term";
  doc.add(new TextField("content", contents, Field.Store.NO));
  writer.addDocument(doc);

  // Make sure we can add another normal document
  doc = new Document();
  doc.add(new TextField("content", "abc bbb ccc", Field.Store.NO));
  writer.addDocument(doc);
  writer.close();

  IndexReader reader = IndexReader.open(dir);

  // Make sure all terms < max size were indexed
  // ("abc" appears in both documents, the others in one each).
  assertEquals(2, reader.docFreq(new Term("content", "abc")));
  assertEquals(1, reader.docFreq(new Term("content", "bbb")));
  assertEquals(1, reader.docFreq(new Term("content", "term")));
  assertEquals(1, reader.docFreq(new Term("content", "another")));

  // Make sure position is still incremented when
  // massive term is skipped: "another" is the fourth word of the
  // first document, so it is expected at position 3.
  DocsAndPositionsEnum tps = MultiFields.getTermPositionsEnum(reader,
                                                              MultiFields.getLiveDocs(reader),
                                                              "content",
                                                              new BytesRef("another"));
  assertTrue(tps.nextDoc() != DocIdSetIterator.NO_MORE_DOCS);
  assertEquals(1, tps.freq());
  assertEquals(3, tps.nextPosition());

  // Make sure the doc that has the massive term is in
  // the index:
  assertEquals("document with wicked long term is not in the index!", 2, reader.numDocs());

  reader.close();

  // Make sure we can add a document with exactly the
  // maximum length term, and search on that term:
  doc = new Document();
  doc.add(new TextField("content", bigTerm, Field.Store.NO));
  ClassicAnalyzer sa = new ClassicAnalyzer();
  // Raise the analyzer's token limit before indexing the maximum-length word.
  sa.setMaxTokenLength(100000);
  writer = new IndexWriter(dir, new IndexWriterConfig(TEST_VERSION_CURRENT, sa));
  writer.addDocument(doc);
  writer.close();
  reader = IndexReader.open(dir);
  assertEquals(1, reader.docFreq(new Term("content", bigTerm)));
  reader.close();

  dir.close();
}
 
开发者ID:europeana,项目名称:search,代码行数:63,代码来源:TestClassicAnalyzer.java

示例8: testRandomStrings

import org.apache.lucene.analysis.standard.ClassicAnalyzer; //导入依赖的package包/类
/**
 * Pushes randomly generated input through a fresh {@link ClassicAnalyzer},
 * with the amount of work scaled by {@code RANDOM_MULTIPLIER}.
 */
public void testRandomStrings() throws Exception {
  final int iterations = 1000 * RANDOM_MULTIPLIER;
  checkRandomData(
      random(),
      new ClassicAnalyzer(),
      iterations);
}
 
开发者ID:europeana,项目名称:search,代码行数:5,代码来源:TestClassicAnalyzer.java

示例9: testRandomHugeStrings

import org.apache.lucene.analysis.standard.ClassicAnalyzer; //导入依赖的package包/类
/**
 * Pushes randomly generated large input through a fresh
 * {@link ClassicAnalyzer}, with the amount of work scaled by
 * {@code RANDOM_MULTIPLIER}.
 */
public void testRandomHugeStrings() throws Exception {
  final Random rnd = random();
  final int iterations = 100 * RANDOM_MULTIPLIER;
  // Presumably the maximum generated word length (confirm against checkRandomData).
  final int sizeLimit = 8192;
  checkRandomData(rnd, new ClassicAnalyzer(), iterations, sizeLimit);
}
 
开发者ID:europeana,项目名称:search,代码行数:6,代码来源:TestClassicAnalyzer.java

示例10: testGetClassic

import org.apache.lucene.analysis.standard.ClassicAnalyzer; //导入依赖的package包/类
/**
 * Checks that the object returned by {@code PreBuiltAnalyzers.CLASSIC.get()}
 * is exactly of type {@link ClassicAnalyzer}.
 */
@Test
public void testGetClassic() {
    final Analyzer built = PreBuiltAnalyzers.CLASSIC.get();
    final Class<?> builtType = built.getClass();
    Assert.assertEquals(ClassicAnalyzer.class, builtType);
}
 
开发者ID:Stratio,项目名称:stratio-cassandra,代码行数:6,代码来源:PreBuiltAnalyzersTest.java

示例11: testMaxTermLength

import org.apache.lucene.analysis.standard.ClassicAnalyzer; //导入依赖的package包/类
/**
 * Lowers the maximum token length to 5 and checks that the 7-character word
 * "toolong" is not among the expected tokens.
 */
public void testMaxTermLength() throws Exception {
  final ClassicAnalyzer classic = new ClassicAnalyzer(TEST_VERSION_CURRENT);
  classic.setMaxTokenLength(5);

  final String[] survivors = {"ab", "cd", "xy", "z"};
  assertAnalyzesTo(classic, "ab cd toolong xy z", survivors);
}
 
开发者ID:pkarmstr,项目名称:NYBC,代码行数:6,代码来源:TestClassicAnalyzer.java

示例12: testJava14BWCompatibility

import org.apache.lucene.analysis.standard.ClassicAnalyzer; //导入依赖的package包/类
/**
 * Uses an analyzer created for {@code Version.LUCENE_30} on two words joined
 * by the character U+02C6 and expects them to come back as two "test" tokens.
 */
public void testJava14BWCompatibility() throws Exception {
  final String[] tokens = {"test", "test"};
  assertAnalyzesTo(new ClassicAnalyzer(Version.LUCENE_30), "test\u02C6test", tokens);
}
 
开发者ID:pkarmstr,项目名称:NYBC,代码行数:5,代码来源:TestClassicAnalyzer.java

示例13: testWickedLongTerm

import org.apache.lucene.analysis.standard.ClassicAnalyzer; //导入依赖的package包/类
/**
 * Make sure we skip wicked long terms.
 *
 * <p>The test runs in two phases against the same in-memory directory:
 * <ol>
 *   <li>Index a document whose text contains a word one character longer than
 *       {@link IndexWriter#MAX_TERM_LENGTH}, plus a second ordinary document,
 *       then check that the ordinary terms, the position of the term following
 *       the long word, and the document count are as expected.</li>
 *   <li>Re-open a writer with the analyzer's maximum token length raised to
 *       100000 and index a word of exactly {@code MAX_TERM_LENGTH} characters,
 *       then check that this word can be looked up.</li>
 * </ol>
 *
 * @throws IOException if reading from or writing to the index fails
 */
public void testWickedLongTerm() throws IOException {
  RAMDirectory dir = new RAMDirectory();
  IndexWriter writer = new IndexWriter(dir, new IndexWriterConfig(
    TEST_VERSION_CURRENT, new ClassicAnalyzer(TEST_VERSION_CURRENT)));

  // A run of 'x' characters exactly MAX_TERM_LENGTH long.
  char[] chars = new char[IndexWriter.MAX_TERM_LENGTH];
  Arrays.fill(chars, 'x');
  Document doc = new Document();
  final String bigTerm = new String(chars);

  // This produces a too-long term: the extra leading "x" makes the word
  // one character longer than MAX_TERM_LENGTH.
  String contents = "abc xyz x" + bigTerm + " another term";
  doc.add(new TextField("content", contents, Field.Store.NO));
  writer.addDocument(doc);

  // Make sure we can add another normal document
  doc = new Document();
  doc.add(new TextField("content", "abc bbb ccc", Field.Store.NO));
  writer.addDocument(doc);
  writer.close();

  IndexReader reader = IndexReader.open(dir);

  // Make sure all terms < max size were indexed
  // ("abc" appears in both documents, the others in one each).
  assertEquals(2, reader.docFreq(new Term("content", "abc")));
  assertEquals(1, reader.docFreq(new Term("content", "bbb")));
  assertEquals(1, reader.docFreq(new Term("content", "term")));
  assertEquals(1, reader.docFreq(new Term("content", "another")));

  // Make sure position is still incremented when
  // massive term is skipped: "another" is the fourth word of the
  // first document, so it is expected at position 3.
  DocsAndPositionsEnum tps = MultiFields.getTermPositionsEnum(reader,
                                                              MultiFields.getLiveDocs(reader),
                                                              "content",
                                                              new BytesRef("another"));
  assertTrue(tps.nextDoc() != DocIdSetIterator.NO_MORE_DOCS);
  assertEquals(1, tps.freq());
  assertEquals(3, tps.nextPosition());

  // Make sure the doc that has the massive term is in
  // the index:
  assertEquals("document with wicked long term is not in the index!", 2, reader.numDocs());

  reader.close();

  // Make sure we can add a document with exactly the
  // maximum length term, and search on that term:
  doc = new Document();
  doc.add(new TextField("content", bigTerm, Field.Store.NO));
  ClassicAnalyzer sa = new ClassicAnalyzer(TEST_VERSION_CURRENT);
  // Raise the analyzer's token limit before indexing the maximum-length word.
  sa.setMaxTokenLength(100000);
  writer = new IndexWriter(dir, new IndexWriterConfig(TEST_VERSION_CURRENT, sa));
  writer.addDocument(doc);
  writer.close();
  reader = IndexReader.open(dir);
  assertEquals(1, reader.docFreq(new Term("content", bigTerm)));
  reader.close();

  dir.close();
}
 
开发者ID:pkarmstr,项目名称:NYBC,代码行数:64,代码来源:TestClassicAnalyzer.java

示例14: testRandomStrings

import org.apache.lucene.analysis.standard.ClassicAnalyzer; //导入依赖的package包/类
/**
 * Runs randomly generated input through a new {@link ClassicAnalyzer}; the
 * amount of work is scaled by {@code RANDOM_MULTIPLIER}.
 */
public void testRandomStrings() throws Exception {
  final int rounds = 1000 * RANDOM_MULTIPLIER;
  checkRandomData(
      random(),
      new ClassicAnalyzer(TEST_VERSION_CURRENT),
      rounds);
}
 
开发者ID:pkarmstr,项目名称:NYBC,代码行数:5,代码来源:TestClassicAnalyzer.java

示例15: testRandomHugeStrings

import org.apache.lucene.analysis.standard.ClassicAnalyzer; //导入依赖的package包/类
/**
 * Runs randomly generated large input through a new
 * {@link ClassicAnalyzer}; the amount of work is scaled by
 * {@code RANDOM_MULTIPLIER}.
 */
public void testRandomHugeStrings() throws Exception {
  final Random source = random();
  final int rounds = 100 * RANDOM_MULTIPLIER;
  // Presumably the maximum generated word length (confirm against checkRandomData).
  final int lengthCap = 8192;
  checkRandomData(source, new ClassicAnalyzer(TEST_VERSION_CURRENT), rounds, lengthCap);
}
 
开发者ID:pkarmstr,项目名称:NYBC,代码行数:6,代码来源:TestClassicAnalyzer.java


注:本文中的org.apache.lucene.analysis.standard.ClassicAnalyzer类示例由纯净天空整理自Github/MSDocs等开源代码及文档管理平台,相关代码片段筛选自各路编程大神贡献的开源项目,源码版权归原作者所有,传播和使用请参考对应项目的License;未经允许,请勿转载。