当前位置: 首页>>代码示例>>Java>>正文


Java BuildIndex.run方法代码示例

本文整理汇总了Java中org.lemurproject.galago.core.tools.apps.BuildIndex.run方法的典型用法代码示例。如果您正苦于以下问题：Java BuildIndex.run方法的具体用法？Java BuildIndex.run怎么用？Java BuildIndex.run使用的例子？那么，这里精选的方法代码示例或许可以为您提供帮助。您也可以进一步了解该方法所在类org.lemurproject.galago.core.tools.apps.BuildIndex的用法示例。


在下文中一共展示了BuildIndex.run方法的4个代码示例，这些例子默认根据受欢迎程度排序。您可以为喜欢或者感觉有用的代码点赞，您的评价将有助于系统推荐出更棒的Java代码示例。

示例1: run

import org.lemurproject.galago.core.tools.apps.BuildIndex; //导入方法依赖的package包/类
/**
 * Dumps every fact of the Athena dataset into a temporary file (one printed
 * {@code Parameters} record per line, carrying {@code name}, {@code text} and
 * a nested {@code meta.year}) and then runs {@link BuildIndex} over that file.
 *
 * <p>The temporary file is removed even when dumping or indexing fails, and
 * the writer is always closed.
 *
 * @param argp tool arguments; must contain {@code indexPath}. A clone of it is
 *             extended with {@code fields}, {@code filetype} and
 *             {@code inputPath} before being handed to {@link BuildIndex}.
 * @throws Exception if the dataset cannot be loaded, the temporary file cannot
 *                   be written, or the index build fails
 */
@Override
public void run(Parameters argp) throws Exception {
  System.err.println(argp.getString("indexPath"));
  List<FactQuery> facts = Athena.init(argp).getDataset().getAllFacts();

  File temp = FileUtility.createTemporary();
  try {
    // try-with-resources: the writer is closed even if serialization throws.
    try (PrintWriter pw = new PrintWriter(temp)) {
      for (FactQuery fq : facts) {
        pw.println(Parameters.parseArray(
            "name", fq.id,
            "text", fq.text,
            "meta", Parameters.parseArray(
                "year", fq.rel
            )
        ));
      }
      // PrintWriter never throws on write failure; surface it explicitly so
      // we do not build an index from a truncated input file.
      if (pw.checkError()) {
        throw new java.io.IOException(
            "Failed writing facts to temporary file: " + temp.getAbsolutePath());
      }
    }

    Parameters buildP = argp.clone();
    buildP.put("fields", "a");
    // The dumped records are read back with JSONDocParser.
    buildP.put("filetype", JSONDocParser.class.getName());
    buildP.put("inputPath", temp.getAbsolutePath());

    BuildIndex build = new BuildIndex();
    build.run(buildP, System.out);
  } finally {
    // Always attempt cleanup, including on failure paths.
    System.out.println("Cleaned up temporary file:"+temp.delete());
  }
}
 
开发者ID:jjfiv,项目名称:ecir2015timebooks,代码行数:31,代码来源:CreateFactIndex.java

示例2: testDefaultyBehavior

import org.lemurproject.galago.core.tools.apps.BuildIndex; //导入方法依赖的package包/类
/**
 * Indexes a directory holding one file of each supported format, relying on
 * file extensions alone (no {@code filetype} or parser overrides), and checks
 * the resulting collection and postings statistics.
 */
@Test
public void testDefaultyBehavior() throws Exception {
    File index = FileUtility.createTemporaryDirectory();
    File dataDir = FileUtility.createTemporaryDirectory();
    try {

        createTxtDoc(dataDir, "d1.txt"); // 1 doc
        createXMLDoc(dataDir, "d2.xml"); // 1 doc
        createTrecTextDoc(dataDir, "d3.trectext"); // 10 docs
        createTrecWebDoc(dataDir, "d4.trecweb"); // 10 docs
        createTwitterDoc(dataDir, "d5.twitter"); // 10 docs

        Parameters p = Parameters.create();
        p.set("inputPath", Collections.singletonList(dataDir.getAbsolutePath()));
        p.set("indexPath", index.getAbsolutePath());

        BuildIndex bi = new BuildIndex();
        bi.run(p, System.err);

        Retrieval ret = RetrievalFactory.instance(index.getAbsolutePath(), Parameters.create());
        try {
            // JUnit convention: expected value first, actual value second.
            FieldStatistics cs = ret.getCollectionStatistics("#lengths:part=lengths()");
            assertEquals(553, cs.collectionLength);
            assertEquals(32, cs.documentCount);
            assertEquals(22, cs.maxLength);
            assertEquals(11, cs.minLength);

            IndexPartStatistics is1 = ret.getIndexPartStatistics("postings");
            assertEquals(553, is1.collectionLength);

            IndexPartStatistics is2 = ret.getIndexPartStatistics("postings.krovetz");
            assertEquals(553, is2.collectionLength);

            // should have about the same vocabs
            assertEquals(is1.vocabCount, is2.vocabCount);
        } finally {
            // Release the index before its directory is deleted below.
            ret.close();
        }

    } finally {
        FSUtil.deleteDirectory(index);
        FSUtil.deleteDirectory(dataDir);
    }
}
 
开发者ID:teanalab,项目名称:demidovii,代码行数:42,代码来源:UniversalParserTest.java

示例3: testAllIsOneBehavior

import org.lemurproject.galago.core.tools.apps.BuildIndex; //导入方法依赖的package包/类
/**
 * Indexes six extension-less files (alternating txt and XML content) with
 * {@code filetype} forced to {@code "txt"}, and checks that all six are
 * indexed as single documents with the expected statistics.
 */
@Test
public void testAllIsOneBehavior() throws Exception {
    File index = FileUtility.createTemporaryDirectory();
    File dataDir = FileUtility.createTemporaryDirectory();
    try {

        createTxtDoc(dataDir, "d1"); // 1 doc
        createXMLDoc(dataDir, "d2"); // 1 doc
        createTxtDoc(dataDir, "d3"); // 1 doc
        createXMLDoc(dataDir, "d4"); // 1 doc
        createTxtDoc(dataDir, "d5"); // 1 doc
        createXMLDoc(dataDir, "d6"); // 1 doc

        Parameters p = Parameters.create();
        p.set("inputPath", Collections.singletonList(dataDir.getAbsolutePath()));
        p.set("indexPath", index.getAbsolutePath());
        // Force a single file type for every input file.
        p.set("filetype", "txt");

        BuildIndex bi = new BuildIndex();
        bi.run(p, System.err);

        Retrieval ret = RetrievalFactory.instance(index.getAbsolutePath(), Parameters.create());
        try {
            // JUnit convention: expected value first, actual value second.
            FieldStatistics cs = ret.getCollectionStatistics("#lengths:part=lengths()");
            assertEquals(129, cs.collectionLength);
            assertEquals(6, cs.documentCount);
            assertEquals(22, cs.maxLength);
            assertEquals(21, cs.minLength);

            IndexPartStatistics is1 = ret.getIndexPartStatistics("postings");
            assertEquals(129, is1.collectionLength);

            IndexPartStatistics is2 = ret.getIndexPartStatistics("postings.krovetz");
            assertEquals(129, is2.collectionLength);

            // should have about the same vocabs
            assertEquals(is1.vocabCount, is2.vocabCount);
        } finally {
            // Release the index before its directory is deleted below.
            ret.close();
        }

    } finally {
        FSUtil.deleteDirectory(index);
        FSUtil.deleteDirectory(dataDir);
    }
}
 
开发者ID:teanalab,项目名称:demidovii,代码行数:44,代码来源:UniversalParserTest.java

示例4: testManualOverrideBehavior

import org.lemurproject.galago.core.tools.apps.BuildIndex; //导入方法依赖的package包/类
/**
 * Indexes files whose extensions are mapped to parser classes through
 * {@code parser.externalParsers}: two custom extensions ({@code qqe},
 * {@code qwe}) and an override that routes {@code trecweb} files to
 * {@link TrecTextParser}. Checks the resulting collection statistics.
 */
@Test
public void testManualOverrideBehavior() throws Exception {
    File index = FileUtility.createTemporaryDirectory();
    File dataDir = FileUtility.createTemporaryDirectory();
    try {

        createTrecTextDoc(dataDir, "d1.qqe"); // 10 docs - trectext
        createTrecWebDoc(dataDir, "d2.qwe"); // 10 docs - trecweb
        createTrecTextDoc(dataDir, "d3.trectext"); // 10 docs - trectext
        createTrecWebDoc(dataDir, "d4.trecweb"); // 10 docs - trecweb content, parsed as trectext via the override below
        createTxtDoc(dataDir, "d5.txt"); // 1 docs - txt

        Parameters p = Parameters.create();
        p.set("inputPath", Collections.singletonList(dataDir.getAbsolutePath()));
        p.set("indexPath", index.getAbsolutePath());
        p.set("parser", Parameters.create());

        // Extension -> parser class mappings supplied as externalParsers.
        List<Parameters> kinds = new ArrayList<Parameters>();
        kinds.add(Parameters.parseString("{\"filetype\" : \"qqe\", \"class\" :\"" + TrecTextParser.class.getName() + "\"}"));
        kinds.add(Parameters.parseString("{\"filetype\" : \"qwe\", \"class\" :\"" + TrecWebParser.class.getName() + "\"}"));
        kinds.add(Parameters.parseString("{\"filetype\" : \"trecweb\", \"class\" :\"" + TrecTextParser.class.getName() + "\"}"));
        p.getMap("parser").put("externalParsers", kinds);

        BuildIndex bi = new BuildIndex();
        bi.run(p, System.err);

        Retrieval ret = RetrievalFactory.instance(index.getAbsolutePath(), Parameters.create());
        try {
            // JUnit convention: expected value first, actual value second.
            FieldStatistics cs = ret.getCollectionStatistics("#lengths:part=lengths()");
            assertEquals(622, cs.collectionLength); // trecweb with trectext will be empty
            assertEquals(41, cs.documentCount);
            assertEquals(22, cs.maxLength);
            assertEquals(20, cs.minLength);

            IndexPartStatistics is1 = ret.getIndexPartStatistics("postings");
            assertEquals(622, is1.collectionLength);

            IndexPartStatistics is2 = ret.getIndexPartStatistics("postings.krovetz");
            assertEquals(622, is2.collectionLength);

            // should have about the same vocabs
            assertEquals(is1.vocabCount, is2.vocabCount);
        } finally {
            // Release the index before its directory is deleted below.
            ret.close();
        }

    } finally {
        FSUtil.deleteDirectory(index);
        FSUtil.deleteDirectory(dataDir);
    }
}
 
开发者ID:teanalab,项目名称:demidovii,代码行数:49,代码来源:UniversalParserTest.java


注:本文中的org.lemurproject.galago.core.tools.apps.BuildIndex.run方法示例由纯净天空整理自Github/MSDocs等开源代码及文档管理平台,相关代码片段筛选自各路编程大神贡献的开源项目,源码版权归原作者所有,传播和使用请参考对应项目的License;未经允许,请勿转载。