Examples with CreateIndexTask - org.apache.lucene.benchmark.byTask.tasks.CreateIndexTask

Example 1 with CreateIndexTask

use of org.apache.lucene.benchmark.byTask.tasks.CreateIndexTask in project lucene-solr by apache.

the class LineDocSourceTest method doIndexAndSearchTestWithRepeats.

private void doIndexAndSearchTestWithRepeats(Path file, Class<? extends LineParser> lineParserClass, int numAdds, String storedField) throws Exception {
    IndexReader reader = null;
    IndexSearcher searcher = null;
    PerfRunData runData = null;
    try {
        Properties props = new Properties();
        // LineDocSource specific settings.
        props.setProperty("docs.file", file.toAbsolutePath().toString());
        if (lineParserClass != null) {
            props.setProperty("line.parser", lineParserClass.getName());
        }
        // Indexing configuration.
        props.setProperty("analyzer", WhitespaceAnalyzer.class.getName());
        props.setProperty("content.source", LineDocSource.class.getName());
        props.setProperty("directory", "RAMDirectory");
        props.setProperty("doc.stored", "true");
        props.setProperty("doc.index.props", "true");
        // Create PerfRunData
        Config config = new Config(props);
        runData = new PerfRunData(config);
        TaskSequence tasks = new TaskSequence(runData, "testBzip2", null, false);
        tasks.addTask(new CreateIndexTask(runData));
        for (int i = 0; i < numAdds; i++) {
            tasks.addTask(new AddDocTask(runData));
        }
        tasks.addTask(new CloseIndexTask(runData));
        try {
            tasks.doLogic();
        } finally {
            tasks.close();
        }
        reader = DirectoryReader.open(runData.getDirectory());
        searcher = newSearcher(reader);
        TopDocs td = searcher.search(new TermQuery(new Term("body", "body")), 10);
        assertEquals(numAdds, td.totalHits);
        assertNotNull(td.scoreDocs[0]);
        if (storedField == null) {
            // added to all docs and satisfies field-name == value
            storedField = DocMaker.BODY_FIELD;
        }
        assertEquals("Wrong field value", storedField, searcher.doc(0).get(storedField));
    } finally {
        IOUtils.close(reader, runData);
    }
}

Also used : IndexSearcher(org.apache.lucene.search.IndexSearcher) WhitespaceAnalyzer(org.apache.lucene.analysis.core.WhitespaceAnalyzer) CloseIndexTask(org.apache.lucene.benchmark.byTask.tasks.CloseIndexTask) TermQuery(org.apache.lucene.search.TermQuery) Config(org.apache.lucene.benchmark.byTask.utils.Config) CreateIndexTask(org.apache.lucene.benchmark.byTask.tasks.CreateIndexTask) Term(org.apache.lucene.index.Term) Properties(java.util.Properties) TopDocs(org.apache.lucene.search.TopDocs) TaskSequence(org.apache.lucene.benchmark.byTask.tasks.TaskSequence) IndexReader(org.apache.lucene.index.IndexReader) PerfRunData(org.apache.lucene.benchmark.byTask.PerfRunData) AddDocTask(org.apache.lucene.benchmark.byTask.tasks.AddDocTask)

Example 2 with CreateIndexTask

use of org.apache.lucene.benchmark.byTask.tasks.CreateIndexTask in project lucene-solr by apache.

the class DocMakerTest method doTestIndexProperties.

private void doTestIndexProperties(boolean setIndexProps, boolean indexPropsVal, int numExpectedResults) throws Exception {
    Properties props = new Properties();
    // Indexing configuration.
    props.setProperty("analyzer", WhitespaceAnalyzer.class.getName());
    props.setProperty("content.source", OneDocSource.class.getName());
    props.setProperty("directory", "RAMDirectory");
    if (setIndexProps) {
        props.setProperty("doc.index.props", Boolean.toString(indexPropsVal));
    }
    // Create PerfRunData
    Config config = new Config(props);
    PerfRunData runData = new PerfRunData(config);
    TaskSequence tasks = new TaskSequence(runData, getTestName(), null, false);
    tasks.addTask(new CreateIndexTask(runData));
    tasks.addTask(new AddDocTask(runData));
    tasks.addTask(new CloseIndexTask(runData));
    tasks.doLogic();
    IndexReader reader = DirectoryReader.open(runData.getDirectory());
    IndexSearcher searcher = newSearcher(reader);
    TopDocs td = searcher.search(new TermQuery(new Term("key", "value")), 10);
    assertEquals(numExpectedResults, td.totalHits);
    reader.close();
}

Also used : WhitespaceAnalyzer(org.apache.lucene.analysis.core.WhitespaceAnalyzer) CloseIndexTask(org.apache.lucene.benchmark.byTask.tasks.CloseIndexTask) IndexSearcher(org.apache.lucene.search.IndexSearcher) TermQuery(org.apache.lucene.search.TermQuery) Config(org.apache.lucene.benchmark.byTask.utils.Config) CreateIndexTask(org.apache.lucene.benchmark.byTask.tasks.CreateIndexTask) Term(org.apache.lucene.index.Term) Properties(java.util.Properties) TopDocs(org.apache.lucene.search.TopDocs) TaskSequence(org.apache.lucene.benchmark.byTask.tasks.TaskSequence) IndexReader(org.apache.lucene.index.IndexReader) PerfRunData(org.apache.lucene.benchmark.byTask.PerfRunData) AddDocTask(org.apache.lucene.benchmark.byTask.tasks.AddDocTask)

Example 3 with CreateIndexTask

use of org.apache.lucene.benchmark.byTask.tasks.CreateIndexTask in project lucene-solr by apache.

the class Sample method main.

public static void main(String[] args) throws Exception {
    Properties p = initProps();
    Config conf = new Config(p);
    PerfRunData runData = new PerfRunData(conf);
    // 1. top sequence
    // top level, not parallel
    TaskSequence top = new TaskSequence(runData, null, null, false);
    // 2. task to create the index
    CreateIndexTask create = new CreateIndexTask(runData);
    top.addTask(create);
    // 3. task seq to add 500 docs (order matters - top to bottom - add seq to top, only then add to seq)
    TaskSequence seq1 = new TaskSequence(runData, "AddDocs", top, false);
    seq1.setRepetitions(500);
    seq1.setNoChildReport();
    top.addTask(seq1);
    // 4. task to add the doc
    AddDocTask addDoc = new AddDocTask(runData);
    //addDoc.setParams("1200"); // doc size limit if supported
    // order matters 9see comment above)
    seq1.addTask(addDoc);
    // 5. task to close the index
    CloseIndexTask close = new CloseIndexTask(runData);
    top.addTask(close);
    // task to report
    RepSumByNameTask rep = new RepSumByNameTask(runData);
    top.addTask(rep);
    // print algorithm
    System.out.println(top.toString());
    // execute
    top.doLogic();
}

Also used : CloseIndexTask(org.apache.lucene.benchmark.byTask.tasks.CloseIndexTask) RepSumByNameTask(org.apache.lucene.benchmark.byTask.tasks.RepSumByNameTask) TaskSequence(org.apache.lucene.benchmark.byTask.tasks.TaskSequence) Config(org.apache.lucene.benchmark.byTask.utils.Config) CreateIndexTask(org.apache.lucene.benchmark.byTask.tasks.CreateIndexTask) PerfRunData(org.apache.lucene.benchmark.byTask.PerfRunData) Properties(java.util.Properties) AddDocTask(org.apache.lucene.benchmark.byTask.tasks.AddDocTask)

Aggregations

Properties (java.util.Properties)3 PerfRunData (org.apache.lucene.benchmark.byTask.PerfRunData)3 AddDocTask (org.apache.lucene.benchmark.byTask.tasks.AddDocTask)3 CloseIndexTask (org.apache.lucene.benchmark.byTask.tasks.CloseIndexTask)3 CreateIndexTask (org.apache.lucene.benchmark.byTask.tasks.CreateIndexTask)3 TaskSequence (org.apache.lucene.benchmark.byTask.tasks.TaskSequence)3 Config (org.apache.lucene.benchmark.byTask.utils.Config)3 WhitespaceAnalyzer (org.apache.lucene.analysis.core.WhitespaceAnalyzer)2 IndexReader (org.apache.lucene.index.IndexReader)2 Term (org.apache.lucene.index.Term)2 IndexSearcher (org.apache.lucene.search.IndexSearcher)2 TermQuery (org.apache.lucene.search.TermQuery)2 TopDocs (org.apache.lucene.search.TopDocs)2 RepSumByNameTask (org.apache.lucene.benchmark.byTask.tasks.RepSumByNameTask)1