xref: /Lucene/lucene/benchmark/conf/indexLineFile.alg (revision b3906e96eaeaeea537b810fd6062bc53708950e8)
1#/**
2# * Licensed to the Apache Software Foundation (ASF) under one or more
3# * contributor license agreements.  See the NOTICE file distributed with
4# * this work for additional information regarding copyright ownership.
5# * The ASF licenses this file to You under the Apache License, Version 2.0
6# * (the "License"); you may not use this file except in compliance with
7# * the License.  You may obtain a copy of the License at
8# *
9# *     http://www.apache.org/licenses/LICENSE-2.0
10# *
11# * Unless required by applicable law or agreed to in writing, software
12# * distributed under the License is distributed on an "AS IS" BASIS,
13# * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14# * See the License for the specific language governing permissions and
15# * limitations under the License.
16# */
17# -------------------------------------------------------------------------------------
18
19#
20# This file indexes documents contained in a single text file, one per
21# line.  See createLineFile.alg for how to create this file.  The
22# benefit is that this removes the I/O cost of opening one file per
23# document, so you can more accurately measure the time spent analyzing
24# and indexing your documents vs. the time spent creating the documents.
25#
26# To use this, you must first run createLineFile.alg, then run:
27#
28#   gradlew :lucene:benchmark:run -Ptask.alg=conf/indexLineFile.alg
29#
30
31analyzer=org.apache.lucene.analysis.core.SimpleAnalyzer
32
33# Content source (feed) that knows how to read the one-document-per-line file format:
34content.source=org.apache.lucene.benchmark.byTask.feeds.LineDocSource
35
36# Line file to index, one document per line (see createLineFile.alg for how to create it):
37docs.file=work/reuters.lines.txt
38
39# Process the documents only once, i.e. do not keep cycling through the source forever:
40content.source.forever=false
41
42# -------------------------------------------------------------------------------------
43
44# Algorithm: reset the system, create a new index, add every doc from the line file
45# (AddDoc is repeated via "*"; presumably until the source is exhausted -- confirm), close the index, then report on the AddDoc tasks.
46
47ResetSystemErase
48CreateIndex
49{AddDoc}: *
50CloseIndex
51
52RepSumByPref AddDoc
53