source: gs3-extensions/fedora/fedoragsearch-files/index.properties.in@ 26391

Last change on this file since 26391 was 26391, checked in by ak19, 12 years ago
  1. Added index.properties.in template file in order to set the indexwritelocktimeout (which had been defaulting to 0 until then), which build.xml then uses to write out the index.properties file with the placeholder string replaced. 2. README updated, including with instructions on manually deleting pids from the fedora repository and gsearch index.
File size: 5.7 KB
Line 
1# $Id: index.properties $
2
3fgsindex.indexName = INDEXNAME
4
5fgsindex.operationsImpl = dk.defxws.fgslucene.OperationsImpl
6
7fgsindex.defaultUpdateIndexDocXslt = INDEXINGDOCXSLT
8fgsindex.defaultUpdateIndexResultXslt = updateIndexToResultPage
9fgsindex.defaultGfindObjectsResultXslt = gfindObjectsToResultPage
10fgsindex.defaultBrowseIndexResultXslt = browseIndexToResultPage
11fgsindex.defaultGetIndexInfoResultXslt = copyXml
12
13#fgsindex.indexDir = <...>
14fgsindex.indexDir = INDEXDIR
15
16fgsindex.analyzer = org.apache.lucene.analysis.standard.StandardAnalyzer
17fgsindex.fieldAnalyzers = dc.title::org.apache.lucene.analysis.standard.StandardAnalyzer dc.creator::org.apache.lucene.analysis.standard.StandardAnalyzer
18# used to index and query TOKENIZED index fields
19# for UN_TOKENIZED index fields see fgsindex.untokenizedFields further down
20
21#Stopwords file for the analyzer; comment out the line if no stopwords are used
22#fgsindex.stopwordsLocation = /stopwords.txt
23
24fgsindex.defaultQueryFields = dc.description dc.title
25
26# setting of org.apache.lucene.queryParser.QueryParser setAllowLeadingWildcard()
27# Set to true to allow leading wildcard characters, * or ?
28# Default: false.
29fgsindex.allowLeadingWildcard = false
30
31# setting of org.apache.lucene.queryParser.QueryParser setLowercaseExpandedTerms()
32# Whether terms of wildcard, prefix, fuzzy and range queries are to be automatically lower-cased or not.
33# Default: true.
34fgsindex.lowercaseExpandedTerms = true
35
36#sortFields may be given as parameter to gfindObjects, or as config default.
37###########
38
39# as parameter: ?operation=gfindObjects&sortFields=[sortFieldsValue]&...
40
41# as config default:
42
43#fgsindex.defaultSortFields = sortFieldsValue
44
45#examples:
46
47#fgsindex.defaultSortFields = PID,STRING,true
48
49#fgsindex.defaultSortFields = sf1,SCORE;sf2,cy-GB-var,true
50
51# sortFieldsValue ::= [sortField[';'sortField]*]
52# sortField ::= sortFieldName[','(sortType | locale | comparatorClass)[','reverse]]
53# sortFieldName ::= #the name of an index field, which is UN_TOKENIZED and contains a single term per document
54# sortType ::= 'BYTE' | 'DOC' | 'DOUBLE' | 'FLOAT' | 'INT' | 'LONG' | 'SCORE' | 'SHORT' | 'STRING' | 'STRING_VAL'
55# locale ::= language['-'country['-'variant]]
56# comparatorClass ::= package-path'.'className['('param['-'param]*')']
57# reverse ::= 'false' (default) | 'true' | 'reverse'
58
59# sortType 'AUTO' is removed in Lucene 3.x
60
61# The test class dk.defxws.fedoragsearch.test.ComparatorSourceTest has been removed in GSearch 2.3,
62# because the interface org.apache.lucene.search.SortComparatorSource is deprecated in Lucene 3.x
63
64# Briefly, one or more sortFields will determine the sequence of search results,
65# as defined either by sortType or by locale, and it may be in reverse.
66
67# If no sortFieldsValue is given, then this code from GSearch is run
68
69# TopDocs hits = searcher.search(query, numHits); // in dk.defxws.fgslucene.Statement.java
70
71# where the hits are returned in Lucene's default order (by descending relevance score).
72
73# If a sortFieldsValue is given, then this code is run
74
75# TopDocs hits = searcher.search(query, numHits, sort);
76
77# where sort is an instance of org.apache.lucene.search.Sort, see
78
79# http://lucene.apache.org/java/3_3_0/api/index.html
80
81# See org.apache.lucene.search.SortField for more about sortType, locale and reverse values.
82
83
84#fgsindex.untokenizedFields = list of index fields created as UN_TOKENIZED
85###########################
86# Effect: during search the KeywordAnalyzer is used for untokenized fields,
87# while the fgsindex.analyzer is used for other fields.
88# Only those untokenized fields that do not occur in every index document
89# need to be listed here.
90# example:
91
92#fgsindex.untokenizedFields = fgs.contentModel uf1 uf2
93fgsindex.untokenizedFields = PID
94
95
96# snippets
97##########
98#fgsindex.snippetBegin = <span class=\"highlight\">
99fgsindex.snippetBegin = <span class=\"highlight\">
100## this value is default if not specified
101#fgsindex.snippetEnd = </span>
102fgsindex.snippetEnd = </span>
103## this value is default if not specified
104
105
106# optimization see e.g. http://www.onjava.com/pub/a/onjava/2003/03/05/lucene.html
107##############
108# fgsindex.mergeFactor = 10
109fgsindex.mergeFactor = 100
110## 10 is default if not specified
111# fgsindex.maxBufferedDocs = 10
112fgsindex.maxBufferedDocs = 100
113## 10 is default if not specified
114# fgsindex.defaultWriteLockTimeout = 1000
115#fgsindex.defaultWriteLockTimeout = 0
116fgsindex.defaultWriteLockTimeout = @indexwritelocktimeout@
117## 0 is default if not specified
118# from http://lucene.apache.org/java/2_3_0/api/IndexWriter.html :
119## mergeFactor
120## determines how often segment indices are merged by addDocument().
121## With smaller values, less RAM is used while indexing, and searches on unoptimized indices are faster,
122## but indexing speed is slower. With larger values, more RAM is used during indexing,
123## and while searches on unoptimized indices are slower, indexing is faster.
124## Thus larger values (> 10) are best for batch index creation,
125## and smaller values (< 10) for indices that are interactively maintained.
126## maxBufferedDocs
127## determines the minimal number of documents required
128## before the buffered in-memory documents are merged and a new Segment is created.
129## Since Documents are merged in a RAMDirectory, a larger value gives faster indexing.
130## At the same time, mergeFactor limits the number of files open in a FSDirectory.
131## defaultWriteLockTimeout
132## sets the default maximum time to wait for a write lock (in milliseconds).
133
134# ...?operation=updateIndex&action=optimize
135## will perform IndexWriter.optimize()
136## which merges all segments together into a single segment, optimizing an index for search.
137
138# custom URIResolver
139####################
140#fgsindex.uriResolver = dk.defxws.fedoragsearch.server.URIResolverImpl
Note: See TracBrowser for help on using the repository browser.