1 |
8497
|
leinfelder
|
<?xml version="1.0" encoding="UTF-8"?>
|
2 |
|
|
<!--
|
3 |
|
|
THE OFFICIAL DataONE Index Solr Schema definition file.
|
4 |
|
|
This schema is copied into the dataone-cn-index buildout for deployment on cn nodes.
|
5 |
|
|
|
6 |
|
|
The Solr schema file. This file should be named "schema.xml" and
|
7 |
|
|
should be in the conf directory under the solr home
|
8 |
|
|
(i.e. ./solr/conf/schema.xml by default)
|
9 |
|
|
or located where the classloader for the Solr webapp can find it.
|
10 |
|
|
|
11 |
|
|
For more information on how to customize this file, please see...
|
12 |
|
|
http://wiki.apache.org/solr/SchemaXml
|
13 |
|
|
-->
|
14 |
|
|
|
15 |
|
|
<schema name="dataone" version="1.1">
|
16 |
|
|
<types>
|
17 |
|
|
<!-- field type definitions. The "name" attribute is
|
18 |
|
|
just a label to be used by field definitions. The "class"
|
19 |
|
|
attribute and any other attributes determine the real
|
20 |
|
|
behavior of the fieldtype. -->
|
21 |
|
|
|
22 |
|
|
<!-- The StringField type is not analyzed, but indexed/stored verbatim -->
|
23 |
|
|
<fieldtype name="string" class="solr.StrField" sortMissingLast="true"/>
|
24 |
|
|
|
25 |
|
|
<!-- boolean type: "true" or "false" -->
|
26 |
|
|
<fieldtype name="boolean" class="solr.BoolField" sortMissingLast="true"/>
|
27 |
|
|
|
28 |
|
|
<!-- The optional sortMissingLast and sortMissingFirst attributes are
|
29 |
|
|
currently supported on types that are sorted internally as strings.
|
30 |
|
|
- If sortMissingLast="true" then a sort on this field will cause documents
|
31 |
|
|
without the field to come after documents with the field,
|
32 |
|
|
regardless of the requested sort order (asc or desc).
|
33 |
|
|
- If sortMissingFirst="true" then a sort on this field will cause documents
|
34 |
|
|
without the field to come before documents with the field,
|
35 |
|
|
regardless of the requested sort order.
|
36 |
|
|
- If sortMissingLast="false" and sortMissingFirst="false" (the default),
|
37 |
|
|
then default lucene sorting will be used which places docs without the field
|
38 |
|
|
first in an ascending sort and last in a descending sort.
|
39 |
|
|
-->
|
40 |
|
|
|
41 |
|
|
<!-- numeric field types that store and index the text
|
42 |
|
|
value verbatim (and hence don't support range queries since the
|
43 |
|
|
lexicographic ordering isn't equal to the numeric ordering) -->
|
44 |
|
|
<fieldtype name="integer" class="solr.IntField"/>
|
45 |
|
|
<fieldtype name="long" class="solr.LongField"/>
|
46 |
|
|
<fieldtype name="float" class="solr.FloatField"/>
|
47 |
|
|
<fieldtype name="double" class="solr.DoubleField"/>
|
48 |
|
|
|
49 |
|
|
<!-- Numeric field types that manipulate the value into
|
50 |
|
|
a string value that isn't human readable in its internal form,
|
51 |
|
|
but with a lexicographic ordering the same as the numeric ordering
|
52 |
|
|
so that range queries correctly work. -->
|
53 |
|
|
<fieldtype name="sint" class="solr.SortableIntField" sortMissingLast="true"/>
|
54 |
|
|
<fieldtype name="slong" class="solr.SortableLongField" sortMissingLast="true"/>
|
55 |
|
|
<fieldtype name="sfloat" class="solr.SortableFloatField" sortMissingLast="true"/>
|
56 |
|
|
<fieldtype name="sdouble" class="solr.SortableDoubleField" sortMissingLast="true"/>
|
57 |
|
|
|
58 |
|
|
<!-- The format for this date field is of the form 1995-12-31T23:59:59Z, and
|
59 |
|
|
is a more restricted form of the canonical representation of dateTime
|
60 |
|
|
http://www.w3.org/TR/xmlschema-2/#dateTime
|
61 |
|
|
The trailing "Z" designates UTC time and is mandatory.
|
62 |
|
|
Optional fractional seconds are allowed: 1995-12-31T23:59:59.999Z
|
63 |
|
|
All other components are mandatory. -->
|
64 |
|
|
<fieldtype name="date" class="solr.DateField" sortMissingLast="true"/>
|
65 |
|
|
|
66 |
|
|
<!-- solr.TextField allows the specification of custom text analyzers
|
67 |
|
|
specified as a tokenizer and a list of token filters. Different
|
68 |
|
|
analyzers may be specified for indexing and querying.
|
69 |
|
|
|
70 |
|
|
The optional positionIncrementGap puts space between multiple fields of
|
71 |
|
|
this type on the same document, with the purpose of preventing false phrase
|
72 |
|
|
matching across fields.
|
73 |
|
|
|
74 |
|
|
For more info on customizing your analyzer chain, please see...
|
75 |
|
|
http://wiki.apache.org/solr/AnalyzersTokenizersTokenFilters
|
76 |
|
|
|
77 |
|
|
-->
|
78 |
|
|
|
79 |
|
|
<!-- Standard analyzer commonly used by Lucene developers
|
80 |
|
|
-->
|
81 |
|
|
<!-- Standard analyzer commonly used by Lucene developers -->
|
82 |
|
|
<!--
|
83 |
|
|
<fieldtype name="text_lu" class="solr.TextField" positionIncrementGap="100">
|
84 |
|
|
<analyzer>
|
85 |
|
|
<tokenizer class="solr.StandardTokenizerFactory"/>
|
86 |
|
|
<filter class="solr.StandardFilterFactory"/>
|
87 |
|
|
<filter class="solr.LowerCaseFilterFactory"/>
|
88 |
|
|
<filter class="solr.StopFilterFactory"/>
|
89 |
|
|
<filter class="solr.EnglishPorterFilterFactory"/>
|
90 |
|
|
</analyzer>
|
91 |
|
|
</fieldtype>
|
92 |
|
|
-->
|
93 |
|
|
<!-- One could also specify an existing Analyzer implementation in Java
|
94 |
|
|
via the class attribute on the analyzer element:
|
95 |
|
|
<fieldtype name="text_lu" class="solr.TextField">
|
96 |
|
|
<analyzer class="org.apache.lucene.analysis.snowball.SnowballAnalyzer"/>
|
97 |
|
|
</fieldtype>
|
98 |
|
|
-->
|
99 |
9154
|
leinfelder
|
|
100 |
8497
|
leinfelder
|
<!-- A text field that only splits on whitespace for more exact matching -->
|
101 |
|
|
<fieldtype name="text_ws" class="solr.TextField" positionIncrementGap="100">
  <!-- One analyzer (no "type" attribute) made of the whitespace tokenizer alone; no token filters are applied. -->
  <analyzer>
    <tokenizer class="solr.WhitespaceTokenizerFactory"/>
  </analyzer>
</fieldtype>
|
106 |
|
|
|
107 |
|
|
<!-- General-purpose analyzed text type with separate index-time and query-time chains.
     The two chains differ in two places only: catenateWords is "1" when indexing and "0"
     when querying, and the reversed-wildcard filter is applied at index time only. -->
<fieldtype name="text" class="solr.TextField" positionIncrementGap="100">
  <analyzer type="index">
    <tokenizer class="solr.WhitespaceTokenizerFactory"/>
    <filter class="solr.WordDelimiterFilterFactory" generateWordParts="1" catenateWords="1" generateNumberParts="1" splitOnNumerics="0"/>
    <filter class="solr.LowerCaseFilterFactory"/>
    <filter class="solr.StopFilterFactory"/>
    <filter class="solr.PorterStemFilterFactory"/>
    <!-- withOriginal="true": the unreversed token is kept alongside the reversed one. -->
    <filter class="solr.ReversedWildcardFilterFactory" withOriginal="true"/>
  </analyzer>
  <analyzer type="query">
    <tokenizer class="solr.WhitespaceTokenizerFactory"/>
    <filter class="solr.WordDelimiterFilterFactory" generateWordParts="1" catenateWords="0" generateNumberParts="1" splitOnNumerics="0"/>
    <filter class="solr.LowerCaseFilterFactory"/>
    <filter class="solr.StopFilterFactory"/>
    <filter class="solr.PorterStemFilterFactory"/>
  </analyzer>
</fieldtype>
|
135 |
|
|
|
136 |
|
|
<!-- Lightly analyzed text: whitespace tokenizing, lower-casing and stop-word removal only.
     The index and query chains are identical; there is no word-delimiter splitting or stemming. -->
<fieldtype name="text_no_token" class="solr.TextField" positionIncrementGap="100">
  <analyzer type="index">
    <tokenizer class="solr.WhitespaceTokenizerFactory"/>
    <filter class="solr.LowerCaseFilterFactory"/>
    <filter class="solr.StopFilterFactory"/>
  </analyzer>
  <analyzer type="query">
    <tokenizer class="solr.WhitespaceTokenizerFactory"/>
    <filter class="solr.LowerCaseFilterFactory"/>
    <filter class="solr.StopFilterFactory"/>
  </analyzer>
</fieldtype>
|
148 |
|
|
|
149 |
|
|
<!--
|
150 |
|
|
<fieldtype name="text_all" class="solr.TextField" positionIncrementGap="100">
|
151 |
|
|
<analyzer type="index">
|
152 |
|
|
<tokenizer class="solr.WhitespaceTokenizerFactory"/>
|
153 |
|
|
in this example, we will only use synonyms at query time
|
154 |
|
|
<filter class="solr.SynonymFilterFactory" synonyms="index_synonyms.txt" ignoreCase="true" expand="false"/>
|
155 |
|
|
|
156 |
|
|
<filter class="solr.StopFilterFactory" ignoreCase="true"/>
|
157 |
|
|
<filter class="solr.WordDelimiterFilterFactory" generateWordParts="1" generateNumberParts="1"
|
158 |
|
|
catenateWords="1" catenateNumbers="1" catenateAll="0"/>
|
159 |
|
|
<filter class="solr.LowerCaseFilterFactory"/>
|
160 |
|
|
<filter class="solr.EnglishPorterFilterFactory" protected="protwords.txt"/>
|
161 |
|
|
</analyzer>
|
162 |
|
|
<analyzer type="query">
|
163 |
|
|
<tokenizer class="solr.WhitespaceTokenizerFactory"/>
|
164 |
|
|
<filter class="solr.SynonymFilterFactory" synonyms="synonyms.txt" ignoreCase="true" expand="true"/>
|
165 |
|
|
<filter class="solr.StopFilterFactory" ignoreCase="true"/>
|
166 |
|
|
<filter class="solr.WordDelimiterFilterFactory" generateWordParts="1" generateNumberParts="1"
|
167 |
|
|
catenateWords="0" catenateNumbers="0" catenateAll="0"/>
|
168 |
|
|
<filter class="solr.LowerCaseFilterFactory"/>
|
169 |
|
|
<filter class="solr.EnglishPorterFilterFactory" protected="protwords.txt"/>
|
170 |
|
|
</analyzer>
|
171 |
|
|
</fieldtype>
|
172 |
|
|
-->
|
173 |
|
|
|
174 |
|
|
<!-- Less flexible matching, but fewer false matches. Probably not ideal for product names
|
175 |
|
|
but may be good for SKUs. Can insert dashes in the wrong place and still match. -->
|
176 |
|
|
<fieldtype name="textTight" class="solr.TextField" positionIncrementGap="100">
  <!-- One chain shared by indexing and querying (the analyzer has no "type" attribute). -->
  <analyzer>
    <tokenizer class="solr.WhitespaceTokenizerFactory"/>
    <filter class="solr.SynonymFilterFactory" synonyms="synonyms.txt" ignoreCase="true" expand="false"/>
    <filter class="solr.StopFilterFactory" ignoreCase="true"/>
    <!-- Word and number parts are not emitted separately (generate*="0"); only the
         catenated forms are produced (catenateWords/catenateNumbers="1"). -->
    <filter class="solr.WordDelimiterFilterFactory"
            generateWordParts="0"
            generateNumberParts="0"
            catenateWords="1"
            catenateNumbers="1"
            catenateAll="0"/>
    <filter class="solr.LowerCaseFilterFactory"/>
    <!-- NOTE(review): the "text" type in this schema stems with PorterStemFilterFactory, while this
         type uses EnglishPorterFilterFactory; confirm the latter exists in the deployed Solr version. -->
    <filter class="solr.EnglishPorterFilterFactory" protected="protwords.txt"/>
  </analyzer>
</fieldtype>
|
187 |
|
|
|
188 |
|
|
<!-- Sort-key type: lower-cases and trims the value, then deletes every character
     that is not a lowercase a-z letter (pattern "([^a-z])" replaced by the empty string, all matches).
     Documents missing the field sort last (sortMissingLast="true"). -->
<fieldType name="alphaOnlySort" class="solr.TextField" sortMissingLast="true">
  <analyzer>
    <tokenizer class="solr.KeywordTokenizerFactory"/>
    <filter class="solr.LowerCaseFilterFactory"/>
    <filter class="solr.TrimFilterFactory"/>
    <filter class="solr.PatternReplaceFilterFactory"
            pattern="([^a-z])"
            replacement=""
            replace="all"/>
  </analyzer>
</fieldType>
|
196 |
|
|
|
197 |
|
|
</types>
|
198 |
|
|
|
199 |
|
|
|
200 |
|
|
<!-- ======================================================================= -->
|
201 |
|
|
<fields>
|
202 |
|
|
<!-- Valid attributes for fields:
|
203 |
|
|
name: mandatory - the name for the field
|
204 |
|
|
type: mandatory - the name of a previously defined type from the <types> section
|
205 |
|
|
indexed: true if this field should be indexed (searchable)
|
206 |
|
|
stored: true if this field should be retrievable
|
207 |
|
|
multiValued: true if this field may contain multiple values per document
|
208 |
|
|
omitNorms: (expert) set to true to omit the norms associated with this field
|
209 |
|
|
(this disables length normalization and index-time boosting for the field)
|
210 |
|
|
-->
|
211 |
|
|
|
212 |
|
|
<!-- Core object properties. Fields with indexed="false" are stored only: retrievable but not searchable. -->
<field name="id"                     type="string" indexed="true" stored="true" multiValued="false"/>
<field name="seriesId"               type="string" indexed="true" stored="true" multiValued="false"/>
<field name="fileName"               type="string" indexed="true" stored="true" multiValued="false"/>
<field name="mediaType"              type="string" indexed="true" stored="true" multiValued="false"/>
<field name="mediaTypeProperty"      type="string" indexed="true" stored="true" multiValued="true"/>
<field name="formatId"               type="string" indexed="true" stored="true" multiValued="false"/>
<field name="formatType"             type="string" indexed="true" stored="true" multiValued="false"/>
<field name="size"                   type="slong" indexed="true" stored="true" multiValued="false"/>
<field name="checksum"               type="string" indexed="false" stored="true" multiValued="false"/>
<field name="checksumAlgorithm"      type="string" indexed="false" stored="true"/>
<field name="dateUploaded"           type="date" indexed="true" stored="true" multiValued="false"/>
<field name="dateModified"           type="date" indexed="true" stored="true" multiValued="false"/>
<field name="submitter"              type="string" indexed="true" stored="true" multiValued="false"/>
<field name="rightsHolder"           type="string" indexed="true" stored="true" multiValued="false"/>
<field name="authoritativeMN"        type="string" indexed="false" stored="true" multiValued="false"/>
<field name="replicationAllowed"     type="boolean" indexed="false" stored="true" multiValued="false"/>
<field name="numberReplicas"         type="integer" indexed="false" stored="true" multiValued="false"/>
<field name="preferredReplicationMN" type="string" indexed="false" stored="true" multiValued="true"/>
<field name="blockedReplicationMN"   type="string" indexed="false" stored="true" multiValued="true"/>
<field name="replicaMN"              type="string" indexed="false" stored="true" multiValued="true"/>
<field name="replicaVerifiedDate"    type="date" indexed="false" stored="true" multiValued="true"/>
<field name="datasource"             type="string" indexed="true" stored="true" multiValued="false"/>
<field name="obsoletes"              type="string" indexed="true" stored="true" multiValued="false"/>
<field name="obsoletedBy"            type="string" indexed="true" stored="true" multiValued="false"/>
|
236 |
|
|
|
237 |
|
|
<!-- Object relationships -->
|
238 |
|
|
<!-- All three relationship fields are multi-valued, indexed and stored strings. -->
<field name="resourceMap"    type="string" indexed="true" stored="true" multiValued="true"/>
<field name="documents"      type="string" indexed="true" stored="true" multiValued="true"/>
<field name="isDocumentedBy" type="string" indexed="true" stored="true" multiValued="true"/>
|
241 |
|
|
|
242 |
|
|
<!--Permissions-->
|
243 |
|
|
<!-- The three *Permission fields are multi-valued strings; isPublic is a boolean with no multiValued attribute. -->
<field name="readPermission"   type="string" indexed="true" stored="true" multiValued="true"/>
<field name="writePermission"  type="string" indexed="true" stored="true" multiValued="true"/>
<field name="changePermission" type="string" indexed="true" stored="true" multiValued="true"/>
<field name="isPublic"         type="boolean" indexed="true" stored="true"/>
|
247 |
|
|
|
248 |
|
|
<!-- Science metadata properties -->
|
249 |
|
|
|
250 |
|
|
<!-- Author fields: the *Sort variants use the alphaOnlySort type, the others are plain strings. -->
<field name="author"               type="string" indexed="true" stored="true" multiValued="false"/>
<field name="authorSurName"        type="string" indexed="true" stored="true" multiValued="false"/>
<field name="authorGivenName"      type="string" indexed="true" stored="true" multiValued="false"/>
<field name="authorSurNameSort"    type="alphaOnlySort" indexed="true" stored="true" multiValued="false"/>
<field name="authorGivenNameSort"  type="alphaOnlySort" indexed="true" stored="true" multiValued="false"/>

<field name="authorLastName"       type="string" indexed="true" stored="true" multiValued="true"/>

<!-- Descriptive text, keywords, bounding coordinates and temporal coverage. -->
<field name="abstract"             type="text" indexed="true" stored="true" multiValued="false"/>
<field name="keywords"             type="string" indexed="true" stored="true" multiValued="true"/>
<field name="keyConcept"           type="string" indexed="true" stored="true" multiValued="true"/>
<field name="southBoundCoord"      type="sfloat" indexed="true" stored="true" multiValued="false"/>
<field name="northBoundCoord"      type="sfloat" indexed="true" stored="true" multiValued="false"/>
<field name="westBoundCoord"       type="sfloat" indexed="true" stored="true" multiValued="false"/>
<field name="eastBoundCoord"       type="sfloat" indexed="true" stored="true" multiValued="false"/>
<field name="namedLocation"        type="string" indexed="true" stored="true" multiValued="true"/>
<field name="beginDate"            type="date" indexed="true" stored="true" multiValued="false"/>
<field name="endDate"              type="date" indexed="true" stored="true" multiValued="false"/>

<field name="title"                type="text" indexed="true" stored="true" multiValued="false"/>
<field name="scientificName"       type="string" indexed="true" stored="true" multiValued="true"/>
<field name="relatedOrganizations" type="string" indexed="true" stored="true" multiValued="true"/>
<field name="datePublished"        type="date" indexed="true" stored="true" multiValued="false"/>
<field name="pubDate"              type="date" indexed="true" stored="true" multiValued="false"/>
|
274 |
8497
|
leinfelder
|
|
275 |
|
|
<!-- Fields named *Text are analyzed ("text") and not stored; they sit beside a stored string field of the base name. -->
<field name="investigator"     type="string" indexed="true" stored="true" multiValued="true"/>
<field name="investigatorText" type="text" indexed="true" stored="false" multiValued="true"/>
<field name="ogcUrl"           type="text" indexed="false" stored="true"/>
<field name="sku"              type="textTight" indexed="true" stored="true"/>
<field name="identifier"       type="textTight" indexed="true" stored="true"/>
<field name="LTERSite"         type="string" indexed="true" stored="true"/>
<field name="origin"           type="string" indexed="true" stored="true" multiValued="true"/>
<field name="originText"       type="text" indexed="true" stored="false" multiValued="true"/>
<field name="titlestr"         type="string" indexed="true" stored="false"/>
<field name="geoform"          type="string" indexed="true" stored="true"/>
<field name="presentationCat"  type="string" indexed="true" stored="true"/>
<field name="purpose"          type="text" indexed="true" stored="true"/>
<field name="updateDate"       type="date" indexed="true" stored="true"/>
<field name="edition"          type="text" indexed="true" stored="true"/>
<field name="dataUrl"          type="string" indexed="false" stored="true"/>
<field name="originator"       type="string" indexed="true" stored="true" multiValued="true"/>
<field name="originatorText"   type="text" indexed="true" stored="false" multiValued="true"/>
<!-- Taxonomic rank fields: all multi-valued, indexed and stored strings. -->
<field name="family"           type="string" indexed="true" stored="true" multiValued="true"/>
<field name="species"          type="string" indexed="true" stored="true" multiValued="true"/>
<field name="genus"            type="string" indexed="true" stored="true" multiValued="true"/>
<field name="kingdom"          type="string" indexed="true" stored="true" multiValued="true"/>
<field name="phylum"           type="string" indexed="true" stored="true" multiValued="true"/>
<field name="order"            type="string" indexed="true" stored="true" multiValued="true"/>
<field name="class"            type="string" indexed="true" stored="true" multiValued="true"/>
|
299 |
|
|
|
300 |
|
|
<!-- Attribute fields: all multi-valued, indexed and stored; attributeDescription and attribute are analyzed text, the rest are strings. -->
<field name="attributeName"        type="string" indexed="true" stored="true" multiValued="true"/>
<field name="attributeLabel"       type="string" indexed="true" stored="true" multiValued="true"/>
<field name="attributeDescription" type="text" indexed="true" stored="true" multiValued="true"/>
<field name="attributeUnit"        type="string" indexed="true" stored="true" multiValued="true"/>
<field name="attribute"            type="text" indexed="true" stored="true" multiValued="true"/>
|
305 |
|
|
|
306 |
|
|
<!-- webUrl is stored only (indexed="false"). -->
<field name="webUrl"                  type="string" indexed="false" stored="true" multiValued="true"/>

<field name="contactOrganization"     type="string" indexed="true" stored="true" multiValued="true"/>
<field name="contactOrganizationText" type="text" indexed="true" stored="false" multiValued="true"/>

<field name="keywordsText"            type="text" indexed="true" stored="false" multiValued="true"/>
<field name="placeKey"                type="text" indexed="true" stored="true" multiValued="true"/>

<!-- noBoundingBox and isSpatial are declared as strings, not booleans. -->
<field name="noBoundingBox"           type="string" indexed="true" stored="true"/>
<field name="isSpatial"               type="string" indexed="true" stored="true"/>

<field name="decade"                  type="string" indexed="true" stored="true"/>
<field name="gcmdKeyword"             type="text" indexed="true" stored="true" multiValued="true"/>
|
319 |
|
|
|
320 |
|
|
<!-- These are ORNL DAAC fields; they may not be populated for NBII, but are required to be here for indexing purposes. -->
|
321 |
|
|
<!-- Each stored string field below is paired with an analyzed, unstored *Text field. -->
<field name="project"       type="string" indexed="true" stored="true"/>
<field name="projectText"   type="text" indexed="true" stored="false"/>

<field name="site"          type="string" indexed="true" stored="true" multiValued="true"/>
<field name="siteText"      type="text" indexed="true" stored="false" multiValued="true"/>

<field name="parameter"     type="string" indexed="true" stored="true" multiValued="true"/>
<field name="parameterText" type="text" indexed="true" stored="false" multiValued="true"/>

<field name="sensor"        type="string" indexed="true" stored="true" multiValued="true"/>
<field name="sensorText"    type="text" indexed="true" stored="false" multiValued="true"/>

<field name="source"        type="string" indexed="true" stored="true" multiValued="true"/>
<field name="sourceText"    type="text" indexed="true" stored="false" multiValued="true"/>

<field name="term"          type="string" indexed="true" stored="true" multiValued="true"/>
<field name="termText"      type="text" indexed="true" stored="false" multiValued="true"/>

<field name="topic"         type="string" indexed="true" stored="true" multiValued="true"/>
<field name="topicText"     type="text" indexed="true" stored="false" multiValued="true"/>

<field name="fileID"        type="string" indexed="true" stored="true"/>
<!-- "text" is the field named by defaultSearchField in this schema. -->
<field name="text"          type="text" indexed="true" stored="true" multiValued="false"/>
|
344 |
8796
|
slaughter
|
<!-- Nine identically configured geohash fields (presumably one per geohash precision level; confirm with the indexer). -->
<field name="geohash_1" type="string" indexed="true" stored="true" multiValued="true"/>
<field name="geohash_2" type="string" indexed="true" stored="true" multiValued="true"/>
<field name="geohash_3" type="string" indexed="true" stored="true" multiValued="true"/>
<field name="geohash_4" type="string" indexed="true" stored="true" multiValued="true"/>
<field name="geohash_5" type="string" indexed="true" stored="true" multiValued="true"/>
<field name="geohash_6" type="string" indexed="true" stored="true" multiValued="true"/>
<field name="geohash_7" type="string" indexed="true" stored="true" multiValued="true"/>
<field name="geohash_8" type="string" indexed="true" stored="true" multiValued="true"/>
<field name="geohash_9" type="string" indexed="true" stored="true" multiValued="true"/>
|
353 |
8497
|
leinfelder
|
|
354 |
9154
|
leinfelder
|
<!-- Provenance-based fields -->
|
355 |
|
|
<!-- Every prov_* field is a multi-valued, indexed and stored string. -->
<field name="prov_wasDerivedFrom"         type="string" indexed="true" stored="true" multiValued="true"/>
<field name="prov_wasGeneratedBy"         type="string" indexed="true" stored="true" multiValued="true"/>
<field name="prov_wasInformedBy"          type="string" indexed="true" stored="true" multiValued="true"/>
<field name="prov_used"                   type="string" indexed="true" stored="true" multiValued="true"/>
<field name="prov_generated"              type="string" indexed="true" stored="true" multiValued="true"/>
<field name="prov_generatedByProgram"     type="string" indexed="true" stored="true" multiValued="true"/>
<field name="prov_generatedByExecution"   type="string" indexed="true" stored="true" multiValued="true"/>
<field name="prov_generatedByUser"        type="string" indexed="true" stored="true" multiValued="true"/>
<field name="prov_usedByProgram"          type="string" indexed="true" stored="true" multiValued="true"/>
<field name="prov_usedByExecution"        type="string" indexed="true" stored="true" multiValued="true"/>
<field name="prov_usedByUser"             type="string" indexed="true" stored="true" multiValued="true"/>
<field name="prov_wasExecutedByExecution" type="string" indexed="true" stored="true" multiValued="true"/>
<field name="prov_wasExecutedByUser"      type="string" indexed="true" stored="true" multiValued="true"/>
<field name="prov_hasSources"             type="string" indexed="true" stored="true" multiValued="true"/>
<field name="prov_hasDerivations"         type="string" indexed="true" stored="true" multiValued="true"/>
<field name="prov_instanceOfClass"        type="string" indexed="true" stored="true" multiValued="true"/>
|
371 |
|
|
|
372 |
10073
|
tao
|
|
373 |
9154
|
leinfelder
|
<!-- semantic fields -->
|
374 |
|
|
<!-- Every sem_* field is a multi-valued, indexed and stored string. -->
<field name="sem_annotation"   type="string" indexed="true" stored="true" multiValued="true"/>
<field name="sem_annotated_by" type="string" indexed="true" stored="true" multiValued="true"/>
<field name="sem_annotates"    type="string" indexed="true" stored="true" multiValued="true"/>
<field name="sem_comment"      type="string" indexed="true" stored="true" multiValued="true"/>
|
378 |
|
|
|
379 |
9524
|
tao
|
|
380 |
|
|
<!-- member node service fields -->
|
381 |
|
|
<!-- isService defaults to false when a document does not supply it. -->
<field name="isService"          type="boolean" indexed="true" stored="true" multiValued="false" default="false"/>
<!-- NOTE(review): serviceCoupling is a string field whose default is the literal string "false";
     confirm this is intended and not carried over from isService. -->
<field name="serviceCoupling"    type="string" indexed="true" stored="true" multiValued="false" default="false"/>
<field name="serviceTitle"       type="text" indexed="true" stored="true" multiValued="false"/>
<field name="serviceDescription" type="text" indexed="true" stored="true" multiValued="false"/>
<field name="serviceType"        type="string" indexed="true" stored="true" multiValued="true"/>
<field name="serviceEndpoint"    type="string" indexed="true" stored="true" multiValued="true"/>
<field name="serviceInput"       type="string" indexed="true" stored="true" multiValued="true"/>
<field name="serviceOutput"      type="string" indexed="true" stored="true" multiValued="true"/>
|
389 |
|
|
|
390 |
8497
|
leinfelder
|
<!-- ======================================================================= -->
|
391 |
|
|
<!-- Dynamic field definitions. If a field name is not found, dynamicFields
|
392 |
|
|
will be used if the name matches any of the patterns.
|
393 |
|
|
RESTRICTION: the glob-like pattern in the name attribute must have
|
394 |
|
|
a "*" only at the start or the end.
|
395 |
|
|
EXAMPLE: name="*_i" will match any field ending in _i (like myid_i, z_i)
|
396 |
|
|
Longer patterns will be matched first. If equal-size patterns
|
397 |
|
|
both match, the first appearing in the schema will be used. -->
|
398 |
|
|
<!-- Single-valued dynamic fields: the name suffix selects the type (all indexed and stored). -->
<dynamicField name="*_i"  type="sint" indexed="true" stored="true"/>
<dynamicField name="*_s"  type="string" indexed="true" stored="true"/>
<dynamicField name="*_l"  type="slong" indexed="true" stored="true"/>
<dynamicField name="*_t"  type="text" indexed="true" stored="true"/>
<dynamicField name="*_b"  type="boolean" indexed="true" stored="true"/>
<dynamicField name="*_f"  type="sfloat" indexed="true" stored="true"/>
<dynamicField name="*_d"  type="sdouble" indexed="true" stored="true"/>
<dynamicField name="*_dt" type="date" indexed="true" stored="true"/>
|
406 |
|
|
|
407 |
|
|
<!-- allow multivalued dynamic fields as well -->
|
408 |
|
|
<!-- Multi-valued counterparts: same suffix-to-type mapping with a trailing "m" on the suffix. -->
<dynamicField name="*_im"  type="sint" indexed="true" stored="true" multiValued="true"/>
<dynamicField name="*_sm"  type="string" indexed="true" stored="true" multiValued="true"/>
<dynamicField name="*_lm"  type="slong" indexed="true" stored="true" multiValued="true"/>
<dynamicField name="*_tm"  type="text" indexed="true" stored="true" multiValued="true"/>
<dynamicField name="*_bm"  type="boolean" indexed="true" stored="true" multiValued="true"/>
<dynamicField name="*_fm"  type="sfloat" indexed="true" stored="true" multiValued="true"/>
<dynamicField name="*_dm"  type="sdouble" indexed="true" stored="true" multiValued="true"/>
<dynamicField name="*_dtm" type="date" indexed="true" stored="true" multiValued="true"/>
|
416 |
9154
|
leinfelder
|
|
417 |
8497
|
leinfelder
|
</fields>
|
418 |
|
|
|
419 |
|
|
<!-- ======================================================================= -->
|
420 |
|
|
<!-- field to use to determine and enforce document uniqueness. -->
|
421 |
|
|
<uniqueKey>id</uniqueKey>
|
422 |
|
|
|
423 |
|
|
<!-- field for the QueryParser to use when an explicit fieldname is absent -->
|
424 |
|
|
<defaultSearchField>text</defaultSearchField>
|
425 |
|
|
|
426 |
|
|
<!-- SolrQueryParser configuration: defaultOperator="AND|OR" -->
|
427 |
|
|
<solrQueryParser defaultOperator="AND"/>
|
428 |
|
|
|
429 |
|
|
<!-- ======================================================================= -->
|
430 |
|
|
<!-- copyField commands copy one field to another at the time a document
|
431 |
|
|
is added to the index. It's used either to index the same field in different
|
432 |
|
|
ways, or to add multiple fields to the same field for easier/faster searching. -->
|
433 |
|
|
|
434 |
|
|
<!-- The unique key "id" is also indexed through the two textTight fields "sku" and "identifier". -->
<copyField source="id"    dest="sku"/>
<copyField source="id"    dest="identifier"/>

<!-- "titlestr" is the unanalyzed string copy of the analyzed "title" field. -->
<copyField source="title" dest="titlestr"/>
|
438 |
|
|
|
439 |
|
|
<!-- Feed the analyzed, unstored *Text companions of the "origin" and "originator" string fields.
     The existing copy from "origin" into "originatorText" is kept unchanged so current queries
     behave as before. "originator" is now copied into "originatorText" as well: it was the only
     base/*Text pair in this schema with no copyField from the base field. Both the sources and
     the destination are multiValued, so the extra copy cannot overflow the destination. -->
<copyField source="origin" dest="originText"/>
<copyField source="origin" dest="originatorText"/>
<copyField source="originator" dest="originatorText"/>
|
441 |
|
|
|
442 |
|
|
<!-- String field to analyzed *Text companion copies. -->
<copyField source="project"             dest="projectText"/>

<copyField source="site"                dest="siteText"/>
<copyField source="parameter"           dest="parameterText"/>
<copyField source="sensor"              dest="sensorText"/>
<copyField source="source"              dest="sourceText"/>
<copyField source="term"                dest="termText"/>
<copyField source="topic"               dest="topicText"/>
<copyField source="investigator"        dest="investigatorText"/>
<copyField source="keywords"            dest="keywordsText"/>
<!-- Date aliases. NOTE(review): both destinations are single-valued; presumably documents never
     supply datePublished or updateDate directly alongside the source field. Verify against the indexer. -->
<copyField source="pubDate"             dest="datePublished"/>
<copyField source="dateUploaded"        dest="updateDate"/>
<copyField source="contactOrganization" dest="contactOrganizationText"/>
|
455 |
9154
|
leinfelder
|
|
456 |
8497
|
leinfelder
|
|
457 |
|
|
<!-- Similarity is the scoring routine for each document vs a query.
|
458 |
|
|
A custom similarity may be specified here, but the default is fine
|
459 |
|
|
for most applications. -->
|
460 |
|
|
<!-- <similarity class="org.apache.lucene.search.DefaultSimilarity"/> -->
|
461 |
|
|
|
462 |
|
|
</schema>
|