<?xml version="1.0" encoding="UTF-8"?>
<!--
    The schema name property is constructed as follows:

    tx_solr  - The extension key
    x-y-z    - The extension version this schema is meant to work with
    YYYYMMDD - The date the schema file was last changed

    When changing the schema, the name property must be updated. There is a
    status report - tx_solr_report_SchemaStatus - that checks against this
    name property; that status check must be updated as well.
-->
<schema name="tx_solr-6-0-0--20161209" version="1.6">
<!--
    Attribute "name" is the name of this schema. Solr itself only displays it,
    but the status report mentioned in the file header checks against it, so
    it must follow the naming scheme described there.

    Attribute "version" is Solr's version number for the schema syntax and
    semantics. It should not normally be changed by applications.
    1.0: multiValued attribute did not exist, all fields are multiValued by nature
    1.1: multiValued attribute introduced, false by default
    1.2: omitTermFreqAndPositions attribute introduced, true by default except for text fields.
    1.3: removed optional field compress feature
    1.4: default auto-phrase (QueryParser feature) to off
    1.5: omitNorms defaults to true for primitive field types (int, float, boolean, string...)
    1.6: useDocValuesAsStored defaults to true.
-->

<uniqueKey>id</uniqueKey>

<!-- XInclude: field type definitions from ../general_schema_types.xml -->
<xi:include href="../general_schema_types.xml" xmlns:xi="http://www.w3.org/2001/XInclude"/>

<!-- XInclude: field definitions from ../general_schema_fields.xml -->
<xi:include href="../general_schema_fields.xml" xmlns:xi="http://www.w3.org/2001/XInclude"/>
35+
<!--
    A text field that uses WordDelimiterFilter to enable splitting and matching of
    words on case-change, alpha numeric boundaries, and non-alphanumeric chars,
    so that a query of "wifi" or "wi fi" could match a document containing "Wi-Fi".
    Synonyms and stopwords come from the managed resources named "arabic";
    Arabic normalization and stemming are enabled, with the terms listed in
    arabic/protwords.txt protected from stemming.
    Duplicate tokens at the same position (which may result from stemmed synonyms or
    WordDelim parts) are removed.
-->
<fieldType name="text" class="solr.TextField" positionIncrementGap="100">
    <!-- Index time: word and number parts are additionally catenated. -->
    <analyzer type="index">
        <tokenizer class="solr.WhitespaceTokenizerFactory"/>

        <filter class="solr.WordDelimiterFilterFactory"
                generateWordParts="1"
                generateNumberParts="1"
                catenateWords="1"
                catenateNumbers="1"
                catenateAll="0"
                splitOnCaseChange="1"
                preserveOriginal="1"
                protected="arabic/protwords.txt"
        />
        <filter class="solr.LowerCaseFilterFactory"/>

        <filter class="solr.ManagedSynonymFilterFactory" managed="arabic"/>
        <filter class="solr.ManagedStopFilterFactory" managed="arabic"/>

        <!-- Normalize first, then mark protected words, then stem. -->
        <filter class="solr.ArabicNormalizationFilterFactory"/>
        <filter class="solr.KeywordMarkerFilterFactory" protected="arabic/protwords.txt"/>
        <filter class="solr.ArabicStemFilterFactory"/>
        <filter class="solr.RemoveDuplicatesTokenFilterFactory"/>
    </analyzer>
    <!-- Query time: same chain, but without catenating word or number parts. -->
    <analyzer type="query">
        <tokenizer class="solr.WhitespaceTokenizerFactory"/>

        <filter class="solr.WordDelimiterFilterFactory"
                generateWordParts="1"
                generateNumberParts="1"
                catenateWords="0"
                catenateNumbers="0"
                catenateAll="0"
                splitOnCaseChange="1"
                preserveOriginal="1"
                protected="arabic/protwords.txt"
        />
        <filter class="solr.LowerCaseFilterFactory"/>

        <filter class="solr.ManagedSynonymFilterFactory" managed="arabic"/>
        <filter class="solr.ManagedStopFilterFactory" managed="arabic"/>

        <filter class="solr.ArabicNormalizationFilterFactory"/>
        <filter class="solr.KeywordMarkerFilterFactory" protected="arabic/protwords.txt"/>
        <filter class="solr.ArabicStemFilterFactory"/>
        <filter class="solr.RemoveDuplicatesTokenFilterFactory"/>
    </analyzer>
</fieldType>
91+
92+
<!--
    Less flexible matching, but fewer false matches. Probably not ideal for product names,
    but may be good for SKUs. Can insert dashes in the wrong place and still match.

    One analyzer is used for both indexing and querying. Word and number parts
    are not emitted on their own; only their catenations and the original
    token are kept.
-->
<fieldType name="textTight" class="solr.TextField" positionIncrementGap="100">
    <analyzer>
        <tokenizer class="solr.WhitespaceTokenizerFactory"/>

        <filter class="solr.WordDelimiterFilterFactory"
                generateWordParts="0"
                generateNumberParts="0"
                catenateWords="1"
                catenateNumbers="1"
                catenateAll="0"
                preserveOriginal="1"
                protected="arabic/protwords.txt"
        />
        <filter class="solr.LowerCaseFilterFactory"/>

        <filter class="solr.ManagedSynonymFilterFactory" managed="arabic"/>
        <filter class="solr.ManagedStopFilterFactory" managed="arabic"/>

        <!--
            Normalization must run before stemming so the stemmer sees
            normalized characters; this is the same order the "text" field
            type uses. Previously normalization ran after the stemmer.
            NOTE(review): this changes the tokens produced for textTight
            fields, so existing documents need reindexing and the schema name
            must be updated as the file header requires.
        -->
        <filter class="solr.ArabicNormalizationFilterFactory"/>
        <filter class="solr.KeywordMarkerFilterFactory" protected="arabic/protwords.txt"/>
        <filter class="solr.ArabicStemFilterFactory"/>
        <filter class="solr.RemoveDuplicatesTokenFilterFactory"/>
    </analyzer>
</fieldType>
119+
<!--
    Exact matching of words like textWhiteSpaceTokenized,
    but with the synonym and stop filters enabled (managed resources "arabic").
    No normalization or stemming is applied; tokens are only lowercased.
-->
<fieldType name="textExact" class="solr.TextField" positionIncrementGap="100">
    <analyzer>
        <tokenizer class="solr.WhitespaceTokenizerFactory"/>

        <filter class="solr.LowerCaseFilterFactory"/>
        <filter class="solr.ManagedSynonymFilterFactory" managed="arabic"/>
        <filter class="solr.ManagedStopFilterFactory" managed="arabic"/>
        <filter class="solr.RemoveDuplicatesTokenFilterFactory"/>
    </analyzer>
</fieldType>
133+
<!--
    Simple analysis for spell checking. Norms are omitted.
    The query analyzer additionally applies the managed synonyms;
    the index analyzer does not.
-->
<fieldType name="textSpell" class="solr.TextField" positionIncrementGap="100" omitNorms="true">
    <analyzer type="index">
        <tokenizer class="solr.StandardTokenizerFactory"/>

        <filter class="solr.LowerCaseFilterFactory"/>
        <filter class="solr.ManagedStopFilterFactory" managed="arabic"/>

        <filter class="solr.StandardFilterFactory"/>
        <filter class="solr.ArabicNormalizationFilterFactory"/>
        <filter class="solr.ArabicStemFilterFactory"/>
        <!-- Duplicate removal runs last, matching the query analyzer below. -->
        <filter class="solr.RemoveDuplicatesTokenFilterFactory"/>
    </analyzer>
    <analyzer type="query">
        <tokenizer class="solr.StandardTokenizerFactory"/>

        <filter class="solr.LowerCaseFilterFactory"/>

        <filter class="solr.ManagedSynonymFilterFactory" managed="arabic"/>
        <filter class="solr.ManagedStopFilterFactory" managed="arabic"/>

        <filter class="solr.StandardFilterFactory"/>
        <filter class="solr.ArabicNormalizationFilterFactory"/>
        <filter class="solr.ArabicStemFilterFactory"/>
        <filter class="solr.RemoveDuplicatesTokenFilterFactory"/>
    </analyzer>
</fieldType>
161+
</schema>