557472a6d6
The duplicated _version_ definition in the template prevented the proper query of Chinese indexed content from Solr. After the patch had been applied restart Solr and reindex Chinese content: sudo service jetty restart cd /srv/askbot-sites/slot0/config sudo python manage.py askbot_rebuild_index -l zh Change-Id: Iaeabc73febc64c45996425225d3ee38db7f36f72
176 lines
8.8 KiB
Plaintext
176 lines
8.8 KiB
Plaintext
<?xml version="1.0" ?>
|
|
<!--
|
|
Licensed to the Apache Software Foundation (ASF) under one or more
|
|
contributor license agreements. See the NOTICE file distributed with
|
|
this work for additional information regarding copyright ownership.
|
|
The ASF licenses this file to You under the Apache License, Version 2.0
|
|
(the "License"); you may not use this file except in compliance with
|
|
the License. You may obtain a copy of the License at
|
|
|
|
http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
Unless required by applicable law or agreed to in writing, software
|
|
distributed under the License is distributed on an "AS IS" BASIS,
|
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
See the License for the specific language governing permissions and
|
|
limitations under the License.
|
|
-->
|
|
|
|
<schema name="default" version="1.4">
|
|
<types>
|
|
<fieldtype name="string" class="solr.StrField" sortMissingLast="true" omitNorms="true"/>
|
|
<fieldType name="boolean" class="solr.BoolField" sortMissingLast="true" omitNorms="true"/>
|
|
<fieldtype name="binary" class="solr.BinaryField"/>
|
|
|
|
<!-- Numeric field types that manipulate the value into
|
|
a string value that isn't human-readable in its internal form,
|
|
but with a lexicographic ordering the same as the numeric ordering,
|
|
so that range queries work correctly. -->
|
|
<fieldType name="int" class="solr.TrieIntField" precisionStep="0" omitNorms="true" sortMissingLast="true" positionIncrementGap="0"/>
|
|
<fieldType name="float" class="solr.TrieFloatField" precisionStep="0" omitNorms="true" sortMissingLast="true" positionIncrementGap="0"/>
|
|
<fieldType name="long" class="solr.TrieLongField" precisionStep="0" omitNorms="true" sortMissingLast="true" positionIncrementGap="0"/>
|
|
<fieldType name="double" class="solr.TrieDoubleField" precisionStep="0" omitNorms="true" sortMissingLast="true" positionIncrementGap="0"/>
|
|
|
|
<fieldType name="tint" class="solr.TrieIntField" precisionStep="8" omitNorms="true" positionIncrementGap="0"/>
|
|
<fieldType name="tfloat" class="solr.TrieFloatField" precisionStep="8" omitNorms="true" positionIncrementGap="0"/>
|
|
<fieldType name="tlong" class="solr.TrieLongField" precisionStep="8" omitNorms="true" positionIncrementGap="0"/>
|
|
<fieldType name="tdouble" class="solr.TrieDoubleField" precisionStep="8" omitNorms="true" positionIncrementGap="0"/>
|
|
|
|
<fieldType name="date" class="solr.TrieDateField" omitNorms="true" precisionStep="0" positionIncrementGap="0"/>
|
|
<!-- A Trie based date field for faster date range queries and date faceting. -->
|
|
<fieldType name="tdate" class="solr.TrieDateField" omitNorms="true" precisionStep="6" positionIncrementGap="0"/>
|
|
|
|
<fieldType name="point" class="solr.PointType" dimension="2" subFieldSuffix="_d"/>
|
|
<fieldType name="location" class="solr.LatLonType" subFieldSuffix="_coordinate"/>
|
|
<fieldtype name="geohash" class="solr.GeoHashField"/>
|
|
|
|
<fieldType name="text_general" class="solr.TextField" positionIncrementGap="100">
|
|
<analyzer type="index">
|
|
|
|
<tokenizer class="solr.SmartChineseSentenceTokenizerFactory"/>
|
|
<filter class="solr.SmartChineseWordTokenFilterFactory"/>
|
|
<filter class="solr.LowerCaseFilterFactory"/>
|
|
<!-- <filter class="solr.PositionFilterFactory" /> -->
|
|
|
|
</analyzer>
|
|
<analyzer type="query">
|
|
|
|
<tokenizer class="solr.SmartChineseSentenceTokenizerFactory"/>
|
|
<filter class="solr.SmartChineseWordTokenFilterFactory"/>
|
|
<filter class="solr.LowerCaseFilterFactory"/>
|
|
<!-- <filter class="solr.PositionFilterFactory" /> -->
|
|
|
|
</analyzer>
|
|
</fieldType>
|
|
|
|
<fieldType name="text_en" class="solr.TextField" positionIncrementGap="100">
|
|
<analyzer type="index">
|
|
<tokenizer class="solr.StandardTokenizerFactory"/>
|
|
<filter class="solr.StopFilterFactory"
|
|
ignoreCase="true"
|
|
words="stopwords.txt"
|
|
enablePositionIncrements="true"
|
|
/>
|
|
<filter class="solr.LowerCaseFilterFactory"/>
|
|
<filter class="solr.EnglishPossessiveFilterFactory"/>
|
|
<filter class="solr.KeywordMarkerFilterFactory" protected="protwords.txt"/>
|
|
<!-- Optionally you may want to use this less aggressive stemmer instead of PorterStemFilterFactory:
|
|
<filter class="solr.EnglishMinimalStemFilterFactory"/>
|
|
-->
|
|
<filter class="solr.PorterStemFilterFactory"/>
|
|
</analyzer>
|
|
<analyzer type="query">
|
|
<tokenizer class="solr.StandardTokenizerFactory"/>
|
|
<filter class="solr.SynonymFilterFactory" synonyms="synonyms.txt" ignoreCase="true" expand="true"/>
|
|
<filter class="solr.StopFilterFactory"
|
|
ignoreCase="true"
|
|
words="stopwords.txt"
|
|
enablePositionIncrements="true"
|
|
/>
|
|
<filter class="solr.LowerCaseFilterFactory"/>
|
|
<filter class="solr.EnglishPossessiveFilterFactory"/>
|
|
<filter class="solr.KeywordMarkerFilterFactory" protected="protwords.txt"/>
|
|
<!-- Optionally you may want to use this less aggressive stemmer instead of PorterStemFilterFactory:
|
|
<filter class="solr.EnglishMinimalStemFilterFactory"/>
|
|
-->
|
|
<filter class="solr.PorterStemFilterFactory"/>
|
|
</analyzer>
|
|
</fieldType>
|
|
|
|
<fieldType name="text_ws" class="solr.TextField" positionIncrementGap="100">
|
|
<analyzer>
|
|
<tokenizer class="solr.WhitespaceTokenizerFactory"/>
|
|
</analyzer>
|
|
</fieldType>
|
|
|
|
<fieldType name="ngram" class="solr.TextField" >
|
|
<analyzer type="index">
|
|
<tokenizer class="solr.KeywordTokenizerFactory"/>
|
|
<filter class="solr.LowerCaseFilterFactory"/>
|
|
<filter class="solr.NGramFilterFactory" minGramSize="3" maxGramSize="15" />
|
|
</analyzer>
|
|
<analyzer type="query">
|
|
<tokenizer class="solr.KeywordTokenizerFactory"/>
|
|
<filter class="solr.LowerCaseFilterFactory"/>
|
|
</analyzer>
|
|
</fieldType>
|
|
|
|
<fieldType name="edge_ngram" class="solr.TextField" positionIncrementGap="1">
|
|
<analyzer type="index">
|
|
<tokenizer class="solr.WhitespaceTokenizerFactory" />
|
|
<filter class="solr.LowerCaseFilterFactory" />
|
|
<filter class="solr.WordDelimiterFilterFactory" generateWordParts="1" generateNumberParts="1" catenateWords="0" catenateNumbers="0" catenateAll="0" splitOnCaseChange="1"/>
|
|
<filter class="solr.EdgeNGramFilterFactory" minGramSize="2" maxGramSize="15" side="front" />
|
|
</analyzer>
|
|
<analyzer type="query">
|
|
<tokenizer class="solr.WhitespaceTokenizerFactory" />
|
|
<filter class="solr.LowerCaseFilterFactory" />
|
|
<filter class="solr.WordDelimiterFilterFactory" generateWordParts="1" generateNumberParts="1" catenateWords="0" catenateNumbers="0" catenateAll="0" splitOnCaseChange="1"/>
|
|
</analyzer>
|
|
</fieldType>
|
|
</types>
|
|
|
|
<fields>
|
|
<field name="_version_" type="long" indexed="true" stored="true"/>
|
|
<field name="_root_" type="string" indexed="true" stored="false"/>
|
|
|
|
<!-- general -->
|
|
<field name="id" type="string" indexed="true" stored="true" multiValued="false" required="true"/>
|
|
<field name="django_ct" type="string" indexed="true" stored="true" multiValued="false"/>
|
|
<field name="django_id" type="string" indexed="true" stored="true" multiValued="false"/>
|
|
|
|
<dynamicField name="*_i" type="int" indexed="true" stored="true"/>
|
|
<dynamicField name="*_s" type="string" indexed="true" stored="true"/>
|
|
<dynamicField name="*_l" type="long" indexed="true" stored="true"/>
|
|
<dynamicField name="*_t" type="text_en" indexed="true" stored="true"/>
|
|
<dynamicField name="*_b" type="boolean" indexed="true" stored="true"/>
|
|
<dynamicField name="*_f" type="float" indexed="true" stored="true"/>
|
|
<dynamicField name="*_d" type="double" indexed="true" stored="true"/>
|
|
<dynamicField name="*_dt" type="date" indexed="true" stored="true"/>
|
|
<dynamicField name="*_p" type="location" indexed="true" stored="true"/>
|
|
<dynamicField name="*_coordinate" type="tdouble" indexed="true" stored="false"/>
|
|
|
|
|
|
<field name="thread_id" type="long" indexed="true" stored="true" multiValued="false" />
|
|
|
|
<field name="author" type="text_en" indexed="true" stored="true" multiValued="false" />
|
|
|
|
<field name="text" type="text_en" indexed="true" stored="true" multiValued="false" />
|
|
|
|
<field name="post_text" type="text_en" indexed="true" stored="true" multiValued="false" />
|
|
|
|
<field name="tags" type="text_en" indexed="true" stored="true" multiValued="true" />
|
|
|
|
<field name="title" type="text_en" indexed="true" stored="true" multiValued="false" />
|
|
|
|
</fields>
|
|
|
|
<!-- field to use to determine and enforce document uniqueness. -->
|
|
<uniqueKey>id</uniqueKey>
|
|
|
|
<!-- field for the QueryParser to use when an explicit fieldname is absent -->
|
|
<defaultSearchField>text</defaultSearchField>
|
|
|
|
<!-- SolrQueryParser configuration: defaultOperator="AND|OR" -->
|
|
<solrQueryParser defaultOperator="AND"/>
|
|
</schema> |