| <?xml version="1.0" ?> |
| <!-- |
| Licensed to the Apache Software Foundation (ASF) under one or more |
| contributor license agreements. See the NOTICE file distributed with |
| this work for additional information regarding copyright ownership. |
| The ASF licenses this file to You under the Apache License, Version 2.0 |
| (the "License"); you may not use this file except in compliance with |
| the License. You may obtain a copy of the License at |
| |
| http://www.apache.org/licenses/LICENSE-2.0 |
| |
| Unless required by applicable law or agreed to in writing, software |
| distributed under the License is distributed on an "AS IS" BASIS, |
| WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| See the License for the specific language governing permissions and |
| limitations under the License. |
| --> |
| |
| <schema name="phrase-identification" version="1.6"> |
| <field name="id" type="string" indexed="true" stored="true" multiValued="false" required="true"/> |
| <field name="_version_" type="long" indexed="true" stored="true"/> |
| |
| <field name="title" type="text" indexed="true" stored="true" /> |
| <field name="body" type="text" indexed="true" stored="true" /> |
| |
| <field name="multigrams_title" type="multigrams_3_7" indexed="true" stored="false" /> |
| <field name="multigrams_body" type="multigrams_3_7" indexed="true" stored="false" /> |
| |
| <field name="multigrams_title_short" type="multigrams_3" indexed="true" stored="false" /> |
| <field name="multigrams_body_short" type="multigrams_3" indexed="true" stored="false" /> |
| |
| <field name="multigrams_title_stop" type="multigrams_3_7_stop" indexed="true" stored="false" /> |
| |
| <copyField source="title" dest="multigrams_title" /> |
| <copyField source="title" dest="multigrams_title_short" /> |
| <copyField source="title" dest="multigrams_title_stop" /> |
| |
| <copyField source="body" dest="multigrams_body_short" /> |
| <copyField source="body" dest="multigrams_body" /> |
| |
| <uniqueKey>id</uniqueKey> |
| |
| <fieldType name="text" class="solr.TextField"> |
| <analyzer> |
| <tokenizer class="solr.StandardTokenizerFactory"/> |
| <filter class="solr.LowerCaseFilterFactory"/> |
| <filter class="solr.StopFilterFactory"/> |
| </analyzer> |
| </fieldType> |
| |
| <fieldType name="multigrams_3_7" class="solr.TextField" positionIncrementGap="100"> |
| <analyzer type="index"> |
| <tokenizer class="solr.StandardTokenizerFactory"/> |
| <filter class="solr.ASCIIFoldingFilterFactory"/> |
| <filter class="solr.LowerCaseFilterFactory"/> |
| <filter class="solr.ShingleFilterFactory" minShingleSize="2" maxShingleSize="3" outputUnigrams="true"/> |
| </analyzer> |
| <analyzer type="query"> |
| <tokenizer class="solr.StandardTokenizerFactory"/> |
| <filter class="solr.ASCIIFoldingFilterFactory"/> |
| <filter class="solr.LowerCaseFilterFactory"/> |
| <filter class="solr.ShingleFilterFactory" minShingleSize="2" maxShingleSize="7" outputUnigramsIfNoShingles="true" outputUnigrams="true"/> |
| </analyzer> |
| </fieldType> |
| |
| <fieldType name="multigrams_3" class="solr.TextField" positionIncrementGap="100"> |
| <!-- only one analyzer --> |
| <analyzer> |
| <tokenizer class="solr.StandardTokenizerFactory"/> |
| <filter class="solr.ASCIIFoldingFilterFactory"/> |
| <filter class="solr.LowerCaseFilterFactory"/> |
| <filter class="solr.ShingleFilterFactory" minShingleSize="2" maxShingleSize="3" outputUnigrams="true"/> |
| </analyzer> |
| </fieldType> |
| |
| <fieldType name="multigrams_3_7_stop" class="solr.TextField" positionIncrementGap="100"> |
| <analyzer type="index"> |
| <tokenizer class="solr.StandardTokenizerFactory"/> |
| <filter class="solr.ASCIIFoldingFilterFactory"/> |
| <filter class="solr.LowerCaseFilterFactory"/> |
| <filter class="solr.StopFilterFactory"/> |
| <filter class="solr.ShingleFilterFactory" minShingleSize="2" maxShingleSize="3" outputUnigrams="true"/> |
| </analyzer> |
| <analyzer type="query"> |
| <tokenizer class="solr.StandardTokenizerFactory"/> |
| <filter class="solr.ASCIIFoldingFilterFactory"/> |
| <filter class="solr.LowerCaseFilterFactory"/> |
| <filter class="solr.StopFilterFactory"/> |
| <filter class="solr.ShingleFilterFactory" minShingleSize="2" maxShingleSize="7" outputUnigramsIfNoShingles="true" outputUnigrams="true"/> |
| </analyzer> |
| </fieldType> |
| |
| |
| <fieldType name="long" class="${solr.tests.LongFieldType}" docValues="${solr.tests.numeric.dv}" precisionStep="0" positionIncrementGap="0"/> |
| <fieldType name="string" class="solr.StrField" sortMissingLast="true"/> |
| |
| </schema> |