Skip to content

Instantly share code, notes, and snippets.

@izacus
Created September 6, 2013 17:01
Show Gist options
  • Save izacus/6466630 to your computer and use it in GitHub Desktop.
Save izacus/6466630 to your computer and use it in GitHub Desktop.
<schema name="default" version="1.1">
<types>
  <!-- Primitive, non-analyzed types. -->
  <fieldType name="string" class="solr.StrField" sortMissingLast="true" omitNorms="true"/>
  <fieldType name="date" class="solr.TrieDateField" sortMissingLast="true" omitNorms="true"/>
  <fieldType name="int" class="solr.TrieIntField" precisionStep="0" omitNorms="true" positionIncrementGap="0"/>
  <!-- NOTE(review): solr.LongField looks like the legacy (non-Trie) long type; stock
       Solr 4 schemas use solr.TrieLongField. Switching would need a full reindex, so
       it is left unchanged here. Confirm before touching. -->
  <fieldType name="long" class="solr.LongField"/>

  <!-- Full-text type used by title, author, content and all_text. -->
  <fieldType name="text" class="solr.TextField" positionIncrementGap="100">
    <!-- Indexing and querying run the exact same chain, so one analyzer without a
         type attribute serves both instead of two duplicated definitions. -->
    <analyzer>
      <!-- Strip HTML markup before tokenizing. -->
      <charFilter class="solr.HTMLStripCharFilterFactory"/>
      <tokenizer class="solr.StandardTokenizerFactory"/>
      <!-- NOTE(review): ClassicFilter is normally paired with ClassicTokenizer; verify it
           has any effect on StandardTokenizer output. -->
      <filter class="solr.ClassicFilterFactory"/>
      <!-- Stop words are matched case-insensitively, before lowercasing and folding. -->
      <filter class="solr.StopFilterFactory" words="stopwords.txt" ignoreCase="true"/>
      <filter class="solr.LowerCaseFilterFactory"/>
      <filter class="solr.ASCIIFoldingFilterFactory"/>
      <!-- Third-party lemmatizer (not shipped with Solr). The dictionary is read from an
           absolute path, so the file must exist at that location on every host. -->
      <filter class="si.virag.solr.RdrLemmatizerFactory" dictionary="/var/solr/lem-me-sl.bin"/>
      <!-- Emit word 2- and 3-grams in addition to the single tokens. -->
      <filter class="solr.ShingleFilterFactory" maxShingleSize="3" outputUnigrams="true"/>
    </analyzer>
  </fieldType>
</types>
<fields>
  <!-- Document version field; the update log enabled in solrconfig relies on it. -->
  <field name="_version_" type="long" indexed="true" stored="true" multiValued="false"/>
  <!-- Unique document key (see uniqueKey). -->
  <field name="id" type="string" indexed="true" stored="true" multiValued="false" required="true"/>

  <!-- Name, caption or title. Term vectors with positions and offsets are kept on the
       analyzed fields below. -->
  <field name="title" type="text" indexed="true" stored="true" multiValued="false" required="true"
         termVectors="true" termPositions="true" termOffsets="true"/>

  <field name="source" type="string" indexed="true" stored="true" multiValued="false" required="true"/>
  <!-- Returned with results only; not searchable. -->
  <field name="source_url" type="string" indexed="false" stored="true" multiValued="false" required="true"/>

  <!-- Analyzed author name, search only (not stored). -->
  <field name="author" type="text" indexed="true" stored="false" multiValued="false" required="false"
         termVectors="true" termPositions="true" termOffsets="true"/>
  <!-- Untokenized copy of author (filled by copyField). Indexed so the whole name can be
       used for exact-match filters and facets; the analyzed author field only contains
       lemmatized tokens and shingles. Existing documents need a reindex to pick this up. -->
  <field name="author_exact" type="string" indexed="true" stored="true" multiValued="false" required="false"/>

  <field name="language" type="string" indexed="true" stored="true" multiValued="false" required="false"/>
  <field name="content" type="text" indexed="true" stored="true" multiValued="false" required="false"
         termVectors="true" termPositions="true" termOffsets="true"/>
  <field name="published" type="date" indexed="true" stored="true" multiValued="false" required="true"/>

  <!-- Catch-all field populated by the copyField rules; multi-valued because several
       source fields are copied into it. -->
  <field name="all_text" type="text" indexed="true" stored="true" multiValued="true" required="true"/>
</fields>
<!-- Documents are identified, and de-duplicated, by this field. -->
<uniqueKey>id</uniqueKey>

<!-- Queries that do not name a field are run against the catch-all field. -->
<defaultSearchField>all_text</defaultSearchField>

<!-- Build the catch-all field from title, content and source. -->
<copyField source="title" dest="all_text"/>
<copyField source="content" dest="all_text"/>
<copyField source="source" dest="all_text"/>

<!-- Keep an untokenized copy of the author name. -->
<copyField source="author" dest="author_exact"/>

<!-- Query parser default operator (AND or OR): all terms are required. -->
<solrQueryParser defaultOperator="AND"/>
</schema>
<config>
<!-- Lucene compatibility level for analysis and index behaviour. -->
<luceneMatchVersion>LUCENE_40</luceneMatchVersion>

<!-- Index storage backend, overridable through the solr.directoryFactory property.
       solr.StandardDirectoryFactory (the default) keeps the index on the filesystem.
       solr.RAMDirectoryFactory keeps it in memory: nothing is persisted and it does
       not work with replication. -->
<directoryFactory name="DirectoryFactory"
                  class="${solr.directoryFactory:solr.StandardDirectoryFactory}"/>

<!-- Index data location, read from the solr.en.data.dir property (empty when unset). -->
<dataDir>${solr.en.data.dir:}</dataDir>
<!-- Highlighting component with a locale-aware boundary scanner for the
     FastVectorHighlighter. -->
<searchComponent name="highlight" class="solr.HighlightComponent">
  <!-- default="true" makes this the scanner used when a request does not pick one with
       hl.boundaryScanner. Without it the scanner is only a named option, and since no
       request default selects "breakIterator", the locale settings below would never
       take effect. -->
  <boundaryScanner name="breakIterator" default="true"
                   class="solr.highlight.BreakIteratorBoundaryScanner">
    <lst name="defaults">
      <!-- Snap fragment edges to word boundaries using the sl_SI locale rules. -->
      <str name="hl.bs.type">WORD</str>
      <str name="hl.bs.language">sl</str>
      <str name="hl.bs.country">SI</str>
    </lst>
  </boundaryScanner>
</searchComponent>
<!-- Update handling with a transaction log. The log directory is read from the same
     solr.en.data.dir property as the index data directory. -->
<updateHandler class="solr.DirectUpdateHandler2">
  <updateLog>
    <str name="dir">${solr.en.data.dir:}</str>
  </updateLog>
</updateHandler>
<!-- HTTP request parsing: remote streaming is disabled and multipart uploads are
     capped at 2048 KB. -->
<requestDispatcher handleSelect="true">
  <requestParsers multipartUploadLimitInKB="2048"
                  enableRemoteStreaming="false"/>
</requestDispatcher>
<!-- Default search endpoint: edismax search with highlighting and facets, JSON output. -->
<requestHandler name="/select" class="solr.SearchHandler" default="true">
  <lst name="defaults">
    <!-- Query parsing. The per-field boosts belong in qf (edismax "query fields").
         qt only selects a request handler and is not read by the query parser, so
         boosts registered under qt are silently ignored. -->
    <str name="defType">edismax</str>
    <str name="qf">title^4.0 content all_text^0.4</str>

    <!-- Response format and returned fields. -->
    <str name="wt">json</str>
    <str name="json.nl">map</str>
    <str name="fl">id,title,published,source,source_url,content</str>

    <!-- Highlighting on title and content with the FastVectorHighlighter; both fields
         are declared with term vectors, positions and offsets in the schema. Each hit
         is wrapped in em + strong markup. -->
    <str name="hl">true</str>
    <str name="hl.fl">title,content</str>
    <str name="hl.snippets">5</str>
    <str name="hl.useFastVectorHighlighter">true</str>
    <str name="hl.tag.pre"><![CDATA[<em><strong>]]></str>
    <str name="hl.tag.post"><![CDATA[</strong></em>]]></str>
    <str name="hl.fragsize">200</str>
    <!-- Larger fragment size for title than the 200 used elsewhere. -->
    <str name="f.title.hl.fragsize">1000</str>

    <!-- Field facets; values that match no document are hidden. -->
    <str name="facet">true</str>
    <str name="facet.field">source</str>
    <!-- NOTE(review): author is an analyzed text field (lemmatized and shingled), so
         these buckets are index tokens rather than whole author names. Confirm this
         is intended; faceting on whole names needs an indexed, untokenized field. -->
    <str name="facet.field">author</str>
    <str name="facet.mincount">1</str>

    <!-- Date facet: daily buckets from the start of the previous month until now,
         plus one bucket counting everything older. -->
    <str name="facet.range">published</str>
    <str name="facet.range.start">NOW/MONTHS-1MONTH</str>
    <str name="facet.range.end">NOW</str>
    <str name="facet.range.gap">+1DAY</str>
    <str name="facet.range.other">before</str>

    <!-- MoreLikeThis tuning. NOTE(review): presumably only relevant when a request
         enables mlt; verify these are not meant for the /mlt handler instead. -->
    <str name="mlt.match.include">false</str>
    <str name="mlt.boost">true</str>
    <str name="mlt.mindf">2</str>
  </lst>
</requestHandler>
<!-- Auxiliary endpoints, all registered without handler-level defaults. -->

<!-- Similar-document lookup. -->
<requestHandler class="solr.MoreLikeThisHandler" name="/mlt"/>

<!-- Field analysis inspection; instantiated lazily. -->
<requestHandler class="solr.FieldAnalysisRequestHandler" name="/analysis/field" startup="lazy"/>

<!-- Indexing endpoints. -->
<requestHandler class="solr.UpdateRequestHandler" name="/update"/>
<requestHandler class="solr.JsonUpdateRequestHandler" name="/update/json"/>

<!-- Administrative handlers. -->
<requestHandler class="org.apache.solr.handler.admin.AdminHandlers" name="/admin/"/>
<!-- Health check endpoint. -->
<requestHandler class="solr.PingRequestHandler" name="/admin/ping">
  <!-- Echo every effective parameter back in the response. -->
  <lst name="defaults">
    <str name="echoParams">all</str>
  </lst>
  <!-- The ping query is fixed as an invariant. -->
  <lst name="invariants">
    <str name="q">solrpingquery</str>
  </lst>
</requestHandler>
<!-- Admin interface settings: default query for the admin UI. -->
<admin>
  <defaultQuery>solr</defaultQuery>
</admin>
</config>
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment