Skip to content

Instantly share code, notes, and snippets.

@phact
Created September 25, 2014 08:15
Show Gist options
  • Star 0 You must be signed in to star a gist
  • Fork 0 You must be signed in to fork a gist
  • Save phact/8e0b2791558f94472a82 to your computer and use it in GitHub Desktop.
Save phact/8e0b2791558f94472a82 to your computer and use it in GitHub Desktop.
solr config and schema
<?xml version="1.0" encoding="UTF-8" ?>
<config>
<!-- Core-wide settings: configuration-error policy, Lucene compatibility
     version, extra library directory and index data directory. -->
<!-- Resolves to "true" unless the solr.abortOnConfigurationError property is set. -->
<abortOnConfigurationError>${solr.abortOnConfigurationError:true}</abortOnConfigurationError>
<luceneMatchVersion>LUCENE_40</luceneMatchVersion>
<!-- Additional library directory (the DSE install path). -->
<lib dir="/usr/share/dse/"/>
<!-- Resolves to an empty value when the solr.data.dir property is not set. -->
<dataDir>${solr.data.dir:}</dataDir>
<!-- Index directory implementation supplied by DataStax. Going by their
     names, both thresholds are sizes in megabytes (TODO confirm against
     the DSE documentation). -->
<directoryFactory name="DirectoryFactory"
                  class="com.datastax.bdp.cassandra.index.solr.DSENRTCachingDirectoryFactory">
  <double name="maxmergesizemb">5.0</double>
  <double name="maxcachedmb">32.0</double>
</directoryFactory>
<!-- Index writer settings: buffering, merging, locking and commit retention. -->
<indexConfig>
  <useCompoundFile>false</useCompoundFile>
  <ramBufferSizeMB>100</ramBufferSizeMB>
  <mergeFactor>10</mergeFactor>

  <!-- Lock handling. The timeouts are presumably milliseconds; confirm
       against the Solr version in use. -->
  <unlockOnStartup>true</unlockOnStartup>
  <maxFieldLength>10000</maxFieldLength>
  <writeLockTimeout>1000</writeLockTimeout>
  <commitLockTimeout>10000</commitLockTimeout>

  <reopenReaders>true</reopenReaders>

  <!-- Retain one commit point and no optimized commit points. -->
  <deletionPolicy class="solr.SolrDeletionPolicy">
    <str name="maxCommitsToKeep">1</str>
    <str name="maxOptimizedCommitsToKeep">0</str>
  </deletionPolicy>

  <!-- Index-writer debug output is switched off; the file attribute names
       the target used when it is enabled. -->
  <infoStream file="INFOSTREAM.txt">false</infoStream>
</indexConfig>
<!-- Enable JMX with default settings. -->
<jmx/>

<!-- Update handler with automatic soft commits; maxTime is 10000
     (milliseconds per the Solr autoSoftCommit documentation). -->
<updateHandler class="solr.DirectUpdateHandler2">
  <autoSoftCommit>
    <maxTime>10000</maxTime>
  </autoSoftCommit>
</updateHandler>
<!-- Query-time settings: clause limit, filter cache, result windowing and
     searcher warming. -->
<query>
  <maxBooleanClauses>1024</maxBooleanClauses>

  <!-- Filter cache capped at 128 entries, with no initial allocation and
       no autowarming. -->
  <filterCache class="solr.FastLRUCache" size="128" initialSize="0" autowarmCount="0"/>

  <enableLazyFieldLoading>true</enableLazyFieldLoading>
  <queryResultWindowSize>20</queryResultWindowSize>
  <queryResultMaxDocsCached>200</queryResultMaxDocsCached>

  <useColdSearcher>true</useColdSearcher>
  <maxWarmingSearchers>4</maxWarmingSearchers>
</query>
<!-- HTTP request dispatching: /select handling, request parsing limits and
     HTTP caching behaviour. -->
<requestDispatcher handleSelect="true">
  <!-- NOTE(review): enableRemoteStreaming="true" allows requests to make
       Solr read remote URLs or local files (stream.url / stream.file per
       the Solr documentation). Confirm this endpoint is not reachable by
       untrusted clients, or disable it if nothing relies on it.
       The multipart upload limit is 2048000 KB. -->
  <requestParsers enableRemoteStreaming="true" multipartUploadLimitInKB="2048000"/>
  <httpCaching never304="true"/>
</requestDispatcher>
<!-- Default search handler. Requests get these defaults unless they pass
     their own values: echo the handler and explicit params, 10 rows. -->
<requestHandler name="search"
                class="solr.SearchHandler"
                default="true">
  <lst name="defaults">
    <str name="echoHandler">true</str>
    <str name="echoParams">explicit</str>
    <int name="rows">10</int>
  </lst>
</requestHandler>
<!-- XML update endpoint; no handler-specific parameters are configured. -->
<requestHandler name="/update" class="solr.XmlUpdateRequestHandler"/>
<!-- Registers the standard admin handlers under the /admin/ path prefix. -->
<requestHandler name="/admin/" class="solr.admin.AdminHandlers"/>
<!-- Ping endpoint. The invariants cannot be overridden by the request: the
     ping always runs the fixed query "solrpingquery" through the handler
     named "search". -->
<requestHandler name="/admin/ping"
                class="solr.PingRequestHandler">
  <lst name="invariants">
    <str name="qt">search</str>
    <str name="q">solrpingquery</str>
  </lst>
  <lst name="defaults">
    <str name="echoParams">all</str>
  </lst>
</requestHandler>
<!-- Third-party (Flax) suggest component. It defines one suggester named
     "multisuggest", which is not built on startup or on commit. -->
<searchComponent name="flaxsuggest"
                 class="uk.co.flax.solr.suggest.SuggestComponent">
  <lst name="suggester">
    <str name="name">multisuggest</str>
    <str name="buildOnStartup">false</str>
    <str name="buildOnCommit">false</str>

    <!-- Lookup implementation, the field type used for analysis and the
         index path. -->
    <str name="lookupImpl">uk.co.flax.solr.suggest.AnalyzingInfixLookupFactory</str>
    <str name="suggestAnalyzerFieldType">suggest</str>
    <str name="indexPath">ResultlyData.Suggest</str>

    <!-- Dictionary source: suggestions come from the title_suggest field,
         with the context field as the context value. -->
    <str name="dictionaryImpl">uk.co.flax.solr.suggest.ShingledDocumentDictionaryFactory</str>
    <str name="field">title_suggest</str>
    <str name="contextField">context</str>
  </lst>
</searchComponent>
<!-- Suggest endpoint. Its component list contains only "flaxsuggest", and
     suggestions default to the "multisuggest" dictionary. shards.qt points
     sub-requests back at this same /suggest handler. -->
<requestHandler name="/suggest"
                class="solr.SearchHandler">
  <lst name="defaults">
    <str name="suggest">true</str>
    <str name="suggest.dictionary">multisuggest</str>
    <str name="shards.qt">/suggest</str>
  </lst>
  <arr name="components">
    <str>flaxsuggest</str>
  </arr>
</requestHandler>
<!-- XSLT response writer with a stylesheet cache lifetime of 5 seconds. -->
<queryResponseWriter name="xslt"
                     class="solr.XSLTResponseWriter">
  <int name="xsltCacheLifetimeSeconds">5</int>
</queryResponseWriter>
<!-- Binary (javabin) response writer, configured with a DataStax-provided
     resolver factory. -->
<queryResponseWriter name="javabin"
                     class="solr.BinaryResponseWriter">
  <str name="resolverFactory">com.datastax.bdp.search.solr.response.ParallelRowResolver$Factory</str>
</queryResponseWriter>
<!-- Admin UI settings: the default query is match-all. -->
<admin>
  <defaultQuery>*:*</defaultQuery>
</admin>
</config>
<?xml version="1.0" encoding="UTF-8" ?>
<!--
Licensed to the Apache Software Foundation (ASF) under one or more
contributor license agreements. See the NOTICE file distributed with
this work for additional information regarding copyright ownership.
The ASF licenses this file to You under the Apache License, Version 2.0
(the "License"); you may not use this file except in compliance with
the License. You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
-->
<schema name="StreamData" version="1.1">
<types>
<!-- Plain string type with no analyzer configured. -->
<fieldType name="string" class="solr.StrField"/>
<!-- Whole-value, case-insensitive type: the keyword tokenizer keeps the
     input as a single token, which is then lower-cased. -->
<fieldType name="stringBool" class="solr.TextField">
  <analyzer>
    <tokenizer class="solr.KeywordTokenizerFactory"/>
    <filter class="solr.LowerCaseFilterFactory"/>
  </analyzer>
</fieldType>
<!-- Primitive (non-analyzed) field types. -->
<fieldType name="double" class="solr.TrieDoubleField"/>
<fieldType name="byte" class="solr.ByteField"/>
<fieldType name="uuid" class="solr.UUIDField"/>
<fieldType name="long" class="solr.LongField"/>
<!-- Full-text type. The filter chain runs in this order: standard
     tokenization, ASCII folding, lower-casing, then a third-party English
     lemmatizer. -->
<fieldType name="text" class="solr.TextField">
  <analyzer>
    <tokenizer class="solr.StandardTokenizerFactory"/>
    <filter class="solr.ASCIIFoldingFilterFactory"/>
    <filter class="solr.LowerCaseFilterFactory"/>
    <filter class="si.virag.solr.LemmagenLemmatizerFactory" language="english"/>
    <!-- <filter class="solr.PorterStemFilterFactory"/> -->
  </analyzer>
</fieldType>
<!-- Delimited multi-value type: the input is split on the delimiter pattern,
     then each token is lower-cased and trimmed.

     The delimiter pattern is a regular expression. The pipe must be escaped
     as \| because a bare | is regex alternation; the previous pattern
     "|\s*" therefore matched the empty string at every position and never
     split on a literal pipe.

     NOTE(review): the type is named "commaDelimited" but the configured
     delimiter is a pipe. Confirm against the indexed data and use ",\s*"
     if values are really comma-separated. Index-time analysis changes
     generally require reindexing existing documents. -->
<fieldType name="commaDelimited" class="solr.TextField">
  <analyzer>
    <tokenizer class="solr.PatternTokenizerFactory" pattern="\|\s*"/>
    <filter class="solr.LowerCaseFilterFactory"/>
    <filter class="solr.TrimFilterFactory"/>
  </analyzer>
</fieldType>
<!-- Analysis type referenced by the suggester configuration
     (suggestAnalyzerFieldType). The index and query analyzers are declared
     separately but use the same chain: keyword tokenizer, then lower-case. -->
<fieldType name="suggest" class="solr.TextField">
  <analyzer type="index">
    <tokenizer class="solr.KeywordTokenizerFactory"/>
    <filter class="solr.LowerCaseFilterFactory"/>
  </analyzer>
  <analyzer type="query">
    <tokenizer class="solr.KeywordTokenizerFactory"/>
    <filter class="solr.LowerCaseFilterFactory"/>
  </analyzer>
</fieldType>
</types>
<!-- Field definitions. Every field is indexed; only id, Title and
     CrawlerHash are also stored. -->
<fields>
  <field name="id" type="string" indexed="true" stored="true"/>
  <field name="IsPrivate" type="stringBool" indexed="true" stored="false"/>
  <field name="IsCrawled" type="stringBool" indexed="true" stored="false"/>
  <field name="HasUQ" type="stringBool" indexed="true" stored="false"/>
  <field name="LastCrawlTime" type="long" indexed="true" stored="false"/>
  <field name="Category" type="string" indexed="true" stored="false"/>
  <field name="RssSourceUrl" type="string" indexed="true" stored="false"/>
  <field name="UserQueryTypeID" type="string" indexed="true" stored="false"/>
  <field name="Description" type="text" indexed="true" stored="false"/>
  <field name="Title" type="text" indexed="true" stored="true"/>
  <field name="SiteKey" type="stringBool" indexed="true" stored="false"/>
  <field name="Channel" type="stringBool" indexed="true" stored="false"/>
  <field name="ImageURL_" type="string" indexed="true" stored="false"/>
  <field name="LastQueueTime" type="long" indexed="true" stored="false"/>
  <field name="color" type="commaDelimited" indexed="true" stored="false"/>
  <field name="size" type="commaDelimited" indexed="true" stored="false"/>
  <field name="Condition" type="stringBool" indexed="true" stored="false"/>
  <field name="Price" type="double" indexed="true" stored="false"/>
  <field name="LastStatusChangeTimeTicks" type="long" indexed="true" stored="false"/>
  <field name="IsPinned" type="stringBool" indexed="true" stored="false"/>

  <!-- Suggester inputs, populated through the copyField rules declared
       later in this schema. -->
  <field name="title_suggest" type="string" docValues="true" indexed="true" stored="false"/>
  <field name="context" type="string" docValues="true" indexed="true" stored="false"/>

  <field name="ViewedCount" type="long" indexed="true" stored="false"/>
  <field name="SharedCount" type="long" indexed="true" stored="false"/>
  <field name="PinnedCount" type="long" indexed="true" stored="false"/>
  <field name="TrendingScore" type="long" indexed="true" stored="false"/>
  <field name="expirationtime" type="long" indexed="true" stored="false"/>
  <field name="oldPrice" type="double" indexed="true" stored="false"/>
  <field name="mappedsize" type="commaDelimited" indexed="true" stored="false"/>
  <field name="mappedcolor" type="commaDelimited" indexed="true" stored="false"/>
  <field name="CrawlerHash" type="string" indexed="true" stored="true"/>
  <field name="HashUpdate1" type="string" indexed="true" stored="false"/>
</fields>
<!-- Feed the suggester fields: Title is copied into title_suggest and
     UserQueryTypeID into context. -->
<copyField source="Title" dest="title_suggest"/>
<copyField source="UserQueryTypeID" dest="context"/>
<!-- Queries that name no field search the id field, which is also the
     document's unique key. -->
<defaultSearchField>id</defaultSearchField>
<uniqueKey>id</uniqueKey>
</schema>
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment