X-Git-Url: https://git.mdrn.pl/wolnelektury.git/blobdiff_plain/80d789aa009be1449b83b04b5838ebcc15368d68..ef05330bad3d16d8f478a6cb34e6744cc7565abd:/doc/solrconfig.xml?ds=inline diff --git a/doc/solrconfig.xml b/doc/solrconfig.xml index c57144092..e1484b4bf 100644 --- a/doc/solrconfig.xml +++ b/doc/solrconfig.xml @@ -35,9 +35,9 @@ that you fully re-index after changing this setting as it can affect both how text is indexed and queried. --> - <luceneMatchVersion>LUCENE_40</luceneMatchVersion> + <luceneMatchVersion>6.0.1</luceneMatchVersion> - <!-- lib directives can be used to instruct Solr to load an Jars + <!-- <lib/> directives can be used to instruct Solr to load any Jars identified and use them to resolve any "plugins" specified in your solrconfig.xml or schema.xml (ie: Analyzers, Request Handlers, etc...). @@ -48,11 +48,11 @@ If a "./lib" directory exists in your instanceDir, all files found in it are included as if you had used the following syntax... - + <lib dir="./lib" /> --> - <!-- A 'dir' option by itself adds any files found in the directory + <!-- A 'dir' option by itself adds any files found in the directory to the classpath, this is useful for including all jars in a directory. --> @@ -63,32 +63,34 @@ <!-- When a 'regex' is specified in addition to a 'dir', only the files in that directory which completely match the regex (anchored on both ends) will be included. - --> - <lib dir="../../../dist/" regex="apache-solr-cell-\d.*\.jar" /> - <lib dir="../../../contrib/extraction/lib" regex=".*\.jar" /> - - <lib dir="../../../dist/" regex="apache-solr-clustering-\d.*\.jar" /> - <lib dir="../../../contrib/clustering/lib/" regex=".*\.jar" /> - <lib dir="../../../dist/" regex="apache-solr-langid-\d.*\.jar" /> - <lib dir="../../../contrib/langid/lib/" regex=".*\.jar" /> + If a 'dir' option (with or without a regex) is used and nothing + is found that matches, a warning will be logged. - <lib dir="../../../dist/" regex="apache-solr-velocity-\d.*\.jar" /> - <lib dir="../../../contrib/velocity/lib" regex=".*\.jar" /> - - <!-- If a 'dir' option (with or without a regex) is used and nothing - is found that matches, it will be ignored + The examples below can be used to load some solr-contribs along + with their external dependencies. --> - <lib dir="/total/crap/dir/ignored" /> - - <!-- an exact 'path' can be used instead of a 'dir' to specify a - specific file. This will cause a serious error to be logged if - it can't be loaded. + <lib dir="${solr.install.dir:../../../..}/contrib/extraction/lib" regex=".*\.jar" /> + <lib dir="${solr.install.dir:../../../..}/dist/" regex="solr-cell-\d.*\.jar" /> + + <lib dir="${solr.install.dir:../../../..}/contrib/clustering/lib/" regex=".*\.jar" /> + <lib dir="${solr.install.dir:../../../..}/dist/" regex="solr-clustering-\d.*\.jar" /> + + <lib dir="${solr.install.dir:../../../..}/contrib/langid/lib/" regex=".*\.jar" /> + <lib dir="${solr.install.dir:../../../..}/dist/" regex="solr-langid-\d.*\.jar" /> + + <lib dir="${solr.install.dir:../../../..}/contrib/velocity/lib" regex=".*\.jar" /> + <!-- browse-resources must come before solr-velocity JAR in order to override localized resources --> + <lib path="${solr.install.dir:../../../..}/example/files/browse-resources"/> + <lib dir="${solr.install.dir:../../../..}/dist/" regex="solr-velocity-\d.*\.jar" /> + <!-- an exact 'path' can be used instead of a 'dir' to specify a + specific jar file. This will cause a serious error to be logged + if it can't be loaded. --> <!-- - <lib path="../a-jar-that-does-not-exist.jar" /> + <lib path="../a-jar-that-does-not-exist.jar" /> --> - + <!-- Data Directory Used to specify an alternate directory to hold all index data @@ -98,9 +100,10 @@ --> <dataDir>${solr.data.dir:}</dataDir> + <schemaFactory class="ClassicIndexSchemaFactory"/> <!-- The DirectoryFactory to use for indexes. - + solr.StandardDirectoryFactory is filesystem based and tries to pick the best implementation for the current JVM and platform. solr.NRTCachingDirectoryFactory, the default, @@ -113,26 +116,26 @@ solr.RAMDirectoryFactory is memory based, not persistent, and doesn't work with replication. --> - <directoryFactory name="DirectoryFactory" - class="${solr.directoryFactory:solr.NRTCachingDirectoryFactory}"/> + <directoryFactory name="DirectoryFactory" + class="${solr.directoryFactory:solr.NRTCachingDirectoryFactory}"/> <!-- ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ Index Config - These settings control low-level behavior of indexing Most example settings here show the default value, but are commented out, to more easily see where customizations have been made. - + Note: This replaces <indexDefaults> and <mainIndex> from older versions ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ --> <indexConfig> - <!-- maxFieldLength was removed in 4.0. To get similar behavior, include a - LimitTokenCountFilterFactory in your fieldType definition. E.g. + <!-- maxFieldLength was removed in 4.0. To get similar behavior, include a + LimitTokenCountFilterFactory in your fieldType definition. E.g. <filter class="solr.LimitTokenCountFilterFactory" maxTokenCount="10000"/> --> <!-- Maximum time to wait for a write lock (ms) for an IndexWriter. Default: 1000 --> <!-- <writeLockTimeout>1000</writeLockTimeout> --> - <!-- Expert: Enabling compound file will use less files for the index, - using fewer file descriptors on the expense of performance decrease. + <!-- Expert: Enabling compound file will use less files for the index, + using fewer file descriptors on the expense of performance decrease. Default in Lucene is "true". Default in Solr is "false" (since 3.6) --> <!-- <useCompoundFile>false</useCompoundFile> --> @@ -146,7 +149,7 @@ <!-- <ramBufferSizeMB>32</ramBufferSizeMB> --> <!-- <maxBufferedDocs>1000</maxBufferedDocs> --> - <!-- Expert: Merge Policy + <!-- Expert: Merge Policy The Merge Policy in Lucene controls how merging of segments is done. The default since Solr/Lucene 3.3 is TieredMergePolicy. The default since Lucene 2.3 was the LogByteSizeMergePolicy, @@ -158,7 +161,7 @@ <int name="segmentsPerTier">10</int> </mergePolicy> --> - + <!-- Merge Factor The merge factor controls how many segments will get merged at a time. For TieredMergePolicy, mergeFactor is a convenience parameter which @@ -167,7 +170,7 @@ will be allowed before they are merged into one. Default is 10 for both merge policies. --> - <!-- + <!-- <mergeFactor>10</mergeFactor> --> @@ -177,15 +180,15 @@ can perform merges in the background using separate threads. The SerialMergeScheduler (Lucene 2.2 default) does not. --> - <!-- + <!-- <mergeScheduler class="org.apache.lucene.index.ConcurrentMergeScheduler"/> --> - <!-- LockFactory + <!-- LockFactory This option specifies which Lucene LockFactory implementation to use. - + single = SingleInstanceLockFactory - suggested for a read-only index or when there is no possibility of another process trying to modify the index. @@ -214,7 +217,7 @@ <!-- <unlockOnStartup>false</unlockOnStartup> --> - + <!-- Expert: Controls how often Lucene loads terms into memory Default is 128 and is likely good for most everyone. --> @@ -223,7 +226,7 @@ <!-- If true, IndexReaders will be reopened (often more efficient) instead of closed and then opened. Default: true --> - <!-- + <!-- <reopenReaders>true</reopenReaders> --> @@ -237,11 +240,11 @@ The default Solr IndexDeletionPolicy implementation supports deleting index commit points on number of commits, age of commit point and optimized status. - + The latest commit point should always be preserved regardless of the criteria. --> - <!-- + <!-- <deletionPolicy class="solr.SolrDeletionPolicy"> --> <!-- The number of commit points to be kept --> @@ -256,24 +259,24 @@ <str name="maxCommitAge">30MINUTES</str> <str name="maxCommitAge">1DAY</str> --> - <!-- + <!-- </deletionPolicy> --> <!-- Lucene Infostream - + To aid in advanced debugging, Lucene provides an "InfoStream" of detailed information when indexing. Setting The value to true will instruct the underlying Lucene IndexWriter to write its debugging info the specified file --> - <!-- <infoStream file="INFOSTREAM.txt">false</infoStream> --> + <!-- <infoStream file="INFOSTREAM.txt">false</infoStream> --> </indexConfig> <!-- JMX - + This example enables JMX if and only if an existing MBeanServer is found, use this if you want to configure JMX through JVM parameters. Remove this to disable exposing Solr configuration @@ -283,7 +286,7 @@ --> <jmx /> <!-- If you want to connect to a particular server, specify the - agentId + agentId --> <!-- <jmx agentId="myAgent" /> --> <!-- If you want to start a new MBeanServer, specify the serviceUrl --> @@ -293,11 +296,21 @@ <!-- The default high-performance update handler --> <updateHandler class="solr.DirectUpdateHandler2"> + <!-- Enables a transaction log, used for real-time get, durability, and + and solr cloud replica recovery. The log can grow as big as + uncommitted changes to the index, so use of a hard autoCommit + is recommended (see below). + "dir" - the target directory for transaction logs, defaults to the + solr data directory. --> + <updateLog> + <str name="dir">${solr.ulog.dir:}</str> + </updateLog> + <!-- AutoCommit Perform a hard commit automatically under certain conditions. Instead of enabling autoCommit, consider using "commitWithin" - when adding documents. + when adding documents. http://wiki.apache.org/solr/UpdateXmlMessages @@ -306,14 +319,14 @@ maxTime - Maximum amount of time in ms that is allowed to pass since a document was added before automaticly - triggering a new commit. + triggering a new commit. openSearcher - if false, the commit causes recent index changes to be flushed to stable storage, but does not cause a new searcher to be opened to make those changes visible. --> - <autoCommit> - <maxTime>15000</maxTime> - <openSearcher>false</openSearcher> + <autoCommit> + <maxTime>15000</maxTime> + <openSearcher>false</openSearcher> </autoCommit> <!-- softAutoCommit is like autoCommit except it causes a @@ -322,13 +335,13 @@ faster and more near-realtime friendly than a hard commit. --> <!-- - <autoSoftCommit> - <maxTime>1000</maxTime> + <autoSoftCommit> + <maxTime>1000</maxTime> </autoSoftCommit> --> <!-- Update Related Event Listeners - + Various IndexWriter related events can trigger Listeners to take actions. @@ -337,10 +350,10 @@ --> <!-- The RunExecutableListener executes an external command from a hook such as postCommit or postOptimize. - + exe - the name of the executable to run dir - dir to use as the current working directory. (default=".") - wait - the calling thread waits until the executable returns. + wait - the calling thread waits until the executable returns. (default="true") args - the arguments to pass to the program. (default is none) env - environment variables to set. (default is none) @@ -359,16 +372,8 @@ </listener> --> - <!-- Enables a transaction log, currently used for real-time get. - "dir" - the target directory for transaction logs, defaults to the - solr data directory. --> - <updateLog> - <str name="dir">${solr.data.dir:}</str> - </updateLog> - - </updateHandler> - + <!-- IndexReaderFactory Use the following format to specify a custom IndexReaderFactory, @@ -400,7 +405,7 @@ be specified. --> <!-- - <indexReaderFactory name="IndexReaderFactory" + <indexReaderFactory name="IndexReaderFactory" class="solr.StandardIndexReaderFactory"> <int name="setTermIndexDivisor">12</int> </indexReaderFactory > @@ -416,12 +421,12 @@ is thrown if exceeded. ** WARNING ** - + This option actually modifies a global Lucene property that will affect all SolrCores. If multiple solrconfig.xml files disagree on this property, the value at any given moment will be based on the last SolrCore to be initialized. - + --> <maxBooleanClauses>1024</maxBooleanClauses> @@ -430,7 +435,7 @@ There are two implementations of cache available for Solr, LRUCache, based on a synchronized LinkedHashMap, and - FastLRUCache, based on a ConcurrentHashMap. + FastLRUCache, based on a ConcurrentHashMap. FastLRUCache has faster gets and slower puts in single threaded operation and thus is generally faster than LRUCache @@ -455,7 +460,7 @@ initialSize - the initial capacity (number of entries) of the cache. (see java.util.HashMap) autowarmCount - the number of entries to prepopulate from - and old cache. + and old cache. --> <filterCache class="solr.FastLRUCache" size="512" @@ -463,28 +468,28 @@ autowarmCount="0"/> <!-- Query Result Cache - + Caches results of searches - ordered lists of document ids - (DocList) based on a query, a sort, and the range of documents requested. + (DocList) based on a query, a sort, and the range of documents requested. --> <queryResultCache class="solr.LRUCache" size="512" initialSize="512" autowarmCount="0"/> - + <!-- Document Cache Caches Lucene Document objects (the stored fields for each document). Since Lucene internal document ids are transient, - this cache will not be autowarmed. + this cache will not be autowarmed. --> <documentCache class="solr.LRUCache" size="512" initialSize="512" autowarmCount="0"/> - + <!-- Field Value Cache - + Cache used to hold field values that are quickly accessible by document id. The fieldValueCache is created by default even if not configured here. @@ -502,8 +507,8 @@ name through SolrIndexSearcher.getCache(),cacheLookup(), and cacheInsert(). The purpose is to enable easy caching of user/application level data. The regenerator argument should - be specified as an implementation of solr.CacheRegenerator - if autowarming is desired. + be specified as an implementation of solr.CacheRegenerator + if autowarming is desired. --> <!-- <cache name="myUserCache" @@ -550,12 +555,12 @@ are collected. For example, if a search for a particular query requests matching documents 10 through 19, and queryWindowSize is 50, then documents 0 through 49 will be collected and cached. Any further - requests in that range can be satisfied via the cache. + requests in that range can be satisfied via the cache. --> <queryResultWindowSize>20</queryResultWindowSize> <!-- Maximum number of documents to cache for any entry in the - queryResultCache. + queryResultCache. --> <queryResultMaxDocsCached>200</queryResultMaxDocsCached> @@ -573,10 +578,10 @@ prepared but there is no current registered searcher to handle requests or to gain autowarming data from. - + --> <!-- QuerySenderListener takes an array of NamedList and executes a - local query request for each NamedList in sequence. + local query request for each NamedList in sequence. --> <listener event="newSearcher" class="solr.QuerySenderListener"> <arr name="queries"> @@ -604,7 +609,7 @@ <useColdSearcher>false</useColdSearcher> <!-- Max Warming Searchers - + Maximum number of searchers that may be warming in the background concurrently. An error is returned if this limit is exceeded. @@ -648,14 +653,14 @@ multipartUploadLimitInKB - specifies the max size of Multipart File Uploads that Solr will allow in a Request. - + *** WARNING *** The settings below authorize Solr to fetch remote files, You should make sure your system has some authentication before using enableRemoteStreaming="true" - --> - <requestParsers enableRemoteStreaming="true" + --> + <requestParsers enableRemoteStreaming="true" multipartUploadLimitInKB="2048000" /> <!-- HTTP Caching @@ -669,21 +674,21 @@ <!-- If you include a <cacheControl> directive, it will be used to generate a Cache-Control header (as well as an Expires header if the value contains "max-age=") - + By default, no Cache-Control header is generated. - + You can use the <cacheControl> option even if you have set never304="true" --> <!-- <httpCaching never304="true" > - <cacheControl>max-age=30, public</cacheControl> + <cacheControl>max-age=30, public</cacheControl> </httpCaching> --> <!-- To enable Solr to respond with automatically generated HTTP Caching headers, and to response to Cache Validation requests correctly, set the value of never304="false" - + This will cause Solr to generate Last-Modified and ETag headers based on the properties of the Index. @@ -708,12 +713,12 @@ <!-- <httpCaching lastModifiedFrom="openTime" etagSeed="Solr"> - <cacheControl>max-age=30, public</cacheControl> + <cacheControl>max-age=30, public</cacheControl> </httpCaching> --> </requestDispatcher> - <!-- Request Handlers + <!-- Request Handlers http://wiki.apache.org/solr/SolrRequestHandler @@ -727,7 +732,7 @@ like so: http://host/app/[core/]select?qt=name If no qt is given, then the requestHandler that declares default="true" will be used or the one named "standard". - + If a Request Handler is declared with startup="lazy", then it will not be initialized until the first request that uses it. @@ -802,16 +807,16 @@ <str>nameOfCustomComponent2</str> </arr> --> - </requestHandler> + </requestHandler> <!-- A request handler that returns indented JSON by default --> <requestHandler name="/query" class="solr.SearchHandler"> - <lst name="defaults"> - <str name="echoParams">explicit</str> - <str name="wt">json</str> - <str name="indent">true</str> - <str name="df">text</str> - </lst> + <lst name="defaults"> + <str name="echoParams">explicit</str> + <str name="wt">json</str> + <str name="indent">true</str> + <str name="df">text</str> + </lst> </requestHandler> @@ -826,9 +831,9 @@ </lst> </requestHandler> - - <!-- A Robust Example - + + <!-- A Robust Example + This example SearchHandler declaration shows off usage of the SearchHandler with many defaults declared @@ -908,14 +913,14 @@ <!-- Spell checking defaults --> <str name="spellcheck">on</str> - <str name="spellcheck.extendedResults">false</str> + <str name="spellcheck.extendedResults">false</str> <str name="spellcheck.count">5</str> <str name="spellcheck.alternativeTermCount">2</str> - <str name="spellcheck.maxResultsForSuggest">5</str> + <str name="spellcheck.maxResultsForSuggest">5</str> <str name="spellcheck.collate">true</str> - <str name="spellcheck.collateExtendedResults">true</str> + <str name="spellcheck.collateExtendedResults">true</str> <str name="spellcheck.maxCollationTries">5</str> - <str name="spellcheck.maxCollations">3</str> + <str name="spellcheck.maxCollations">3</str> </lst> <!-- append spellchecking to our list of components --> @@ -925,8 +930,8 @@ </requestHandler> - <!-- Update Request Handler. - + <!-- Update Request Handler. + http://wiki.apache.org/solr/UpdateXmlMessages The canonical Request Handler for Modifying the Index through @@ -935,17 +940,17 @@ Note: Since solr1.1 requestHandlers requires a valid content type header if posted in the body. For example, curl now requires: -H 'Content-type:text/xml; charset=utf-8' - - To override the request content type and force a specific - Content-type, use the request parameter: + + To override the request content type and force a specific + Content-type, use the request parameter: ?update.contentType=text/csv - + This handler will pick a response format to match the input if the 'wt' parameter is not explicit --> <requestHandler name="/update" class="solr.UpdateRequestHandler"> - <!-- See below for information on defining - updateRequestProcessorChains that can be used by name + <!-- See below for information on defining + updateRequestProcessorChains that can be used by name on each Update Request --> <!-- @@ -954,14 +959,14 @@ </lst> --> </requestHandler> - + <!-- Solr Cell Update Request Handler - http://wiki.apache.org/solr/ExtractingRequestHandler + http://wiki.apache.org/solr/ExtractingRequestHandler --> - <requestHandler name="/update/extract" + <requestHandler name="/update/extract" startup="lazy" class="solr.extraction.ExtractingRequestHandler" > <lst name="defaults"> @@ -994,7 +999,7 @@ field value analysis will be marked as "matched" for every token that is produces by the query analysis --> - <requestHandler name="/analysis/field" + <requestHandler name="/analysis/field" startup="lazy" class="solr.FieldAnalysisRequestHandler" /> @@ -1027,111 +1032,34 @@ request parameter that holds the query text to be analyzed. It also supports the "analysis.showmatch" parameter which when set to true, all field tokens that match the query tokens will be marked - as a "match". + as a "match". --> - <requestHandler name="/analysis/document" - class="solr.DocumentAnalysisRequestHandler" + <requestHandler name="/analysis/document" + class="solr.DocumentAnalysisRequestHandler" startup="lazy" /> - <!-- Admin Handlers - - Admin Handlers - This will register all the standard admin - RequestHandlers. - --> - <requestHandler name="/admin/" - class="solr.admin.AdminHandlers" /> - <!-- This single handler is equivalent to the following... --> - <!-- - <requestHandler name="/admin/luke" class="solr.admin.LukeRequestHandler" /> - <requestHandler name="/admin/system" class="solr.admin.SystemInfoHandler" /> - <requestHandler name="/admin/plugins" class="solr.admin.PluginInfoHandler" /> - <requestHandler name="/admin/threads" class="solr.admin.ThreadDumpHandler" /> - <requestHandler name="/admin/properties" class="solr.admin.PropertiesRequestHandler" /> - <requestHandler name="/admin/file" class="solr.admin.ShowFileRequestHandler" > - --> - <!-- If you wish to hide files under ${solr.home}/conf, explicitly - register the ShowFileRequestHandler using: - --> - <!-- - <requestHandler name="/admin/file" - class="solr.admin.ShowFileRequestHandler" > - <lst name="invariants"> - <str name="hidden">synonyms.txt</str> - <str name="hidden">anotherfile.txt</str> - </lst> - </requestHandler> - --> - - <!-- ping/healthcheck --> - <requestHandler name="/admin/ping" class="solr.PingRequestHandler"> - <lst name="invariants"> - <str name="q">solrpingquery</str> - </lst> - <lst name="defaults"> - <str name="echoParams">all</str> - </lst> - <!-- An optional feature of the PingRequestHandler is to configure the - handler with a "healthcheckFile" which can be used to enable/disable - the PingRequestHandler. - relative paths are resolved against the data dir - --> - <!-- <str name="healthcheckFile">server-enabled.txt</str> --> - </requestHandler> - <!-- Echo the request contents back to the client --> <requestHandler name="/debug/dump" class="solr.DumpRequestHandler" > <lst name="defaults"> - <str name="echoParams">explicit</str> + <str name="echoParams">explicit</str> <str name="echoHandler">true</str> </lst> </requestHandler> - - <!-- Solr Replication - - The SolrReplicationHandler supports replicating indexes from a - "master" used for indexing and "slaves" used for queries. - - http://wiki.apache.org/solr/SolrReplication - - In the example below, remove the <lst name="master"> section if - this is just a slave and remove the <lst name="slave"> section - if this is just a master. - --> - <!-- - <requestHandler name="/replication" class="solr.ReplicationHandler" > - <lst name="master"> - <str name="replicateAfter">commit</str> - <str name="replicateAfter">startup</str> - <str name="confFiles">schema.xml,stopwords.txt</str> - </lst> - <lst name="slave"> - <str name="masterUrl">http://localhost:8983/solr</str> - <str name="pollInterval">00:00:60</str> - </lst> - </requestHandler> - --> - - <!-- Solr Replication for SolrCloud Recovery - - This is the config need for SolrCloud's recovery replication. - --> - <requestHandler name="/replication" class="solr.ReplicationHandler" startup="lazy" /> - <!-- Search Components - Search components are registered to SolrCore and used by + Search components are registered to SolrCore and used by instances of SearchHandler (which can access them by name) - + By default, the following components are available: - + <searchComponent name="query" class="solr.QueryComponent" /> <searchComponent name="facet" class="solr.FacetComponent" /> <searchComponent name="mlt" class="solr.MoreLikeThisComponent" /> <searchComponent name="highlight" class="solr.HighlightComponent" /> <searchComponent name="stats" class="solr.StatsComponent" /> <searchComponent name="debug" class="solr.DebugComponent" /> - + Default configuration in a requestHandler would look like: <arr name="components"> @@ -1143,28 +1071,28 @@ <str>debug</str> </arr> - If you register a searchComponent to one of the standard names, + If you register a searchComponent to one of the standard names, that will be used instead of the default. To insert components before or after the 'standard' components, use: - + <arr name="first-components"> <str>myFirstComponentName</str> </arr> - + <arr name="last-components"> <str>myLastComponentName</str> </arr> NOTE: The component registered with the name "debug" will - always be executed after the "last-components" - + always be executed after the "last-components" + --> - + <!-- Spell Check The spell check component can return a list of alternative spelling - suggestions. + suggestions. http://wiki.apache.org/solr/SpellCheckComponent --> @@ -1199,11 +1127,11 @@ <float name="thresholdTokenFrequency">.01</float> --> </lst> - + <!-- a spellchecker that can break or combine words. See "/spell" handler below for usage --> <lst name="spellchecker"> <str name="name">wordbreak</str> - <str name="classname">solr.WordBreakSolrSpellChecker</str> + <str name="classname">solr.WordBreakSolrSpellChecker</str> <str name="field">name</str> <str name="combineWords">true</str> <str name="breakWords">true</str> @@ -1222,7 +1150,7 @@ </lst> --> - <!-- a spellchecker that use an alternate comparator + <!-- a spellchecker that use an alternate comparator comparatorClass be one of: 1. score (default) @@ -1249,7 +1177,7 @@ --> </searchComponent> - <!-- A request handler for demonstrating the spellcheck component. + <!-- A request handler for demonstrating the spellcheck component. NOTE: This is purely as an example. The whole purpose of the SpellCheckComponent is to hook it into the request handler that @@ -1258,7 +1186,7 @@ IN OTHER WORDS, THERE IS REALLY GOOD CHANCE THE SETUP BELOW IS NOT WHAT YOU WANT FOR YOUR PRODUCTION SYSTEM! - + See http://wiki.apache.org/solr/SpellCheckComponent for details on the request parameters. --> @@ -1272,14 +1200,14 @@ <str name="spellcheck.dictionary">default</str> <str name="spellcheck.dictionary">wordbreak</str> <str name="spellcheck">on</str> - <str name="spellcheck.extendedResults">true</str> + <str name="spellcheck.extendedResults">true</str> <str name="spellcheck.count">10</str> <str name="spellcheck.alternativeTermCount">5</str> - <str name="spellcheck.maxResultsForSuggest">5</str> + <str name="spellcheck.maxResultsForSuggest">5</str> <str name="spellcheck.collate">true</str> - <str name="spellcheck.collateExtendedResults">true</str> + <str name="spellcheck.collateExtendedResults">true</str> <str name="spellcheck.maxCollationTries">10</str> - <str name="spellcheck.maxCollations">5</str> + <str name="spellcheck.maxCollations">5</str> </lst> <arr name="last-components"> <str>spellcheck</str> @@ -1296,8 +1224,8 @@ This is purely as an example. - In reality you will likely want to add the component to your - already specified request handlers. + In reality you will likely want to add the component to your + already specified request handlers. --> <requestHandler name="/tvrh" class="solr.SearchHandler" startup="lazy"> <lst name="defaults"> @@ -1309,114 +1237,8 @@ </arr> </requestHandler> - <!-- Clustering Component - - http://wiki.apache.org/solr/ClusteringComponent - - You'll need to set the solr.cluster.enabled system property - when running solr to run with clustering enabled: - - java -Dsolr.clustering.enabled=true -jar start.jar - - --> - <searchComponent name="clustering" - enable="${solr.clustering.enabled:false}" - class="solr.clustering.ClusteringComponent" > - <!-- Declare an engine --> - <lst name="engine"> - <!-- The name, only one can be named "default" --> - <str name="name">default</str> - - <!-- Class name of Carrot2 clustering algorithm. - - Currently available algorithms are: - - * org.carrot2.clustering.lingo.LingoClusteringAlgorithm - * org.carrot2.clustering.stc.STCClusteringAlgorithm - * org.carrot2.clustering.kmeans.BisectingKMeansClusteringAlgorithm - - See http://project.carrot2.org/algorithms.html for the - algorithm's characteristics. - --> - <str name="carrot.algorithm">org.carrot2.clustering.lingo.LingoClusteringAlgorithm</str> + <!-- Clustering Component. (Omitted here. See the default Solr example for a typical configuration.) --> - <!-- Overriding values for Carrot2 default algorithm attributes. - - For a description of all available attributes, see: - http://download.carrot2.org/stable/manual/#chapter.components. - Use attribute key as name attribute of str elements - below. These can be further overridden for individual - requests by specifying attribute key as request parameter - name and attribute value as parameter value. - --> - <str name="LingoClusteringAlgorithm.desiredClusterCountBase">20</str> - - <!-- Location of Carrot2 lexical resources. - - A directory from which to load Carrot2-specific stop words - and stop labels. Absolute or relative to Solr config directory. - If a specific resource (e.g. stopwords.en) is present in the - specified dir, it will completely override the corresponding - default one that ships with Carrot2. - - For an overview of Carrot2 lexical resources, see: - http://download.carrot2.org/head/manual/#chapter.lexical-resources - --> - <str name="carrot.lexicalResourcesDir">clustering/carrot2</str> - - <!-- The language to assume for the documents. - - For a list of allowed values, see: - http://download.carrot2.org/stable/manual/#section.attribute.lingo.MultilingualClustering.defaultLanguage - --> - <str name="MultilingualClustering.defaultLanguage">ENGLISH</str> - </lst> - <lst name="engine"> - <str name="name">stc</str> - <str name="carrot.algorithm">org.carrot2.clustering.stc.STCClusteringAlgorithm</str> - </lst> - </searchComponent> - - <!-- A request handler for demonstrating the clustering component - - This is purely as an example. - - In reality you will likely want to add the component to your - already specified request handlers. - --> - <requestHandler name="/clustering" - startup="lazy" - enable="${solr.clustering.enabled:false}" - class="solr.SearchHandler"> - <lst name="defaults"> - <bool name="clustering">true</bool> - <str name="clustering.engine">default</str> - <bool name="clustering.results">true</bool> - <!-- The title field --> - <str name="carrot.title">name</str> - <str name="carrot.url">id</str> - <!-- The field to cluster on --> - <str name="carrot.snippet">features</str> - <!-- produce summaries --> - <bool name="carrot.produceSummary">true</bool> - <!-- the maximum number of labels per cluster --> - <!--<int name="carrot.numDescriptions">5</int>--> - <!-- produce sub clusters --> - <bool name="carrot.outputSubClusters">false</bool> - - <str name="defType">edismax</str> - <str name="qf"> - text^0.5 features^1.0 name^1.2 sku^1.5 id^10.0 manu^1.1 cat^1.4 - </str> - <str name="q.alt">*:*</str> - <str name="rows">10</str> - <str name="fl">*,score</str> - </lst> - <arr name="last-components"> - <str>clustering</str> - </arr> - </requestHandler> - <!-- Terms Component http://wiki.apache.org/solr/TermsComponent @@ -1430,7 +1252,8 @@ <requestHandler name="/terms" class="solr.SearchHandler" startup="lazy"> <lst name="defaults"> <bool name="terms">true</bool> - </lst> + <bool name="distrib">false</bool> + </lst> <arr name="components"> <str>terms</str> </arr> @@ -1470,7 +1293,7 @@ <highlighting> <!-- Configure the standard fragmenter --> <!-- This could most likely be commented out in the "default" case --> - <fragmenter name="gap" + <fragmenter name="gap" default="true" class="solr.highlight.GapFragmenter"> <lst name="defaults"> @@ -1478,10 +1301,10 @@ </lst> </fragmenter> - <!-- A regular-expression-based fragmenter - (for sentence extraction) + <!-- A regular-expression-based fragmenter + (for sentence extraction) --> - <fragmenter name="regex" + <fragmenter name="regex" class="solr.highlight.RegexFragmenter"> <lst name="defaults"> <!-- slightly smaller fragsizes work better because of slop --> @@ -1494,7 +1317,7 @@ </fragmenter> <!-- Configure the standard formatter --> - <formatter name="html" + <formatter name="html" default="true" class="solr.highlight.HtmlFormatter"> <lst name="defaults"> @@ -1504,27 +1327,27 @@ </formatter> <!-- Configure the standard encoder --> - <encoder name="html" + <encoder name="html" class="solr.highlight.HtmlEncoder" /> <!-- Configure the standard fragListBuilder --> - <fragListBuilder name="simple" + <fragListBuilder name="simple" class="solr.highlight.SimpleFragListBuilder"/> - + <!-- Configure the single fragListBuilder --> - <fragListBuilder name="single" + <fragListBuilder name="single" class="solr.highlight.SingleFragListBuilder"/> - + <!-- Configure the weighted fragListBuilder --> - <fragListBuilder name="weighted" + <fragListBuilder name="weighted" default="true" class="solr.highlight.WeightedFragListBuilder"/> - + <!-- default tag FragmentsBuilder --> - <fragmentsBuilder name="default" + <fragmentsBuilder name="default" default="true" class="solr.highlight.ScoreOrderFragmentsBuilder"> - <!-- + <!-- <lst name="defaults"> <str name="hl.multiValuedSeparatorChar">/</str> </lst> @@ -1532,7 +1355,7 @@ </fragmentsBuilder> <!-- multi-colored tag FragmentsBuilder --> - <fragmentsBuilder name="colored" + <fragmentsBuilder name="colored" class="solr.highlight.ScoreOrderFragmentsBuilder"> <lst name="defaults"> <str name="hl.tag.pre"><![CDATA[ @@ -1544,8 +1367,8 @@ <str name="hl.tag.post"><![CDATA[</b>]]></str> </lst> </fragmentsBuilder> - - <boundaryScanner name="default" + + <boundaryScanner name="default" default="true" class="solr.highlight.SimpleBoundaryScanner"> <lst name="defaults"> @@ -1553,8 +1376,8 @@ <str name="hl.bs.chars">.,!? 	 </str> </lst> </boundaryScanner> - - <boundaryScanner name="breakIterator" + + <boundaryScanner name="breakIterator" class="solr.highlight.BreakIteratorBoundaryScanner"> <lst name="defaults"> <!-- type should be one of CHARACTER, WORD(default), LINE and SENTENCE --> @@ -1576,15 +1399,15 @@ http://wiki.apache.org/solr/UpdateRequestProcessor - --> + --> <!-- Deduplication An example dedup update processor that creates the "id" field on the fly based on the hash code of some other fields. This example has overwriteDupes set to false since we are using the id field as the signatureField and Solr will maintain - uniqueness based on that anyway. - + uniqueness based on that anyway. + --> <!-- <updateRequestProcessorChain name="dedupe"> @@ -1599,7 +1422,7 @@ <processor class="solr.RunUpdateProcessorFactory" /> </updateRequestProcessorChain> --> - + <!-- Language identification This example update chain identifies the language of the incoming @@ -1639,7 +1462,7 @@ <processor class="solr.RunUpdateProcessorFactory" /> </updateRequestProcessorChain> --> - + <!-- Response Writers http://wiki.apache.org/solr/QueryResponseWriter @@ -1655,7 +1478,7 @@ overridden... --> <!-- - <queryResponseWriter name="xml" + <queryResponseWriter name="xml" default="true" class="solr.XMLResponseWriter" /> <queryResponseWriter name="json" class="solr.JSONResponseWriter"/> @@ -1664,6 +1487,7 @@ <queryResponseWriter name="php" class="solr.PHPResponseWriter"/> <queryResponseWriter name="phps" class="solr.PHPSerializedResponseWriter"/> <queryResponseWriter name="csv" class="solr.CSVResponseWriter"/> + <queryResponseWriter name="schema.xml" class="solr.SchemaXmlResponseWriter"/> --> <queryResponseWriter name="json" class="solr.JSONResponseWriter"> @@ -1673,16 +1497,17 @@ --> <str name="content-type">text/plain; charset=UTF-8</str> </queryResponseWriter> - + <!-- Custom response writers can be declared as needed... --> - <queryResponseWriter name="velocity" class="solr.VelocityResponseWriter" startup="lazy"/> - + <queryResponseWriter name="velocity" class="solr.VelocityResponseWriter" startup="lazy"> + <str name="template.base.dir">${velocity.template.base.dir:}</str> + </queryResponseWriter> <!-- XSLT response writer transforms the XML output by any xslt file found in Solr's conf/xslt directory. Changes to xslt files are checked for - every xsltCacheLifetimeSeconds. + every xsltCacheLifetimeSeconds. --> <queryResponseWriter name="xslt" class="solr.XSLTResponseWriter"> <int name="xsltCacheLifetimeSeconds">5</int> @@ -1710,11 +1535,11 @@ --> <!-- example of registering a custom function parser --> <!-- - <valueSourceParser name="myfunc" + <valueSourceParser name="myfunc" class="com.mycompany.MyValueSourceParser" /> --> - - + + <!-- Document Transformers http://wiki.apache.org/solr/DocTransformers --> @@ -1723,12 +1548,12 @@ <transformer name="db" class="com.mycompany.LoadFromDatabaseTransformer" > <int name="connection">jdbc://....</int> </transformer> - + To add a constant value to all docs, use: <transformer name="mytrans2" class="org.apache.solr.response.transform.ValueAugmenterFactory" > <int name="value">5</int> </transformer> - + If you want the user to still be able to change it with _value:something_ use this: <transformer name="mytrans3" class="org.apache.solr.response.transform.ValueAugmenterFactory" > <double name="defaultValue">5</double> @@ -1738,11 +1563,6 @@ EditorialMarkerFactory will do exactly that: <transformer name="qecBooster" class="org.apache.solr.response.transform.EditorialMarkerFactory" /> --> - - <!-- Legacy config for the admin interface --> - <admin> - <defaultQuery>*:*</defaultQuery> - </admin> </config>