diff options
author | server <brownptcdash@gmail.com> | 2019-12-10 18:12:37 -0500 |
---|---|---|
committer | server <brownptcdash@gmail.com> | 2019-12-10 18:12:37 -0500 |
commit | 7478e610d99d1f2fb383ecbfa0b70d72eae27f81 (patch) | |
tree | 59486701838067351f00580315c05690f36a39ce /solr-8.1.1/example/example-DIH/solr/tika | |
parent | 096718ee546afbd7568bf8ec9e23dca0556d814d (diff) |
solr changes
Diffstat (limited to 'solr-8.1.1/example/example-DIH/solr/tika')
4 files changed, 0 insertions, 142 deletions
diff --git a/solr-8.1.1/example/example-DIH/solr/tika/conf/managed-schema b/solr-8.1.1/example/example-DIH/solr/tika/conf/managed-schema deleted file mode 100644 index b90f314ff..000000000 --- a/solr-8.1.1/example/example-DIH/solr/tika/conf/managed-schema +++ /dev/null @@ -1,54 +0,0 @@ -<?xml version="1.0" encoding="UTF-8" ?> -<!-- - Licensed to the Apache Software Foundation (ASF) under one or more - contributor license agreements. See the NOTICE file distributed with - this work for additional information regarding copyright ownership. - The ASF licenses this file to You under the Apache License, Version 2.0 - (the "License"); you may not use this file except in compliance with - the License. You may obtain a copy of the License at - - http://www.apache.org/licenses/LICENSE-2.0 - - Unless required by applicable law or agreed to in writing, software - distributed under the License is distributed on an "AS IS" BASIS, - WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - See the License for the specific language governing permissions and - limitations under the License. ---> - -<schema name="example-DIH-tika" version="1.6"> - - <uniqueKey>id</uniqueKey> - - <field name="id" type="string" indexed="true" stored="true"/> - <field name="author" type="text_simple" indexed="true" stored="true"/> - <field name="title" type="text_simple" indexed="true" stored="true" multiValued="true"/> - <field name="format" type="string" indexed="true" stored="true"/> - - <!-- field "text" is searchable but it is not stored to save space --> - <field name="text" type="text_simple" indexed="true" stored="false" multiValued="true"/> - - - <!-- Uncomment the dynamicField definition to catch any other fields - that may have been declared in the DIH configuration. - This allows to speed up prototyping. - --> - <!-- <dynamicField name="*" type="string" indexed="true" stored="true" multiValued="true"/> --> - - <!-- The StrField type is not analyzed, but is indexed/stored verbatim. --> - <fieldType name="string" class="solr.StrField" sortMissingLast="true"/> - - - <!-- A basic text field that has reasonable, generic - cross-language defaults: it tokenizes with StandardTokenizer, - and down cases. It does not deal with stopwords or other issues. - See other examples for alternative definitions. - --> - <fieldType name="text_simple" class="solr.TextField" positionIncrementGap="100"> - <analyzer> - <tokenizer class="solr.StandardTokenizerFactory"/> - <filter class="solr.LowerCaseFilterFactory"/> - </analyzer> - </fieldType> - -</schema>
\ No newline at end of file diff --git a/solr-8.1.1/example/example-DIH/solr/tika/conf/solrconfig.xml b/solr-8.1.1/example/example-DIH/solr/tika/conf/solrconfig.xml deleted file mode 100644 index d8509f863..000000000 --- a/solr-8.1.1/example/example-DIH/solr/tika/conf/solrconfig.xml +++ /dev/null @@ -1,61 +0,0 @@ -<?xml version="1.0" encoding="UTF-8" ?> -<!-- - Licensed to the Apache Software Foundation (ASF) under one or more - contributor license agreements. See the NOTICE file distributed with - this work for additional information regarding copyright ownership. - The ASF licenses this file to You under the Apache License, Version 2.0 - (the "License"); you may not use this file except in compliance with - the License. You may obtain a copy of the License at - - http://www.apache.org/licenses/LICENSE-2.0 - - Unless required by applicable law or agreed to in writing, software - distributed under the License is distributed on an "AS IS" BASIS, - WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - See the License for the specific language governing permissions and - limitations under the License. ---> - -<!-- - This is a DEMO configuration highlighting elements - specifically needed to get this example running - such as libraries and request handler specifics. - - It uses defaults or does not define most of production-level settings - such as various caches or auto-commit policies. - - See Solr Reference Guide and other examples for - more details on a well configured solrconfig.xml - https://lucene.apache.org/solr/guide/the-well-configured-solr-instance.html ---> - -<config> - <!-- Controls what version of Lucene various components of Solr - adhere to. Generally, you want to use the latest version to - get all bug fixes and improvements. It is highly recommended - that you fully re-index after changing this setting as it can - affect both how text is indexed and queried. - --> - <luceneMatchVersion>8.1.1</luceneMatchVersion> - - <!-- Load Data Import Handler and Apache Tika (extraction) libraries --> - <lib dir="${solr.install.dir:../../../..}/dist/" regex="solr-dataimporthandler-.*\.jar"/> - <lib dir="${solr.install.dir:../../../..}/contrib/extraction/lib" regex=".*\.jar"/> - - <requestHandler name="/select" class="solr.SearchHandler"> - <lst name="defaults"> - <str name="echoParams">explicit</str> - <str name="df">text</str> - <!-- Change from JSON to XML format (the default prior to Solr 7.0) - <str name="wt">xml</str> - --> - </lst> - </requestHandler> - - <requestHandler name="/dataimport" class="solr.DataImportHandler"> - <lst name="defaults"> - <str name="config">tika-data-config.xml</str> - </lst> - </requestHandler> - -</config> diff --git a/solr-8.1.1/example/example-DIH/solr/tika/conf/tika-data-config.xml b/solr-8.1.1/example/example-DIH/solr/tika/conf/tika-data-config.xml deleted file mode 100644 index 5286fc418..000000000 --- a/solr-8.1.1/example/example-DIH/solr/tika/conf/tika-data-config.xml +++ /dev/null @@ -1,26 +0,0 @@ -<dataConfig> - <dataSource type="BinFileDataSource"/> - <document> - <entity name="file" processor="FileListEntityProcessor" dataSource="null" - baseDir="${solr.install.dir}/example/exampledocs" fileName=".*pdf" - rootEntity="false"> - - <field column="file" name="id"/> - - <entity name="pdf" processor="TikaEntityProcessor" - url="${file.fileAbsolutePath}" format="text"> - - <field column="Author" name="author" meta="true"/> - <!-- in the original PDF, the Author meta-field name is upper-cased, - but in Solr schema it is lower-cased - --> - - <field column="title" name="title" meta="true"/> - <field column="dc:format" name="format" meta="true"/> - - <field column="text" name="text"/> - - </entity> - </entity> - </document> -</dataConfig> diff --git a/solr-8.1.1/example/example-DIH/solr/tika/core.properties b/solr-8.1.1/example/example-DIH/solr/tika/core.properties deleted file mode 100644 index 8b1378917..000000000 --- a/solr-8.1.1/example/example-DIH/solr/tika/core.properties +++ /dev/null @@ -1 +0,0 @@ - |