diff options
author | Bob Zeleznik <zzzman@gmail.com> | 2019-12-10 18:49:03 -0500 |
---|---|---|
committer | Bob Zeleznik <zzzman@gmail.com> | 2019-12-10 18:49:03 -0500 |
commit | 1dbb45826d4414ed7a1acb5daff730b6e79e97c2 (patch) | |
tree | 9258a346834abccc9ce4881664ccb956f53ae9f7 /solr-8.1.1/example/example-DIH/solr/atom/conf/atom-data-config.xml | |
parent | 4ab742c54d600fb62b02268f48e711258558924b (diff) | |
parent | 68ccde3251622fdb51ef3d21282fddd8207da3c1 (diff) |
Merge branch 'master' of https://github.com/browngraphicslab/Dash-Web
Diffstat (limited to 'solr-8.1.1/example/example-DIH/solr/atom/conf/atom-data-config.xml')
-rw-r--r-- | solr-8.1.1/example/example-DIH/solr/atom/conf/atom-data-config.xml | 35 |
1 files changed, 0 insertions, 35 deletions
```diff
diff --git a/solr-8.1.1/example/example-DIH/solr/atom/conf/atom-data-config.xml b/solr-8.1.1/example/example-DIH/solr/atom/conf/atom-data-config.xml
deleted file mode 100644
index b7de812d0..000000000
--- a/solr-8.1.1/example/example-DIH/solr/atom/conf/atom-data-config.xml
+++ /dev/null
@@ -1,35 +0,0 @@
-<dataConfig>
-  <dataSource type="URLDataSource"/>
-  <document>
-
-    <entity name="stackoverflow"
-            url="https://stackoverflow.com/feeds/tag/solr"
-            processor="XPathEntityProcessor"
-            forEach="/feed|/feed/entry"
-            transformer="HTMLStripTransformer,RegexTransformer">
-
-      <!-- Pick this value up from the feed level and apply to all documents -->
-      <field column="lastchecked_dt" xpath="/feed/updated" commonField="true"/>
-
-      <!-- Keep only the final numeric part of the URL -->
-      <field column="id" xpath="/feed/entry/id" regex=".*/" replaceWith=""/>
-
-      <field column="title" xpath="/feed/entry/title"/>
-      <field column="author" xpath="/feed/entry/author/name"/>
-      <field column="category" xpath="/feed/entry/category/@term"/>
-      <field column="link" xpath="/feed/entry/link[@rel='alternate']/@href"/>
-
-      <!-- Use transformers to convert HTML into plain text.
-        There is also an UpdateRequestProcess to trim remaining spaces.
-      -->
-      <field column="summary" xpath="/feed/entry/summary" stripHTML="true" regex="( |\n)+" replaceWith=" "/>
-
-      <!-- Ignore namespaces when matching XPath -->
-      <field column="rank" xpath="/feed/entry/rank"/>
-
-      <field column="published_dt" xpath="/feed/entry/published"/>
-      <field column="updated_dt" xpath="/feed/entry/updated"/>
-    </entity>
-
-  </document>
-</dataConfig>
```