about summary refs log tree commit diff
path: root/solr-8.1.1/example/example-DIH/solr/mail/conf/clustering
diff options
context:
space:
mode:
author andrewdkim <adkim414@gmail.com> 2019-08-06 12:30:09 -0400
committer andrewdkim <adkim414@gmail.com> 2019-08-06 12:30:09 -0400
commit b6990a61befdea70abd99f125a2488ce5a6f04a6 (patch)
tree 833c13a0ddabb325cc2e39dbb199f111cced22d2 /solr-8.1.1/example/example-DIH/solr/mail/conf/clustering
parent 2c86a6958186c020ce7fbe99555f07ffe9f9f821 (diff)
parent 298d1c9b29d6ce2171fd9ac8274b64583b73f6f5 (diff)
merge from master
Diffstat (limited to 'solr-8.1.1/example/example-DIH/solr/mail/conf/clustering')
-rw-r--r-- solr-8.1.1/example/example-DIH/solr/mail/conf/clustering/carrot2/kmeans-attributes.xml 19
-rw-r--r-- solr-8.1.1/example/example-DIH/solr/mail/conf/clustering/carrot2/lingo-attributes.xml 24
-rw-r--r-- solr-8.1.1/example/example-DIH/solr/mail/conf/clustering/carrot2/stc-attributes.xml 19
3 files changed, 62 insertions, 0 deletions
diff --git a/solr-8.1.1/example/example-DIH/solr/mail/conf/clustering/carrot2/kmeans-attributes.xml b/solr-8.1.1/example/example-DIH/solr/mail/conf/clustering/carrot2/kmeans-attributes.xml
new file mode 100644
index 000000000..d802465f6
--- /dev/null
+++ b/solr-8.1.1/example/example-DIH/solr/mail/conf/clustering/carrot2/kmeans-attributes.xml
@@ -0,0 +1,19 @@
+<!--
+ Default configuration for the bisecting k-means clustering algorithm.
+ Sets the default language (ENGLISH) and the language aggregation strategy.
+ This file can be loaded (and saved) by Carrot2 Workbench; see:
+ http://project.carrot2.org/download.html
+-->
+<attribute-sets default="attributes">
+ <attribute-set id="attributes">
+ <value-set>
+ <label>attributes</label>
+ <attribute key="MultilingualClustering.defaultLanguage">
+ <value type="org.carrot2.core.LanguageCode" value="ENGLISH"/>
+ </attribute>
+ <attribute key="MultilingualClustering.languageAggregationStrategy">
+ <value type="org.carrot2.text.clustering.MultilingualClustering$LanguageAggregationStrategy" value="FLATTEN_MAJOR_LANGUAGE"/>
+ </attribute>
+ </value-set>
+ </attribute-set>
+</attribute-sets>
diff --git a/solr-8.1.1/example/example-DIH/solr/mail/conf/clustering/carrot2/lingo-attributes.xml b/solr-8.1.1/example/example-DIH/solr/mail/conf/clustering/carrot2/lingo-attributes.xml
new file mode 100644
index 000000000..5febfc320
--- /dev/null
+++ b/solr-8.1.1/example/example-DIH/solr/mail/conf/clustering/carrot2/lingo-attributes.xml
@@ -0,0 +1,24 @@
+<!--
+ Default configuration for the Lingo clustering algorithm.
+ Sets the default language (ENGLISH) and a desired cluster count base of 20.
+ This file can be loaded (and saved) by Carrot2 Workbench; see:
+ http://project.carrot2.org/download.html
+-->
+<attribute-sets default="attributes">
+ <attribute-set id="attributes">
+ <value-set>
+ <label>attributes</label>
+ <!--
+ The language to assume for clustered documents (ENGLISH in this file).
+ For the list of allowed LanguageCode values, see:
+ http://download.carrot2.org/stable/manual/#section.attribute.lingo.MultilingualClustering.defaultLanguage
+ -->
+ <attribute key="MultilingualClustering.defaultLanguage">
+ <value type="org.carrot2.core.LanguageCode" value="ENGLISH"/>
+ </attribute>
+ <attribute key="LingoClusteringAlgorithm.desiredClusterCountBase">
+ <value type="java.lang.Integer" value="20"/>
+ </attribute>
+ </value-set>
+ </attribute-set>
+</attribute-sets>
diff --git a/solr-8.1.1/example/example-DIH/solr/mail/conf/clustering/carrot2/stc-attributes.xml b/solr-8.1.1/example/example-DIH/solr/mail/conf/clustering/carrot2/stc-attributes.xml
new file mode 100644
index 000000000..c1bf110c8
--- /dev/null
+++ b/solr-8.1.1/example/example-DIH/solr/mail/conf/clustering/carrot2/stc-attributes.xml
@@ -0,0 +1,19 @@
+<!--
+ Default configuration for the STC clustering algorithm.
+ Sets the default language (ENGLISH) and the language aggregation strategy.
+ This file can be loaded (and saved) by Carrot2 Workbench; see:
+ http://project.carrot2.org/download.html
+-->
+<attribute-sets default="attributes">
+ <attribute-set id="attributes">
+ <value-set>
+ <label>attributes</label>
+ <attribute key="MultilingualClustering.defaultLanguage">
+ <value type="org.carrot2.core.LanguageCode" value="ENGLISH"/>
+ </attribute>
+ <attribute key="MultilingualClustering.languageAggregationStrategy">
+ <value type="org.carrot2.text.clustering.MultilingualClustering$LanguageAggregationStrategy" value="FLATTEN_MAJOR_LANGUAGE"/>
+ </attribute>
+ </value-set>
+ </attribute-set>
+</attribute-sets>