diff options
Diffstat (limited to 'solr-8.3.1/example/exampledocs/utf8-example.xml')
-rw-r--r-- | solr-8.3.1/example/exampledocs/utf8-example.xml | 42 |
1 files changed, 42 insertions, 0 deletions
diff --git a/solr-8.3.1/example/exampledocs/utf8-example.xml b/solr-8.3.1/example/exampledocs/utf8-example.xml
new file mode 100644
index 000000000..ee300a683
--- /dev/null
+++ b/solr-8.3.1/example/exampledocs/utf8-example.xml
@@ -0,0 +1,42 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--
+ Licensed to the Apache Software Foundation (ASF) under one or more
+ contributor license agreements. See the NOTICE file distributed with
+ this work for additional information regarding copyright ownership.
+ The ASF licenses this file to You under the Apache License, Version 2.0
+ (the "License"); you may not use this file except in compliance with
+ the License. You may obtain a copy of the License at
+
+     http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+-->
+
+<!--
+  After posting this to Solr with bin/post, searching for "êâîôû" from
+  the solr/admin/ search page must return this document.
+ -->
+
+<add>
+  <doc>
+    <field name="id">UTF8TEST</field>
+    <field name="name">Test with some UTF-8 encoded characters</field>
+    <field name="manu">Apache Software Foundation</field>
+    <field name="cat">software</field>
+    <field name="cat">search</field>
+    <field name="features">No accents here</field>
+    <field name="features">This is an e acute: é</field>
+    <field name="features">eaiou with circumflexes: êâîôû</field>
+    <field name="features">eaiou with umlauts: ëäïöü</field>
+    <field name="features">tag with escaped chars: &lt;nicetag/&gt;</field>
+    <field name="features">escaped ampersand: Bonnie &amp; Clyde</field>
+    <field name="features">Outside the BMP:𐌈 codepoint=10308, a circle with an x inside. UTF8=f0908c88 UTF16=d800 df08</field>
+    <field name="price">0.0</field>
+    <field name="inStock">true</field>
+  </doc>
+</add>
+