From 755463eed74ed7de9a3c1a12495d2dad655d31d5 Mon Sep 17 00:00:00 2001 From: Alvin Li Date: Tue, 13 Aug 2013 14:42:32 +0800 Subject: added 'isuifang_solr' --- .../example-DIH/solr/mail/conf/data-config.xml | 11 + .../example-DIH/solr/mail/conf/protwords.txt | 21 + .../example-DIH/solr/mail/conf/schema.xml | 373 ++++++++++ .../example-DIH/solr/mail/conf/solrconfig.xml | 792 +++++++++++++++++++++ .../example-DIH/solr/mail/conf/stopwords.txt | 58 ++ .../example-DIH/solr/mail/conf/synonyms.txt | 31 + 6 files changed, 1286 insertions(+) create mode 100644 isuifang_solr/example-DIH/solr/mail/conf/data-config.xml create mode 100644 isuifang_solr/example-DIH/solr/mail/conf/protwords.txt create mode 100644 isuifang_solr/example-DIH/solr/mail/conf/schema.xml create mode 100644 isuifang_solr/example-DIH/solr/mail/conf/solrconfig.xml create mode 100644 isuifang_solr/example-DIH/solr/mail/conf/stopwords.txt create mode 100644 isuifang_solr/example-DIH/solr/mail/conf/synonyms.txt (limited to 'isuifang_solr/example-DIH/solr/mail') diff --git a/isuifang_solr/example-DIH/solr/mail/conf/data-config.xml b/isuifang_solr/example-DIH/solr/mail/conf/data-config.xml new file mode 100644 index 0000000..eed4c2b --- /dev/null +++ b/isuifang_solr/example-DIH/solr/mail/conf/data-config.xml @@ -0,0 +1,11 @@ + + + + + + diff --git a/isuifang_solr/example-DIH/solr/mail/conf/protwords.txt b/isuifang_solr/example-DIH/solr/mail/conf/protwords.txt new file mode 100644 index 0000000..1dfc0ab --- /dev/null +++ b/isuifang_solr/example-DIH/solr/mail/conf/protwords.txt @@ -0,0 +1,21 @@ +# The ASF licenses this file to You under the Apache License, Version 2.0 +# (the "License"); you may not use this file except in compliance with +# the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +#----------------------------------------------------------------------- +# Use a protected word file to protect against the stemmer reducing two +# unrelated words to the same base word. + +# Some non-words that normally won't be encountered, +# just to test that they won't be stemmed. +dontstems +zwhacky + diff --git a/isuifang_solr/example-DIH/solr/mail/conf/schema.xml b/isuifang_solr/example-DIH/solr/mail/conf/schema.xml new file mode 100644 index 0000000..406ce3b --- /dev/null +++ b/isuifang_solr/example-DIH/solr/mail/conf/schema.xml @@ -0,0 +1,373 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + messageId + + + catchAllField + + + + + diff --git a/isuifang_solr/example-DIH/solr/mail/conf/solrconfig.xml b/isuifang_solr/example-DIH/solr/mail/conf/solrconfig.xml new file mode 100644 index 0000000..c0f35b5 --- /dev/null +++ b/isuifang_solr/example-DIH/solr/mail/conf/solrconfig.xml @@ -0,0 +1,792 @@ + + + + + + LUCENE_36 + + + ${solr.abortOnConfigurationError:true} + + + + + + + false + + 10 + + + + 32 + 2147483647 + 10000 + 1000 + + + + + + + + + single + + + + + false + 32 + 10 + + + 2147483647 + 10000 + + + false + + + + + false + + 1 + + + + + + + + + + + + + + + + + + + + + + + + + 1024 + + + + + + + + + + + + + + + + true + + + + + + + + 50 + + + 200 + + + + + + + + + solr 0 10 + rocks 0 10 + static newSearcher warming query from solrconfig.xml + + + + + + + fast_warm 0 10 + static firstSearcher warming query from solrconfig.xml + + + + + false + + + 2 + + + + + + + + + + + + + + + + + + + + + + + explicit + + + + + + + + + + + + + + dismax + explicit + 0.01 + + text^0.5 features^1.0 name^1.2 sku^1.5 id^10.0 manu^1.1 cat^1.4 + + + text^0.2 features^1.1 name^1.5 manu^1.4 manu_exact^1.9 + + + ord(popularity)^0.5 recip(rord(price),1,1000,1000)^0.3 + + + id,name,price,score + + + 2<-1 5<-2 6<90% + + 100 + *:* + + text features name + + 0 + + name + regex + + + + + + + dismax + explicit + text^0.5 features^1.0 name^1.2 sku^1.5 id^10.0 + 2<-1 5<-2 6<90% + + incubationdate_dt:[* TO NOW/DAY-1MONTH]^2.2 + + + + inStock:true + + + + cat + manu_exact + price:[* TO 500] + price:[500 TO *] + + + + + + + + + + textSpell + + + default + spell + ./spellchecker1 + + + + jarowinkler + spell + + org.apache.lucene.search.spell.JaroWinklerDistance + ./spellchecker2 + + + + + solr.FileBasedSpellChecker + file + spellings.txt + UTF-8 + ./spellcheckerFile + + + + + + + + false + + false + + 1 + + + spellcheck + + + + + + data-config.xml + + + + + + + + true + + + tvComponent + + + + + + + + + + + + termsComp + + + + + + + + + + + + + + + + + + + + + + + + + explicit + true + + + + + + + + + 100 + + + + + + + + 70 + + 0.5 + + [-\w ,/\n\"']{20,200} + + + + + + + ]]> + ]]> + + + + + + + + + + + + + 5 + + + + + + + + + + solr + + + + + diff --git a/isuifang_solr/example-DIH/solr/mail/conf/stopwords.txt b/isuifang_solr/example-DIH/solr/mail/conf/stopwords.txt new file mode 100644 index 0000000..b5824da --- /dev/null +++ b/isuifang_solr/example-DIH/solr/mail/conf/stopwords.txt @@ -0,0 +1,58 @@ +# Licensed to the Apache Software Foundation (ASF) under one or more +# contributor license agreements. See the NOTICE file distributed with +# this work for additional information regarding copyright ownership. +# The ASF licenses this file to You under the Apache License, Version 2.0 +# (the "License"); you may not use this file except in compliance with +# the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +#----------------------------------------------------------------------- +# a couple of test stopwords to test that the words are really being +# configured from this file: +stopworda +stopwordb + +#Standard english stop words taken from Lucene's StopAnalyzer +a +an +and +are +as +at +be +but +by +for +if +in +into +is +it +no +not +of +on +or +s +such +t +that +the +their +then +there +these +they +this +to +was +will +with + diff --git a/isuifang_solr/example-DIH/solr/mail/conf/synonyms.txt b/isuifang_solr/example-DIH/solr/mail/conf/synonyms.txt new file mode 100644 index 0000000..b0e31cb --- /dev/null +++ b/isuifang_solr/example-DIH/solr/mail/conf/synonyms.txt @@ -0,0 +1,31 @@ +# The ASF licenses this file to You under the Apache License, Version 2.0 +# (the "License"); you may not use this file except in compliance with +# the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +#----------------------------------------------------------------------- +#some test synonym mappings unlikely to appear in real input text +aaa => aaaa +bbb => bbbb1 bbbb2 +ccc => cccc1,cccc2 +a\=>a => b\=>b +a\,a => b\,b +fooaaa,baraaa,bazaaa + +# Some synonym groups specific to this example +GB,gib,gigabyte,gigabytes +MB,mib,megabyte,megabytes +Television, Televisions, TV, TVs +#notice we use "gib" instead of "GiB" so any WordDelimiterFilter coming +#after us won't split it into two words. + +# Synonym mappings can be used for spelling correction too +pixima => pixma + -- cgit v1.2.2