• R/O
  • HTTP
  • SSH
  • HTTPS

libre10: Commit

libre10 git


Commit MetaInfo

Revision: 9a509ba3cde28f69836a6f2a03811d6ece58505e (tree)
Zeit: 2013-11-18 07:42:49
Autor: gn64_jp <gn64@rec1...>
Committer: gn64_jp

Log Message

solr : Use JapaneseTokenizerFactory(Kuromoji) instead of CJK-Bigram Filter.

Änderungszusammenfassung

Diff

--- a/solr-4.5.1/libre10/solr/libre10/conf/schema.xml
+++ b/solr-4.5.1/libre10/solr/libre10/conf/schema.xml
@@ -16,6 +16,17 @@
16 16   <filter class="solr.NGramFilterFactory" minGramSize="2" maxGramSize="15"/>-->
17 17   </analyzer>
18 18   </fieldType>
   19 + <fieldType name="text_ja" class="solr.TextField">
   20 + <analyzer>
   21 + <tokenizer class="solr.JapaneseTokenizerFactory" mode="extended"/>
   22 + <filter class="solr.JapaneseBaseFormFilterFactory"/>
   23 + <filter class="solr.JapanesePartOfSpeechStopFilterFactory" tags="lang/stoptags_ja.txt" enablePositionIncrements="true"/>
   24 + <filter class="solr.CJKWidthFilterFactory" />
   25 + <filter class="solr.StopFilterFactory" ignoreCase="true" words="lang/stopwords_ja.txt" enablePositionIncrements="true" />
   26 + <filter class="solr.JapaneseKatakanaStemFilterFactory" minimumLength="2"/>
   27 + <filter class="solr.LowerCaseFilterFactory"/>
   28 + </analyzer>
   29 + </fieldType>
19 30   <fieldType name="long" class="solr.LongField" omitNorms="true"/>
20 31   <fieldType name="uuid" class="solr.UUIDField" indexed="true" />
21 32
@@ -28,7 +39,7 @@
28 39   <field name="title_group_id" type="string" indexed="true" stored="true" required="true" />
29 40   <field name="page" type="long" indexed="true" stored="true" required="true" />
30 41   <field name="pagemax" type="long" indexed="true" stored="true" required="true" />
31    - <field name="text" type="text_cjk" indexed="true" stored="true" required="true" termVectors="true" termPositions="true" termOffsets="true" />
   42 + <field name="text" type="text_ja" indexed="true" stored="true" required="true" termVectors="true" termPositions="true" termOffsets="true" />
32 43   <!--<field name="text" type="text_cjk" indexed="true" stored="true" required="true" />-->
33 44   <field name="genre" type="string" indexed="true" stored="true" required="false" multiValued="true" />
34 45   <field name="path_id" type="string" indexed="false" stored="true" required="false" />
Show on old repository browser