solr

arirang 분석기

디츠 2019. 10. 4. 09:27

arirang.lucene-analyzer-6.2-1.1.0.jar
0.03MB
arirang-morph-1.1.0.jar
0.46MB
stopwords_ko.txt
0.01MB

1. 첨부 jar 파일을 server/solr-webapp/webapp/WEB-INF/lib 에 적용

2. lang/stopwords_kor.txt 적용

3. server/solr/board/conf/managed-schema 수정

<!-- Filter chain fragment. The opening <analyzer>/<tokenizer> lines for this chain are not
     part of this snippet; presumably this is the index-time analyzer, since the query-time
     analyzer follows it (confirm against the full fieldType definition). -->
<filter class="solr.LowerCaseFilterFactory"/>
<filter class="solr.ClassicFilterFactory"/>
<filter class="org.apache.lucene.analysis.ko.KoreanFilterFactory" hasOrigin="true" hasCNoun="true" bigrammable="false"/>
<!-- Was fused onto the previous line as a malformed "</filter class=.../>" closing tag;
     it must be its own self-closing <filter> element for the schema to be well-formed XML. -->
<filter class="org.apache.lucene.analysis.ko.HanjaMappingFilterFactory"/>
<filter class="org.apache.lucene.analysis.ko.PunctuationDelimitFilterFactory"/>
<!-- Points at the Korean stop-word list from step 2 (lang/stopwords_kor.txt) instead of the
     generic stopwords.txt; the path is resolved relative to the core's conf directory. -->
<filter class="solr.StopFilterFactory" words="lang/stopwords_kor.txt" ignoreCase="true"/>
    
 <!-- Query-time analyzer: arirang Korean tokenizer followed by the filter chain below. -->
 <analyzer type="query">
	<tokenizer class="org.apache.lucene.analysis.ko.KoreanTokenizerFactory"/>
	<filter class="solr.LowerCaseFilterFactory"/>
	<filter class="solr.ClassicFilterFactory"/>
	<filter class="org.apache.lucene.analysis.ko.KoreanFilterFactory" hasOrigin="true" hasCNoun="true" bigrammable="false"/>
	<!-- Was fused onto the previous line as a malformed "</filter class=.../>" closing tag;
	     it must be its own self-closing <filter> element for the schema to be well-formed XML.
	     NOTE(review): the attribute spelling "hasOrijin" is kept exactly as published;
	     confirm the expected parameter name against WordSegmentFilterFactory before renaming it. -->
	<filter class="org.apache.lucene.analysis.ko.WordSegmentFilterFactory" hasOrijin="true"/>
	<filter class="org.apache.lucene.analysis.ko.HanjaMappingFilterFactory"/>
	<filter class="org.apache.lucene.analysis.ko.PunctuationDelimitFilterFactory"/>
	<!-- Previously referenced lang/stopwords_tr.txt (a Turkish list); use the Korean
	     stop-word list from step 2 instead. -->
	<filter class="solr.StopFilterFactory" words="lang/stopwords_kor.txt" ignoreCase="true"/>
</analyzer>