Skip to content

Navigation Menu

Sign in
Appearance settings

Search code, repositories, users, issues, pull requests...

Provide feedback

We read every piece of feedback, and take your input very seriously.

Saved searches

Use saved searches to filter your results more quickly

Sign up
Appearance settings

Commit 000c1dd

Browse files
committed
Dictionary based entity extraction now by Solr Text Tagger
1 parent 8891d93 commit 000c1dd

File tree

3 files changed

+21
-3
lines changed

3 files changed

+21
-3
lines changed
Lines changed: 4 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,4 @@
1+
{"requestHandler":{"/all_labels_ss_tag":{
2+
"name":"/all_labels_ss_tag",
3+
"class":"solr.TaggerRequestHandler",
4+
"defaults":{"field":"all_labels_ss_tag"}}}}

‎src/solr/opensemanticsearch-entities/conf/entities/readme.txt‎

Lines changed: 0 additions & 1 deletion
This file was deleted.

‎src/solr/opensemanticsearch-entities/conf/managed-schema‎

Lines changed: 17 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -116,8 +116,22 @@
116 116
<field name="_root_" type="string" indexed="true" stored="false" docValues="false" />
117 117
<field name="_text_" type="text_general" indexed="true" stored="false" multiValued="true"/>
118 118

119-
<!-- Field for text we want only analyze by other automatic generated dictionary filtered fields (getting it by copy field) but we do not need to index or store -->
120-
<field name="do_not_index_txt" type="text_general" indexed="false" stored="false" multiValued="true"/>
119+
<fieldType name="tag" class="solr.TextField" omitNorms="true" omitTermFreqAndPositions="true" postingsFormat="FST50" multiValued="true">
120+
<analyzer type="index">
121+
<tokenizer class="solr.StandardTokenizerFactory"/>
122+
<filter class="solr.EnglishPossessiveFilterFactory"/>
123+
<filter class="solr.LowerCaseFilterFactory"/>
124+
<filter class="solr.ConcatenateGraphFilterFactory" preservePositionIncrements="false"/>
125+
</analyzer>
126+
<analyzer type="query">
127+
<tokenizer class="solr.StandardTokenizerFactory"/>
128+
<filter class="solr.EnglishPossessiveFilterFactory"/>
129+
<filter class="solr.LowerCaseFilterFactory"/>
130+
</analyzer>
131+
</fieldType>
132+
133+
<field name="all_labels_ss_tag" type="tag" stored="false"/>
134+
<copyField source="all_labels_ss" dest="all_labels_ss_tag"/>
121 135

122 136
<!-- This can be enabled, in case the client does not know what fields may be searched. It isn't enabled by default
123 137
because it's very expensive to index everything twice. -->
@@ -193,6 +207,7 @@
193 207
field first in an ascending sort and last in a descending sort.
194 208
-->
195 209

210+
196 211
<!-- The StrField type is not analyzed, but indexed/stored verbatim. -->
197 212
<fieldType name="string" class="solr.StrField" sortMissingLast="true" docValues="true" />
198 213
<fieldType name="strings" class="solr.StrField" sortMissingLast="true" multiValued="true" docValues="true" />

0 commit comments

Comments
(0)

AltStyle によって変換されたページ (->オリジナル) /