如何在Solr中配置拼写检查功能?

时间:2019-01-11 13:07:47

标签: apache solr solrcloud

我想在Apache Solr-6.6.4中实现拼写检查功能,但不能这样做。我的程序没有提示我应该使用的正确单词(在Solr查询中)。

我的收藏名称是 employee 。我想对字段名称​​ jobTitleName 实施拼写检查。

我已引用以下链接: http://akashmusings.blogspot.com/2016/03/spell-check-with-solr.html

我正在使用以下配置。

schema.xml

<uniqueKey>userId</uniqueKey>

 <field name="userId" type="string" indexed="true" stored="true" required="false" /> 
 <field name="jobTitleName" type="string" indexed="false" stored="true" required="false"/>
 <field name="firstName" type="string" indexed="false" stored="true" required="false"/>
 <field name="lastName" type="string" indexed="false" stored="true" required="false"/>
 <field name="preferredFullName" type="string" indexed="false" stored="true" required="false"/>
 <field name="employeeCode" type="string" indexed="false" stored="true" required="false"/>
 <field name="region" type="string" indexed="false" stored="true" required="false"/>
 <field name="phoneNumber" type="string" indexed="false" stored="true" required="false"/>
 <field name="emailAddress" type="string" indexed="false" stored="true" required="false"/>
 <field name="_version_" type="tver" indexed="true" stored="true" />  
 <dynamicField name="ignored_*" type="ignored" multiValued="true"/>
 <dynamicField name="*" type="ignored" multiValued="true"/>
  <fieldType name="string" class="solr.StrField" sortMissingLast="true" docValues="true" />
  <fieldType name="booleans" class="solr.BoolField" sortMissingLast="true" multiValued="true"/>
  <fieldType name="int" class="solr.IntPointField" docValues="true"/>
  <fieldType name="text" class="solr.TextField" positionIncrementGap="100" multiValued="true"/> 
  <fieldType name="double" class="solr.TrieDoubleField" docValues="true" precisionStep="0" positionIncrementGap="0"/>
  <fieldType name="tdates" class="solr.TrieDateField" docValues="true" precisionStep="6" positionIncrementGap="0" multiValued="true"/>
  <fieldType name="tlongs" class="solr.TrieLongField" docValues="true" precisionStep="8" positionIncrementGap="0" multiValued="true"/>
  <fieldType name="tver" class="solr.TrieLongField" precisionStep="0" positionIncrementGap="0" />
  <fieldType name="tdoubles" class="solr.TrieDoubleField" docValues="true" precisionStep="8" positionIncrementGap="0" multiValued="true"/>
  <fieldType name="ignored" stored="false" indexed="false" docValues="false" multiValued="true" class="solr.StrField" />

solrconfig.xml(拼写检查)

  <searchComponent name="spellcheck" class="solr.SpellCheckComponent">
    <str name="queryAnalyzerFieldType">text_general</str>
    <lst name="spellchecker">
      <str name="name">default</str>
      <str name="field">jobTitleName</str>
      <str name="classname">solr.DirectSolrSpellChecker</str>
      <str name="distanceMeasure">internal</str>
      <float name="accuracy">0.5</float>
      <int name="maxEdits">2</int>
      <int name="minPrefix">1</int>
      <int name="maxInspections">5</int>
      <int name="minQueryLength">4</int>
      <float name="maxQueryFrequency">0.01</float>
      <float name="thresholdTokenFrequency">.01</float>
    </lst>
    <lst name="spellchecker">
      <str name="name">wordbreak</str>
      <str name="classname">solr.WordBreakSolrSpellChecker</str>
      <str name="field">lowerfilt</str>
      <str name="combineWords">true</str>
      <str name="breakWords">true</str>
      <int name="maxChanges">10</int>
    </lst>
  </searchComponent>
  <requestHandler name="/spell" class="solr.SearchHandler" startup="lazy">
    <lst name="defaults">
      <str name="spellcheck.dictionary">default</str>
      <str name="spellcheck">on</str>
      <str name="spellcheck.extendedResults">true</str>
      <str name="spellcheck.count">10</str>
      <str name="spellcheck.alternativeTermCount">5</str>
      <str name="spellcheck.maxResultsForSuggest">5</str>
      <str name="spellcheck.collate">true</str>
      <str name="spellcheck.collateExtendedResults">true</str>
      <str name="spellcheck.maxCollationTries">10</str>
      <str name="spellcheck.maxCollations">5</str>
    </lst>
    <arr name="last-components">
      <str>spellcheck</str>
    </arr>
  </requestHandler>

solrconfig.xml(更新)

  <initParams path="/update/**,/query,/select,/tvrh,/elevate,/spell,/browse">
    <lst name="defaults">
      <str name="df">firstName</str>
    </lst>
  </initParams>

  <initParams path="/update/**">
    <lst name="defaults">
      <str name="update.chain">add-unknown-fields-to-the-schema</str>
    </lst>
  </initParams>    
  <searchComponent name="spellcheck" class="solr.SpellCheckComponent">   
    <str name="queryAnalyzerFieldType">text_general</str>   
    <lst name="spellchecker">
        <str name="name">default</str>
        <str name="field">jobTitleName</str>
      <str name="classname">solr.DirectSolrSpellChecker</str>
      <str name="distanceMeasure">internal</str>
      <float name="accuracy">0.5</float>
      <int name="maxEdits">2</int>
      <int name="minPrefix">1</int>
      <int name="maxInspections">5</int>
      <int name="minQueryLength">4</int>
      <float name="maxQueryFrequency">0.01</float>
      <float name="thresholdTokenFrequency">.01</float>
    </lst>    
    <lst name="spellchecker">
      <str name="name">wordbreak</str>
      <str name="classname">solr.WordBreakSolrSpellChecker</str>
      <str name="field">lowerfilt</str>
      <str name="combineWords">true</str>
      <str name="breakWords">true</str>
      <int name="maxChanges">10</int>
       </lst>
  </searchComponent>

  <requestHandler name="/spell" class="solr.SearchHandler" startup="lazy">
    <lst name="defaults">
      <str name="spellcheck.dictionary">default</str>
      <str name="spellcheck">on</str>
      <str name="spellcheck.extendedResults">true</str>
      <str name="spellcheck.count">10</str>
      <str name="spellcheck.alternativeTermCount">5</str>
      <str name="spellcheck.maxResultsForSuggest">5</str>
      <str name="spellcheck.collate">true</str>
      <str name="spellcheck.collateExtendedResults">true</str>
      <str name="spellcheck.maxCollationTries">10</str>
      <str name="spellcheck.maxCollations">5</str>
    </lst>
    <arr name="last-components">
      <str>spellcheck</str>
    </arr>
  </requestHandler>

要求 我希望当用户输入错误的jobTitleName时,Solr应该使用拼写检查产生正确的建议。

例如如果用户以jobTitleName身份输入Developer,则Solr应该使用拼写检查向用户提供推荐作为Developer。

0 个答案:

没有答案