У меня есть сценарий для моего проекта.
я использую вместе FuzzyLookupFactory (с несколькими Suggester) и AnalyzingInfixLookupFactory. Я использую solrj (java api) для запроса запроса.
Сначала я ищу слово с помощью анализаinginfixlookupfactory, это может найти слово в любом месте поля, но вы должны правильно ввести его. например, название продукта «Тошиба», если вы будете искать «Тош» он мог найти « TOSHIBA» правильно, но если вы ищете «toshba» это будет не найти какой-либо продукт.
на этот раз я использую fuzzylookupfactory advester i разделить все слова (например, у вас есть «toshiba laptop» word1 = toshiba word2 = ноутбук и т. Д.) И искать один к одному, а нечеткий найдет toshba -> toshiba и после find toshiba снова используйте analycinginfixlookupfactory для поиска полного поля продукта.
, например, вы хотите, чтобы найти "ноутбуков Toshiba", и вы искали "toshba laptp". сначала попробуйте «analysisinginfixlookupfactory», и ответ будет равен нулю. После ответа на нулевой поиск нечеткой для каждого слова и добавьте то, что вы найдете как toshba -> toshiba + laptp-> laptop, это будет toshiba laptop, и теперь вы можете снова искать анализ infixlookupfactory для полного поля.
мой анализ Suggester в (solrconfig.xml)
<searchComponent name="suggestAnalyzing" class="solr.SuggestComponent">
<lst name="suggester">
<str name="name">suggestAnalyzing</str>
<str name="lookupImpl">AnalyzingInfixLookupFactory</str>
<str name="classname">org.apache.solr.spelling.suggest.Suggester</str>
<str name="storeDir">suggester_fuzzy_dir</str>
<str name="indexPath">suggester_infix_dir</str>
<str name="dictionaryImpl">DocumentDictionaryFactory</str>
<str name="field">COMPLETE_FIELD</str>
<str name="suggestAnalyzerFieldType">textgen</str>
<float name="threshold">0.005</float>
<str name="buildOnStartup">false</str>
<str name="buildOnCommit">false</str>
</lst>
</searchComponent>
<requestHandler name="/suggestAnalyzing" class="solr.SearchHandler">
<lst name="defaults">
<str name="suggest.dictionary">suggestAnalyzing</str>
<str name="suggest">true</str>
<str name="suggest.count">10</str>
</lst>
<arr name="components">
<str>suggestAnalyzing</str>
</arr>
</requestHandler>
мой нечеткий Suggester в (solrconfig.xml)
<searchComponent class="solr.SuggestComponent" name="suggest">
<lst name="suggester">
<str name="name">word1suggester</str>
<str name="lookupImpl">FuzzyLookupFactory</str>
<str name="dictionaryImpl">DocumentDictionaryFactory</str>
<str name="field">word1</str> <!-- the indexed field to derive suggestions from -->
<str name="suggestAnalyzerFieldType">textgen</str>
<str name="storeDir">suggest_fuzzy_doc_expr_dict</str>
<str name="buildOnStartup">false</str>
<str name="buildOnCommit">false</str>
</lst>
<lst name="suggester">
<str name="name">word2suggester</str>
<str name="lookupImpl">FuzzyLookupFactory</str>
<str name="dictionaryImpl">DocumentDictionaryFactory</str>
<str name="field">word2</str> <!-- the indexed field to derive suggestions from -->
<str name="suggestAnalyzerFieldType">textgen</str>
<str name="indexPath">suggestions/word2suggester</str>
<str name="storeDir">suggest_fuzzy_doc_expr_dict</str>
<str name="buildOnStartup">false</str>
<str name="buildOnCommit">false</str>
</lst>
<lst name="suggester">
<str name="name">word3suggester</str>
<str name="lookupImpl">FuzzyLookupFactory</str>
<str name="dictionaryImpl">DocumentDictionaryFactory</str>
<str name="field">word3</str> <!-- the indexed field to derive suggestions from -->
<str name="suggestAnalyzerFieldType">textgen</str>
<str name="indexPath">suggestions/word3suggester</str>
<str name="storeDir">suggest_fuzzy_doc_expr_dict</str>
<str name="preserveSep">true</str>
<str name="preservePositionIncrements">true</str>
<str name="exactMatchFirst">true</str>
<float name="threshold">0.005</float>
<str name="buildOnStartup">false</str>
<str name="buildOnCommit">false</str>
</lst>
<lst name="suggester">
<str name="name">word4suggester</str>
<str name="lookupImpl">FuzzyLookupFactory</str>
<str name="dictionaryImpl">DocumentDictionaryFactory</str>
<str name="field">word4</str> <!-- the indexed field to derive suggestions from -->
<str name="suggestAnalyzerFieldType">textgen</str>
<str name="indexPath">suggestions/word4suggester</str>
<str name="storeDir">suggest_fuzzy_doc_expr_dict</str>
<str name="preserveSep">true</str>
<str name="preservePositionIncrements">true</str>
<str name="buildOnStartup">false</str>
<str name="buildOnCommit">false</str>
</lst>
<lst name="suggester">
<str name="name">word5suggester</str>
<str name="lookupImpl">FuzzyLookupFactory</str>
<str name="dictionaryImpl">DocumentDictionaryFactory</str>
<str name="field">word5</str> <!-- the indexed field to derive suggestions from -->
<str name="suggestAnalyzerFieldType">textgen</str>
<str name="indexPath">suggestions/word5suggester</str>
<str name="storeDir">suggest_fuzzy_doc_expr_dict</str>
<str name="preserveSep">true</str>
<str name="preservePositionIncrements">true</str>
<str name="buildOnStartup">false</str>
<str name="buildOnCommit">false</str>
</lst>
<lst name="suggester">
<str name="name">word6suggester</str>
<str name="lookupImpl">FuzzyLookupFactory</str>
<str name="dictionaryImpl">DocumentDictionaryFactory</str>
<str name="field">word6</str> <!-- the indexed field to derive suggestions from -->
<str name="suggestAnalyzerFieldType">textgen</str>
<str name="indexPath">suggestions/word6suggester</str>
<str name="storeDir">suggest_fuzzy_doc_expr_dict</str>
<str name="preserveSep">true</str>
<str name="preservePositionIncrements">true</str>
<str name="exactMatchFirst">true</str>
<float name="threshold">0.005</float>
<str name="buildOnStartup">false</str>
<str name="buildOnCommit">false</str>
</lst>
<lst name="suggester">
<str name="name">word7suggester</str>
<str name="lookupImpl">FuzzyLookupFactory</str>
<str name="dictionaryImpl">DocumentDictionaryFactory</str>
<str name="field">word7</str> <!-- the indexed field to derive suggestions from -->
<str name="suggestAnalyzerFieldType">textgen</str>
<str name="indexPath">suggestions/word7suggester</str>
<str name="storeDir">suggest_fuzzy_doc_expr_dict</str>
<str name="preserveSep">true</str>
<str name="preservePositionIncrements">true</str>
<str name="exactMatchFirst">true</str>
<float name="threshold">0.005</float>
<str name="buildOnStartup">false</str>
<str name="buildOnCommit">false</str>
</lst>
<lst name="suggester">
<str name="name">word8suggester</str>
<str name="lookupImpl">FuzzyLookupFactory</str>
<str name="dictionaryImpl">DocumentDictionaryFactory</str>
<str name="field">word8</str> <!-- the indexed field to derive suggestions from -->
<str name="suggestAnalyzerFieldType">textgen</str>
<str name="indexPath">suggestions/word8suggester</str>
<str name="storeDir">suggest_fuzzy_doc_expr_dict</str>
<str name="preserveSep">true</str>
<str name="preservePositionIncrements">true</str>
<str name="exactMatchFirst">true</str>
<float name="threshold">0.005</float>
<str name="buildOnStartup">false</str>
<str name="buildOnCommit">false</str>
</lst>
</searchComponent>
<requestHandler class="solr.SearchHandler" name="/suggest">
<lst name="defaults">
<str name="spellcheck">true</str>
<str name="suggest">true</str>
<str name="suggest.dictionary">word1suggester</str>
<str name="suggest.dictionary">word2suggester</str>
<str name="suggest.dictionary">word3suggester</str>
<str name="suggest.dictionary">word4suggester</str>
<str name="suggest.dictionary">word5suggester</str>
<str name="suggest.dictionary">word6suggester</str>
<str name="suggest.dictionary">word7suggester</str>
<str name="suggest.dictionary">word8suggester</str>
<str name="spellcheck.count">10</str>
</lst>
<arr name="components">
<str>suggest</str>
</arr>
</requestHandler>
мои поля управляемых схемы
<fieldType name="textgen" class="solr.TextField" positionIncrementGap="100">
<analyzer type="index">
<tokenizer class="solr.WhitespaceTokenizerFactory"/>
<filter class="solr.WordDelimiterFilterFactory" generateWordParts="1" generateNumberParts="1" catenateWords="1" catenateNumbers="1" catenateAll="0" splitOnCaseChange="0"/>
<filter class="solr.LowerCaseFilterFactory"/>
</analyzer>
<analyzer type="query">
<tokenizer class="solr.WhitespaceTokenizerFactory"/>
<filter class="solr.SynonymFilterFactory" synonyms="synonyms.txt" ignoreCase="true" expand="true"/>
<filter class="solr.StopFilterFactory"
ignoreCase="true"
words="stopwords.txt"
/>
<filter class="solr.WordDelimiterFilterFactory" generateWordParts="1" generateNumberParts="1" catenateWords="0" catenateNumbers="0" catenateAll="0" splitOnCaseChange="0"/>
<filter class="solr.LowerCaseFilterFactory"/>
</analyzer>
</fieldType>
<field name="word1" type="textgen" omitNorms="true" omitTermFreqAndPositions="true" multiValued="true" indexed="true" stored="true"/>
<field name="COMPLETE_FIELD" type="textgen" multiValued="true" indexed="true" stored="true"/>
<field name="word2" type="text_general" omitNorms="true" omitTermFreqAndPositions="true" multiValued="true" indexed="true" stored="true"/>
<field name="word3" type="text_general" omitNorms="true" omitTermFreqAndPositions="true" multiValued="true" indexed="true" stored="true"/>
<field name="word4" type="textgen" omitNorms="true" omitTermFreqAndPositions="true" multiValued="true" indexed="true" stored="true"/>
<field name="word5" type="textgen" omitNorms="true" omitTermFreqAndPositions="true" multiValued="true" indexed="true" stored="true"/>
<field name="word6" type="textgen" omitNorms="true" omitTermFreqAndPositions="true" multiValued="true" indexed="true" stored="true"/>
<field name="word7" type="textgen" omitNorms="true" omitTermFreqAndPositions="true" multiValued="true" indexed="true" stored="true"/>
<field name="word8" type="textgen" omitNorms="true" omitTermFreqAndPositions="true" multiValued="true" indexed="true" stored="true"/>