Skip to content

Commit

Permalink
Merge pull request #3156 from Smile-SA/fix-elision
Browse files Browse the repository at this point in the history
Fix French stemmer on "clef/clefs" and improve elision management
  • Loading branch information
rbayet authored Jan 31, 2024
2 parents 31a5f76 + 1b296c4 commit 15a24cd
Showing 1 changed file with 9 additions and 9 deletions.
18 changes: 9 additions & 9 deletions src/module-elasticsuite-core/etc/elasticsuite_analysis.xml
Original file line number Diff line number Diff line change
Expand Up @@ -150,7 +150,7 @@
<!--
Known issues with the "french" stemmer.
-->
<rules>["clous => clou", "verrous => verrou", "ecrous => ecrou", "jeux => jeu", "photos => photo"]</rules>
<rules>["clous => clou", "verrous => verrou", "ecrous => ecrou", "jeux => jeu", "photos => photo", "clef => cle", "clefs => cle"]</rules>
</filter>
<filter name="stemmer_override" type="stemmer_override" language="it">
<!--
Expand All @@ -163,10 +163,10 @@
<articles>["d", "l", "m", "n", "s", "t"]</articles>
</filter>
<filter name="elision" type="elision" language="fr">
<articles>["l", "m", "t", "qu", "n", "s","j", "d", "c"]</articles>
<articles>["l", "m", "t", "qu", "n", "s", "j", "d", "c"]</articles>
</filter>
<filter name="elision" type="elision" language="it">
<articles>["c", "l", "all", "dall", "dell","nell", "sull", "coll", "pell","gl", "agl", "dagl", "degl", "negl","sugl", "un", "m", "t", "s", "v", "d"]</articles>
<articles>["c", "l", "all", "dall", "dell", "nell", "sull", "coll", "pell", "gl", "agl", "dagl", "degl", "negl", "sugl", "un", "m", "t", "s", "v", "d"]</articles>
</filter>
<filter name="phonetic" type="phonetic" language="default">
<encoder>metaphone</encoder>
Expand Down Expand Up @@ -194,9 +194,9 @@
<filters>
<filter ref="ascii_folding" />
<filter ref="trim" />
<filter ref="elision" />
<filter ref="word_delimiter" />
<filter ref="lowercase" />
<filter ref="elision" />
<filter ref="stemmer_override" />
<filter ref="stemmer" />
</filters>
Expand All @@ -208,9 +208,9 @@
<filters>
<filter ref="ascii_folding" />
<filter ref="trim" />
<filter ref="elision" />
<filter ref="word_delimiter" />
<filter ref="lowercase" />
<filter ref="elision" />
</filters>
<char_filters>
<char_filter ref="html_strip" />
Expand All @@ -220,9 +220,9 @@
<filters>
<filter ref="ascii_folding" />
<filter ref="trim" />
<filter ref="elision" />
<filter ref="reference_word_delimiter" />
<filter ref="lowercase" />
<filter ref="elision" />
<filter ref="reference_shingle" />
</filters>
<char_filters>
Expand All @@ -233,9 +233,9 @@
<filters>
<filter ref="ascii_folding" />
<filter ref="trim" />
<filter ref="elision" />
<filter ref="word_delimiter" />
<filter ref="lowercase" />
<filter ref="elision" />
<filter ref="stemmer_override" />
<filter ref="stemmer" />
<filter ref="shingle" />
Expand All @@ -258,9 +258,9 @@
<filters>
<filter ref="ascii_folding" />
<filter ref="trim" />
<filter ref="elision" />
<filter ref="word_delimiter" />
<filter ref="lowercase" />
<filter ref="elision" />
<filter ref="phonetic" />
</filters>
<char_filters>
Expand All @@ -271,9 +271,9 @@
<filters>
<filter ref="ascii_folding" />
<filter ref="trim" />
<filter ref="elision" />
<filter ref="word_delimiter" />
<filter ref="lowercase" />
<filter ref="elision" />
<filter ref="stemmer_override" />
<filter ref="stemmer" />
<filter ref="edge_ngram_filter"/>
Expand Down

0 comments on commit 15a24cd

Please sign in to comment.