Manybubbles has uploaded a new change for review.
https://gerrit.wikimedia.org/r/76832
Change subject: Stop producing nonsense words in suggestions.
......................................................................
Stop producing nonsense words in suggestions.
Did this by using an analysis chain closer to the default for
suggestions so we wouldn't suggest stemmed words. This should work fine
for space-delimited languages but will need some love when we turn to
non-space-delimited languages.
Change-Id: I59252615964def7e3330a4b95bcd3189f53497ea
---
M updateSearchConfig.php
1 file changed, 26 insertions(+), 6 deletions(-)
git pull ssh://gerrit.wikimedia.org:29418/mediawiki/extensions/CirrusSearch
refs/changes/32/76832/1
diff --git a/updateSearchConfig.php b/updateSearchConfig.php
index 553f966..808d5f0 100644
--- a/updateSearchConfig.php
+++ b/updateSearchConfig.php
@@ -312,9 +312,7 @@
'analysis' => array(
'analyzer' => array(
'text' => $this->buildTextAnalyzer(),
- 'suggest' => array_merge(
$this->buildTextAnalyzer(), array(
- 'filter' => array(
'suggest_shingle' )
- ) ),
+ 'suggest' =>
$this->buildSuggestAnalyzer(),
'prefix' => array(
'type' => 'custom',
'tokenizer' => 'prefix',
@@ -347,13 +345,35 @@
);
}
+ /**
+ * Build a text analyzer customized for this language code.
+ */
private function buildTextAnalyzer() {
+ $langs = Language::getTranslatedLanguageNames( 'en' );
+ $analyzer = array(
+ 'type' => strtolower( $langs["en"] ),
+ );
+
global $wgLanguageCode;
switch ($wgLanguageCode) {
- case 'en': return array(
- 'type' => 'english'
- );
+ // Customization goes here.
}
+
+ return $analyzer;
+ }
+
+ private function buildSuggestAnalyzer() {
+ $analyzer = array(
+ 'type' => 'default',
+ 'filter' => array( 'suggest_shingle' ),
+ );
+
+ global $wgLanguageCode;
+ switch ($wgLanguageCode) {
+ // Customization goes here.
+ }
+
+ return $analyzer;
}
/**
--
To view, visit https://gerrit.wikimedia.org/r/76832
To unsubscribe, visit https://gerrit.wikimedia.org/r/settings
Gerrit-MessageType: newchange
Gerrit-Change-Id: I59252615964def7e3330a4b95bcd3189f53497ea
Gerrit-PatchSet: 1
Gerrit-Project: mediawiki/extensions/CirrusSearch
Gerrit-Branch: master
Gerrit-Owner: Manybubbles <[email protected]>
_______________________________________________
MediaWiki-commits mailing list
[email protected]
https://lists.wikimedia.org/mailman/listinfo/mediawiki-commits