diff options
-rw-r--r-- | inc/indexer.php | 2 | ||||
-rw-r--r-- | inc/lang/de/stopwords.txt | 3 | ||||
-rw-r--r-- | inc/lang/en/stopwords.txt | 10 |
3 files changed, 14 insertions, 1 deletion
diff --git a/inc/indexer.php b/inc/indexer.php
index 08ad03965..4b59684cd 100644
--- a/inc/indexer.php
+++ b/inc/indexer.php
@@ -12,7 +12,7 @@ require_once(DOKU_INC.'inc/utf8.php');
 require_once(DOKU_INC.'inc/parserutils.php');
 
 // set the minimum token length to use in the index (note, this doesn't apply to numeric tokens)
-if (!defined('IDX_MINWORDLENGTH')) define('IDX_MINWORDLENGTH',3);
+if (!defined('IDX_MINWORDLENGTH')) define('IDX_MINWORDLENGTH',2);
 
 // Asian characters are handled as words. The following regexp defines the
 // Unicode-Ranges for Asian characters
diff --git a/inc/lang/de/stopwords.txt b/inc/lang/de/stopwords.txt
index 78261b7c9..443b17723 100644
--- a/inc/lang/de/stopwords.txt
+++ b/inc/lang/de/stopwords.txt
@@ -50,6 +50,8 @@ hinter
 ich
 ihr
 ihre
+in
+im
 ist
 jede
 jedem
@@ -98,6 +100,7 @@ unter
 vom
 von
 vor
+um
 wann
 warum
 was
diff --git a/inc/lang/en/stopwords.txt b/inc/lang/en/stopwords.txt
index bc6eb48ae..afc301659 100644
--- a/inc/lang/en/stopwords.txt
+++ b/inc/lang/en/stopwords.txt
@@ -4,6 +4,8 @@
 # This list is based upon the ones found at http://www.ranks.nl/stopwords/
 about
 are
+as
+an
 and
 you
 your
@@ -13,10 +15,18 @@ com
 for
 from
 into
+if
+in
+is
+it
 how
+of
+on
+or
 that
 the
 this
+to
 was
 what
 when