summary | refs | log | tree | commit | diff
diff options
context:
space:
mode:
-rw-r--r--  inc/indexer.php  2
-rw-r--r--  inc/lang/de/stopwords.txt  3
-rw-r--r--  inc/lang/en/stopwords.txt  10
3 files changed, 14 insertions, 1 deletion
diff --git a/inc/indexer.php b/inc/indexer.php
index 08ad03965..4b59684cd 100644
--- a/inc/indexer.php
+++ b/inc/indexer.php
@@ -12,7 +12,7 @@ require_once(DOKU_INC.'inc/utf8.php');
require_once(DOKU_INC.'inc/parserutils.php');
// set the minimum token length to use in the index (note, this doesn't apply to numeric tokens)
-if (!defined('IDX_MINWORDLENGTH')) define('IDX_MINWORDLENGTH',3);
+if (!defined('IDX_MINWORDLENGTH')) define('IDX_MINWORDLENGTH',2);
// Asian characters are handled as words. The following regexp defines the
// Unicode-Ranges for Asian characters
diff --git a/inc/lang/de/stopwords.txt b/inc/lang/de/stopwords.txt
index 78261b7c9..443b17723 100644
--- a/inc/lang/de/stopwords.txt
+++ b/inc/lang/de/stopwords.txt
@@ -50,6 +50,8 @@ hinter
ich
ihr
ihre
+in
+im
ist
jede
jedem
@@ -98,6 +100,7 @@ unter
vom
von
vor
+um
wann
warum
was
diff --git a/inc/lang/en/stopwords.txt b/inc/lang/en/stopwords.txt
index bc6eb48ae..afc301659 100644
--- a/inc/lang/en/stopwords.txt
+++ b/inc/lang/en/stopwords.txt
@@ -4,6 +4,8 @@
# This list is based upon the ones found at http://www.ranks.nl/stopwords/
about
are
+as
+an
and
you
your
@@ -13,10 +15,18 @@ com
for
from
into
+if
+in
+is
+it
how
+of
+on
+or
that
the
this
+to
was
what
when