Bugfix for empty words

author Paul POULAIN <paul@koha-fr.org>

Fri, 12 Oct 2007 22:35:23 +0000 (17:35 -0500)

committer Joshua Ferraro <jmf@liblime.com>

Sat, 13 Oct 2007 03:21:07 +0000 (22:21 -0500)
author Paul POULAIN <paul@koha-fr.org>
Fri, 12 Oct 2007 22:35:23 +0000 (17:35 -0500)
committer Joshua Ferraro <jmf@liblime.com>
Sat, 13 Oct 2007 03:21:07 +0000 (22:21 -0500)
diff --git a/C4/Search.pm b/C4/Search.pm

index 02a4438..391f6f3 100644 (file)
--- a/C4/Search.pm
+++ b/C4/Search.pm
@@ -564,8 +564,13 @@ sub buildQuery {
          for ( my $i = 0 ; $i <= @operands ; $i++ ) {
              my $operand = $operands[$i];
              # remove stopwords from operand : parse all stopwords & remove them (case insensitive)
+            # Use the Unicode IsAlpha property instead of \b so that letters with diacritics count as letters.
+            # Otherwise a French word like "leçon" is split into "le" + "çon"; "le" is a stopword and is removed,
+            # leaving "çon", and the search finds nothing.
              foreach (keys %{C4::Context->stopwords}) {
-                $operand=~ s/\b$_\b//i;
+                $operand=~ s/\P{IsAlpha}$_\P{IsAlpha}/ /i;
+                $operand=~ s/^$_\P{IsAlpha}/ /i;
+                $operand=~ s/\P{IsAlpha}$_$/ /i;
              }
              my $index   = $indexes[$i];
              my $stemmed_operand;
author	Paul POULAIN <paul@koha-fr.org>
	Fri, 12 Oct 2007 22:35:23 +0000 (17:35 -0500)
committer	Joshua Ferraro <jmf@liblime.com>
	Sat, 13 Oct 2007 03:21:07 +0000 (22:21 -0500)