matching enhancements -- allow matching rule to be changed on the fly

[koha_gimpoz] / C4 / Search.pm
diff --git a/C4/Search.pm b/C4/Search.pm

old mode 100755 (executable)

new mode 100644 (file)

index ca6d5a4..9d345d4
--- a/C4/Search.pm
+++ b/C4/Search.pm
@@ -1,7 +1,5 @@
  package C4::Search;
  
-# Copyright 2000-2006 Katipo Communications
-#
  # This file is part of Koha.
  #
  # Koha is free software; you can redistribute it and/or modify it under the
@@ -18,139 +16,1662 @@ package C4::Search;
  # Suite 330, Boston, MA  02111-1307 USA
  
  use strict;
-use ZOOM;
-use Smart::Comments;
-use C4::Context;
-use MARC::Record;
-use MARC::File::XML;
-use C4::Biblio;
-
  require Exporter;
+use C4::Context;
+use C4::Biblio;    # GetMarcFromKohaField
+use C4::Koha;      # getFacets
+use Lingua::Stem;
+use C4::Date;
  
  use vars qw($VERSION @ISA @EXPORT @EXPORT_OK %EXPORT_TAGS);
  
  # set the version for version checking
-$VERSION = do { my @v = '$Revision$' =~ /\d+/g;
-    shift(@v) . "." . join( "_", map { sprintf "%03d", $_ } @v );
-};
+$VERSION = 3.00;
  
  =head1 NAME
  
-C4::Search - Functions for searching the Koha catalog and other databases
+C4::Search - Functions for searching the Koha catalog.
  
  =head1 SYNOPSIS
  
-  use C4::Search;
+See opac/opac-search.pl or catalogue/search.pl for examples of usage.
  
  =head1 DESCRIPTION
  
-This module provides the searching facilities for the Koha catalog and
-other databases.
+This module provides the search facilities for the Koha catalog, using a Zebra index.
  
  =head1 FUNCTIONS
  
-=over 2
-
  =cut
  
  @ISA    = qw(Exporter);
-@EXPORT = qw(search get_record);
+@EXPORT = qw(
+  &SimpleSearch
+  &findseealso
+  &FindDuplicate
+  &searchResults
+  &getRecords
+  &buildQuery
+  &NZgetRecords
+  &ModBiblios
+);
  
  # make all your functions, whether exported or not;
  
-sub search {
-    my ( $search, $type, $number ) = @_;
-    my $dbh = C4::Context->dbh();
-    my $q;
-    my $Zconn;
-    my $raw;
-    eval { $Zconn = new ZOOM::Connection( C4::Context->config("zebradb") ); };
-    if ($@) {
-        warn "Error ", $@->code(), ": ", $@->message(), "\n";
+=head2 findseealso($dbh,$fields);
+
+C<$dbh> is a link to the DB handler.
+
+use C4::Context;
+my $dbh =C4::Context->dbh;
+
+C<$fields> is a reference to the fields array
+
+This function modifies the @$fields array in place, appending the related ("see also") fields to search on.
+
+=cut
+
+sub findseealso {
+    my ( $dbh, $fields ) = @_;
+    my $tagslib = GetMarcStructure( 1 );
+    for ( my $i = 0 ; $i <= $#{$fields} ; $i++ ) {
+        my ($tag)      = substr( @$fields[$i], 1, 3 );
+        my ($subfield) = substr( @$fields[$i], 4, 1 );
+        @$fields[$i] .= ',' . $tagslib->{$tag}->{$subfield}->{seealso}
+          if ( $tagslib->{$tag}->{$subfield}->{seealso} );
+    }
+}
+
+=head2 FindDuplicate
+
+($biblionumber1,$title1,$biblionumber2,$title2,...) = FindDuplicate($record);
+
+=cut
+
+sub FindDuplicate {
+    my ($record) = @_;
+    my $dbh = C4::Context->dbh;
+    my $result = TransformMarcToKoha( $dbh, $record, '' );
+    my $sth;
+    my $query;
+    my $search;
+    my $type;
+    my ( $biblionumber, $title );
+
+    # search duplicate on ISBN, easy and fast..
+    # ... normalize first
+    if ( $result->{isbn} ) {
+        $result->{isbn} =~ s/\(.*$//;
+        $result->{isbn} =~ s/\s+$//; 
+    }
+    #$search->{'avoidquerylog'}=1;
+    if ( $result->{isbn} ) {
+        $query = "isbn=$result->{isbn}";
+    }
+    else {
+        $result->{title} =~ s /\\//g;
+        $result->{title} =~ s /\"//g;
+        $result->{title} =~ s /\(//g;
+        $result->{title} =~ s /\)//g;
+               # remove valid operators
+               $result->{title} =~ s/(and|or|not)//g;
+        $query = "ti,ext=$result->{title}";
+        $query .= " and mt=$result->{itemtype}" if ($result->{itemtype});    
+        if ($result->{author}){
+          $result->{author} =~ s /\\//g;
+          $result->{author} =~ s /\"//g;
+          $result->{author} =~ s /\(//g;
+          $result->{author} =~ s /\)//g;
+                 # remove valid operators
+                 $result->{author} =~ s/(and|or|not)//g;
+          $query .= " and au,ext=$result->{author}";
+        }     
+    }
+    my ($error,$searchresults) =
+      SimpleSearch($query); # FIXME :: hardcoded !
+    my @results;
+    foreach my $possible_duplicate_record (@$searchresults) {
+        my $marcrecord =
+          MARC::Record->new_from_usmarc($possible_duplicate_record);
+        my $result = TransformMarcToKoha( $dbh, $marcrecord, '' );
+        
+        # FIXME :: why 2 $biblionumber ?
+        if ($result){
+          push @results, $result->{'biblionumber'};
+          push @results, $result->{'title'};
+        }
+    }
+    return @results;  
+}
+
+=head2 SimpleSearch
+
+($error,$results) = SimpleSearch($query,@servers);
+
+This function performs a simple search on the catalog using ZOOM.
+
+=over 2
+
+=item C<input arg:>
+
+    * $query can be a simple keyword or a complete CCL query, which depends on your ccl file.
+    * @servers is optional; when omitted, the "biblioserver" entry is used.
+
+=item C<Output arg:>
+    * $error is a string containing the error description if there is one; otherwise it is undef.
+    * $results is a reference to an array of MARC records.
+
+=item C<usage in the script:>
+
+=back
+
+my ($error, $marcresults) = SimpleSearch($query);
+
+if (defined $error) {
+    $template->param(query_error => $error);
+    warn "error: ".$error;
+    output_html_with_http_headers $input, $cookie, $template->output;
+    exit;
+}
+
+my $hits = scalar @$marcresults;
+my @results;
+
+for(my $i=0;$i<$hits;$i++) {
+    my %resultsloop;
+    my $marcrecord = MARC::File::USMARC::decode($marcresults->[$i]);
+    my $biblio = TransformMarcToKoha(C4::Context->dbh,$marcrecord,'');
+
+    #build the hash for the template.
+    $resultsloop{highlight}       = ($i % 2)?(1):(0);
+    $resultsloop{title}           = $biblio->{'title'};
+    $resultsloop{subtitle}        = $biblio->{'subtitle'};
+    $resultsloop{biblionumber}    = $biblio->{'biblionumber'};
+    $resultsloop{author}          = $biblio->{'author'};
+    $resultsloop{publishercode}   = $biblio->{'publishercode'};
+    $resultsloop{publicationyear} = $biblio->{'publicationyear'};
+
+    push @results, \%resultsloop;
+}
+$template->param(result=>\@results);
+
+=cut
+
+sub SimpleSearch {
+    my $query   = shift;
+    if (C4::Context->preference('NoZebra')) {
+        my $result = NZorder(NZanalyse($query))->{'biblioserver'}->{'RECORDS'};
+        return (undef,$result);
+    } else {
+        my @servers = @_;
+        my @results;
+        my @tmpresults;
+        my @zconns;
+        return ( "No query entered", undef ) unless $query;
+    
+        #@servers = (C4::Context->config("biblioserver")) unless @servers;
+        @servers =
+        ("biblioserver") unless @servers
+        ;    # FIXME hardcoded value. See catalog/search.pl & opac-search.pl too.
+    
+        # Connect & Search
+        for ( my $i = 0 ; $i < @servers ; $i++ ) {
+            $zconns[$i] = C4::Context->Zconn( $servers[$i], 1 );
+            $tmpresults[$i] =
+            $zconns[$i]
+            ->search( new ZOOM::Query::CCL2RPN( $query, $zconns[$i] ) );
+    
+            # getting error message if one occurred.
+            my $error =
+                $zconns[$i]->errmsg() . " ("
+            . $zconns[$i]->errcode() . ") "
+            . $zconns[$i]->addinfo() . " "
+            . $zconns[$i]->diagset();
+    
+            return ( $error, undef ) if $zconns[$i]->errcode();
+        }
+        my $hits;
+        my $ev;
+        while ( ( my $i = ZOOM::event( \@zconns ) ) != 0 ) {
+            $ev = $zconns[ $i - 1 ]->last_event();
+            if ( $ev == ZOOM::Event::ZEND ) {
+                $hits = $tmpresults[ $i - 1 ]->size();
+            }
+            if ( $hits > 0 ) {
+                for ( my $j = 0 ; $j < $hits ; $j++ ) {
+                    my $record = $tmpresults[ $i - 1 ]->record($j)->raw();
+                    push @results, $record;
+                }
+            }
+        }
+        return ( undef, \@results );
      }
+}
  
-    if ( $type eq 'CQL' ) {
-        my $string;
-        if ( $search->{'cql'} ) {
-            $string = $search->{'cql'};
+# performs the search
+sub getRecords {
+    my (
+        $koha_query,     $federated_query,  $sort_by_ref,
+        $servers_ref,    $results_per_page, $offset,
+        $expanded_facet, $branches,         $query_type,
+        $scan
+    ) = @_;
+#     warn "Query : $koha_query";
+    my @servers = @$servers_ref;
+    my @sort_by = @$sort_by_ref;
+
+    # create the zoom connection and query object
+    my $zconn;
+    my @zconns;
+    my @results;
+    my $results_hashref = ();
+
+    ### FACETED RESULTS
+    my $facets_counter = ();
+    my $facets_info    = ();
+    my $facets         = getFacets();
+
+    #### INITIALIZE SOME VARS USED CREATE THE FACETED RESULTS
+    my @facets_loop;    # stores the ref to array of hashes for template
+    for ( my $i = 0 ; $i < @servers ; $i++ ) {
+        $zconns[$i] = C4::Context->Zconn( $servers[$i], 1 );
+
+# perform the search, create the results objects
+# if this is a local search, use the $koha-query, if it's a federated one, use the federated-query
+        my $query_to_use;
+        if ( $servers[$i] =~ /biblioserver/ ) {
+            $query_to_use = $koha_query;
          }
          else {
-            foreach my $var ( keys %$search ) {
-                $string .= "$var=\"$search->{$var}\" ";
+            $query_to_use = $federated_query;
+        }
+
+        # check if we've got a query_type defined
+        eval {
+            if ($query_type)
+            {
+                if ( $query_type =~ /^ccl/ ) {
+                    $query_to_use =~
+                      s/\:/\=/g;    # change : to = last minute (FIXME)
+
+                    #                 warn "CCL : $query_to_use";
+                    $results[$i] =
+                      $zconns[$i]->search(
+                        new ZOOM::Query::CCL2RPN( $query_to_use, $zconns[$i] )
+                      );
+                }
+                elsif ( $query_type =~ /^cql/ ) {
+
+                    #                 warn "CQL : $query_to_use";
+                    $results[$i] =
+                      $zconns[$i]->search(
+                        new ZOOM::Query::CQL( $query_to_use, $zconns[$i] ) );
+                }
+                elsif ( $query_type =~ /^pqf/ ) {
+
+                    #                 warn "PQF : $query_to_use";
+                    $results[$i] =
+                      $zconns[$i]->search(
+                        new ZOOM::Query::PQF( $query_to_use, $zconns[$i] ) );
+                }
+            }
+            else {
+                if ($scan) {
+
+                    #                 warn "preparing to scan";
+                    $results[$i] =
+                      $zconns[$i]->scan(
+                        new ZOOM::Query::CCL2RPN( $query_to_use, $zconns[$i] )
+                      );
+                }
+                else {
+
+                    #             warn "LAST : $query_to_use";
+                    $results[$i] =
+                      $zconns[$i]->search(
+                        new ZOOM::Query::CCL2RPN( $query_to_use, $zconns[$i] )
+                      );
+                }
+            }
+        };
+        if ($@) {
+            warn "WARNING: query problem with $query_to_use " . $@;
+        }
+
+        # concatenate the sort_by limits and pass them to the results object
+        my $sort_by;
+        foreach my $sort (@sort_by) {
+            if ($sort eq "author_az") {
+                $sort_by.="1=1003 <i ";
+            }
+            elsif ($sort eq "author_za") {
+                $sort_by.="1=1003 >i ";
+            }
+                       elsif ($sort eq "popularity_asc") {
+                               $sort_by.="1=9003 <i ";
+                       }
+                       elsif ($sort eq "popularity_dsc") {
+                $sort_by.="1=9003 >i ";
+            }
+                       elsif ($sort eq "call_number_asc") {
+                $sort_by.="1=20  <i ";
+            }
+                       elsif ($sort eq "call_number_dsc") {
+                $sort_by.="1=20 >i ";
+            }
+                       elsif ($sort eq "pubdate_asc") {
+                $sort_by.="1=31 <i ";
+            }
+                       elsif ($sort eq "pubdate_dsc") {
+                $sort_by.="1=31 >i ";
+            }
+                       elsif ($sort eq "acqdate_asc") {
+                $sort_by.="1=32 <i ";
+            }
+                       elsif ($sort eq "acqdate_dsc") {
+                $sort_by.="1=32 >i ";
+            }
+                       elsif ($sort eq "title_az") {
+                $sort_by.="1=4 <i ";
+            }
+                       elsif ($sort eq "title_za") {
+                $sort_by.="1=4 >i ";
              }
          }
-        $Zconn->option( cqlfile => C4::Context->config("intranetdir")
-              . "/zebra/pqf.properties" );
-        $Zconn->option( preferredRecordSyntax => "xml" );
-        $q = new ZOOM::Query::CQL2RPN( $string, $Zconn );
+               if ($sort_by) {
+                       if ( $results[$i]->sort( "yaz", $sort_by ) < 0) {
+                       warn "WARNING sort $sort_by failed";
+                       }
+               }
      }
-    my $rs;
-    my $n;
-    eval {
-        $rs = $Zconn->search($q);
-        $n  = $rs->size();
-    };
-    if ($@) {
-        print "Error ", $@->code(), ": ", $@->message(), "\n";
+    while ( ( my $i = ZOOM::event( \@zconns ) ) != 0 ) {
+        my $ev = $zconns[ $i - 1 ]->last_event();
+        if ( $ev == ZOOM::Event::ZEND ) {
+            my $size = $results[ $i - 1 ]->size();
+            if ( $size > 0 ) {
+                my $results_hash;
+                #$results_hash->{'server'} = $servers[$i-1];
+                # loop through the results
+                $results_hash->{'hits'} = $size;
+                my $times;
+                if ( $offset + $results_per_page <= $size ) {
+                    $times = $offset + $results_per_page;
+                }
+                else {
+                    $times = $size;
+                }
+                for ( my $j = $offset ; $j < $times ; $j++ )
+                {   #(($offset+$count<=$size) ? ($offset+$count):$size) ; $j++){
+                    my $records_hash;
+                    my $record;
+                    my $facet_record;
+                    ## This is just an index scan
+                    if ($scan) {
+                        my ( $term, $occ ) = $results[ $i - 1 ]->term($j);
+
+                 # here we create a minimal MARC record and hand it off to the
+                 # template just like a normal result ... perhaps not ideal, but
+                 # it works for now
+                        my $tmprecord = MARC::Record->new();
+                        $tmprecord->encoding('UTF-8');
+                        my $tmptitle;
+
+          # store the minimal record in author/title (depending on MARC flavour)
+                        if ( C4::Context->preference("marcflavour") eq
+                            "UNIMARC" )
+                        {
+                            $tmptitle = MARC::Field->new(
+                                '200', ' ', ' ',
+                                a => $term,
+                                f => $occ
+                            );
+                        }
+                        else {
+                            $tmptitle = MARC::Field->new(
+                                '245', ' ', ' ',
+                                a => $term,
+                                b => $occ
+                            );
+                        }
+                        $tmprecord->append_fields($tmptitle);
+                        $results_hash->{'RECORDS'}[$j] =
+                          $tmprecord->as_usmarc();
+                    }
+                    else {
+                        $record = $results[ $i - 1 ]->record($j)->raw();
+
+                        #warn "RECORD $j:".$record;
+                        $results_hash->{'RECORDS'}[$j] =
+                          $record;    # making a reference to a hash
+                                      # Fill the facets while we're looping
+                        $facet_record = MARC::Record->new_from_usmarc($record);
+
+                        #warn $servers[$i-1].$facet_record->title();
+                        for ( my $k = 0 ; $k <= @$facets ; $k++ ) {
+                            if ( $facets->[$k] ) {
+                                my @fields;
+                                for my $tag ( @{ $facets->[$k]->{'tags'} } ) {
+                                    push @fields, $facet_record->field($tag);
+                                }
+                                for my $field (@fields) {
+                                    my @subfields = $field->subfields();
+                                    for my $subfield (@subfields) {
+                                        my ( $code, $data ) = @$subfield;
+                                        if ( $code eq
+                                            $facets->[$k]->{'subfield'} )
+                                        {
+                                            $facets_counter->{ $facets->[$k]
+                                                  ->{'link_value'} }->{$data}++;
+                                        }
+                                    }
+                                }
+                                $facets_info->{ $facets->[$k]->{'link_value'} }
+                                  ->{'label_value'} =
+                                  $facets->[$k]->{'label_value'};
+                                $facets_info->{ $facets->[$k]->{'link_value'} }
+                                  ->{'expanded'} = $facets->[$k]->{'expanded'};
+                            }
+                        }
+                    }
+                }
+                $results_hashref->{ $servers[ $i - 1 ] } = $results_hash;
+            }
+
+            #print "connection ", $i-1, ": $size hits";
+            #print $results[$i-1]->record(0)->render() if $size > 0;
+            # BUILD FACETS
+            for my $link_value (
+                sort { $facets_counter->{$b} <=> $facets_counter->{$a} }
+                keys %$facets_counter
+              )
+            {
+                my $expandable;
+                my $number_of_facets;
+                my @this_facets_array;
+                for my $one_facet (
+                    sort {
+                        $facets_counter->{$link_value}
+                          ->{$b} <=> $facets_counter->{$link_value}->{$a}
+                    } keys %{ $facets_counter->{$link_value} }
+                  )
+                {
+                    $number_of_facets++;
+                    if (   ( $number_of_facets < 6 )
+                        || ( $expanded_facet eq $link_value )
+                        || ( $facets_info->{$link_value}->{'expanded'} ) )
+                    {
+
+                       # sanitize the link value ), ( will cause errors with CCL
+                        my $facet_link_value = $one_facet;
+                        $facet_link_value =~ s/(\(|\))/ /g;
+
+                        # fix the length that will display in the label
+                        my $facet_label_value = $one_facet;
+                        $facet_label_value = substr( $one_facet, 0, 20 ) . "..."
+                          unless length($facet_label_value) <= 20;
+
+                       # well, if it's a branch, label by the name, not the code
+                        if ( $link_value =~ /branch/ ) {
+                            $facet_label_value =
+                              $branches->{$one_facet}->{'branchname'};
+                        }
+
+                 # but we're down with the whole label being in the link's title
+                        my $facet_title_value = $one_facet;
+
+                        push @this_facets_array,
+                          (
+                            {
+                                facet_count =>
+                                  $facets_counter->{$link_value}->{$one_facet},
+                                facet_label_value => $facet_label_value,
+                                facet_title_value => $facet_title_value,
+                                facet_link_value  => $facet_link_value,
+                                type_link_value   => $link_value,
+                            },
+                          );
+                    }
+                }
+                unless ( $facets_info->{$link_value}->{'expanded'} ) {
+                    $expandable = 1
+                      if ( ( $number_of_facets > 6 )
+                        && ( $expanded_facet ne $link_value ) );
+                }
+                push @facets_loop,
+                  (
+                    {
+                        type_link_value => $link_value,
+                        type_id         => $link_value . "_id",
+                        type_label      =>
+                          $facets_info->{$link_value}->{'label_value'},
+                        facets     => \@this_facets_array,
+                        expandable => $expandable,
+                        expand     => $link_value,
+                    }
+                  );
+            }
+        }
      }
-    my $i = 0;
-    my @results;
-    while ( $i < $n && $i < $number ) {
-        $raw = $rs->record($i)->raw();
-        my $record = MARC::Record->new_from_xml($raw);
-        my $line = MARCmarc2koha( $dbh, $record );
-        push @results, $line;
-#       push @results,$raw;
-       $i++;
+    return ( undef, $results_hashref, \@facets_loop );
+}
+
+sub _remove_stopwords {
+       my ($operand,$index) = @_;
+       # only strip stopwords when the index is not a phrase (phr) or exact (ext) index:
+       if ($index!~m/phr|ext/){
+       # operand may be a wordlist deleting stopwords
+       # remove stopwords from operand : parse all stopwords & remove them (case insensitive)
+       #       we use IsAlpha unicode definition, to deal correctly with diacritics.
+       #       otherwise, a French word like "leçon" is split into "le" and "çon"; "le" is a stopword, so we are left with "çon"
+       #       and don't find anything...
+               foreach (keys %{C4::Context->stopwords}) {
+      next if ($_ =~/(and|or|not)/); # don't remove operators 
+                       $operand=~ s/\P{IsAlpha}$_\P{IsAlpha}/ /i;
+                       $operand=~ s/^$_\P{IsAlpha}/ /i;
+                       $operand=~ s/\P{IsAlpha}$_$/ /i;
+               }
+       }
+       return $operand;
+}
+
+sub _add_truncation {
+       my ($operand,$index) = @_;
+       my (@nontruncated,@righttruncated,@lefttruncated,@rightlefttruncated,@regexpr);
+       # sort the words of the operand by truncation type (the index-qualifier check below is currently disabled)
+       #if (index($index,"phr")<0 && index($index,",")>0){
+       # warn "ADDING TRUNCATION QUALIFIERS";
+               $operand =~s/^ //g;
+               my @wordlist= split (/\s/,$operand);
+               foreach my $word (@wordlist){
+                       if ($word=~s/^\*([^\*]+)\*$/$1/){
+        push @rightlefttruncated,$word;
+                       } 
+                       elsif($word=~s/^\*([^\*]+)$/$1/){
+                               push @lefttruncated,$word;
+                        
+                       } 
+                       elsif ($word=~s/^([^\*]+)\*$/$1/){
+                               push @righttruncated,$word;
+                       } 
+                       elsif (index($word,"*")<0){
+                               push @nontruncated,$word;
+                       }
+                       else {
+                               push @regexpr,$word;
+                        
+                       }
+               }
+       #}
+       return (\@nontruncated,\@righttruncated,\@lefttruncated,\@rightlefttruncated,\@regexpr);
+}
+
+sub _build_stemmed_operand {
+       my ($operand) = @_;
+       my $stemmed_operand;
+       #$operand =~ s/^(and |or |not )//i;
+       # STEMMING FIXME: may need to refine the field weighting so stemmed operands don't 
+       # disrupt the query ranking, this needs more testing
+       # FIXME: the locale should be set based on the user's language and/or search choice
+       my $stemmer = Lingua::Stem->new( -locale => 'EN-US' );
+       # FIXME: these should be stored in the db so the librarian can modify the behavior
+       $stemmer->add_exceptions(
+                       {
+                               'and' => 'and',
+                'or'  => 'or',
+                'not' => 'not',
+                       }
+                    
+               );
+       my @words = split( / /, $operand );
+       my $stems = $stemmer->stem(@words);
+       foreach my $stem (@$stems) {
+                       $stemmed_operand .= "$stem";
+                       $stemmed_operand .= "?" unless ( $stem =~ /(and$|or$|not$)/ ) || ( length($stem) < 3 );
+                       $stemmed_operand .= " ";
+       }
+       #warn "STEMMED OPERAND: $stemmed_operand";
+       return $stemmed_operand;
+}
+
+sub _build_weighted_query {
+       # FIELD WEIGHTING - This is largely experimental stuff. What I'm committing works
+       # pretty well but will work much better when we have an actual query parser
+       my ($operand,$stemmed_operand,$index) = @_;
+    my $stemming      = C4::Context->preference("QueryStemming")     || 0;
+    my $weight_fields = C4::Context->preference("QueryWeightFields") || 0;
+    my $fuzzy_enabled = C4::Context->preference("QueryFuzzy") || 0;
+
+    my $weighted_query .= " (rk=(";     # Specifies that we're applying rank
+       # keyword has different weight properties
+       if ( ( $index =~ /kw/ ) || ( !$index ) ) {
+       # a simple way to find out if this query uses an index
+               if ( $operand =~ /(\=|\:)/ ) {
+                       $weighted_query .= " $operand";
+               }
+               else {
+                       $weighted_query .=" Title-cover,ext,r1=\"$operand\"";   # title cover as exact
+                       $weighted_query .=" or ti,ext,r2=\"$operand\"";             # exact title elsewhere
+                       $weighted_query .= " or ti,phr,r3=\"$operand\"";          # index as phrase
+                       #$weighted_query .= " or any,ext,r4=$operand";         # index as exact
+                       #$weighted_query .=" or kw,wrdl,r5=\"$operand\"";            # all the words in the query (wordlist)
+                       $weighted_query .= " or wrd,fuzzy,r8=\"$operand\"" if $fuzzy_enabled; # add fuzzy
+                       $weighted_query .= " or wrd,right-Truncation,r9=\"$stemmed_operand\"" if ($stemming and $stemmed_operand); # add stemming
+                       # embedded sorting: 0 a-z; 1 z-a
+                       #$weighted_query .= ") or (sort1,aut=1";
+               }
+                    
+       }
+       #TODO: build better cases based on specific search indexes
+       #elsif ( $index =~ /au/ ) {
+       #       $weighted_query .=" $index,ext,r1=$operand";    # index label as exact
+       #       #$weighted_query .= " or (title-sort-az=0 or $index,startswithnt,st-word,r3=$operand #)";
+       #       $weighted_query .=" or $index,phr,r3=$operand";    # index as phrase
+       #       $weighted_query .= " or $index,rt,wrd,r3=$operand";
+       #}
+       #elsif ( $index =~ /ti/ ) {
+       #       $weighted_query .=" Title-cover,ext,r1=$operand"; # index label as exact
+       #       $weighted_query .= " or Title-series,ext,r2=$operand";
+       #       #$weighted_query .= " or ti,ext,r2=$operand";
+       #       #$weighted_query .= " or ti,phr,r3=$operand";
+       #       #$weighted_query .= " or ti,wrd,r3=$operand";
+       #       $weighted_query .=" or (title-sort-az=0 or Title-cover,startswithnt,st-word,r3=$operand #)";
+       #       $weighted_query .=" or (title-sort-az=0 or Title-cover,phr,r6=$operand)";
+               #$weighted_query .= " or Title-cover,wrd,r5=$operand";
+               #$weighted_query .= " or ti,ext,r6=$operand";
+               #$weighted_query .= " or ti,startswith,phr,r7=$operand";
+               #$weighted_query .= " or ti,phr,r8=$operand";
+               #$weighted_query .= " or ti,wrd,r9=$operand";
+               #$weighted_query .= " or ti,ext,r2=$operand";         # index as exact
+               #$weighted_query .= " or ti,phr,r3=$operand";              # index as  phrase
+               #$weighted_query .= " or any,ext,r4=$operand";         # index as exact
+               #$weighted_query .= " or kw,wrd,r5=$operand";         # index as exact
+       #}
+       else {
+               warn "WEIGHT GENERIC";
+               $weighted_query .=" $index=$operand";
+               #$weighted_query .=" $index,ext,r1=$operand";    # index label as exact
+               #$weighted_query .= " or $index,ext,r2=$operand";            # index as exact
+               #$weighted_query .=" or $index,phr,r3=$operand";    # index as phrase
+               #$weighted_query .= " or $index,rt,wrd,r3=$operand";
+               #$weighted_query .=" or $index,wrd,r5=$operand";    # index as word right-truncated
+               #$weighted_query .= " or $index,wrd,fuzzy,r8=$operand" if $fuzzy_enabled;
+       }
+       $weighted_query .= "))";    # close rank specification
+       return $weighted_query;
+}
+
+# build the query itself
+sub buildQuery {
+    my ( $operators, $operands, $indexes, $limits, $sort_by ) = @_;
+
+    my @operators = @$operators if $operators;
+    my @indexes   = @$indexes   if $indexes;
+    my @operands  = @$operands  if $operands;
+    my @limits    = @$limits    if $limits;
+    my @sort_by   = @$sort_by   if $sort_by;
+
+       my $stemming      = C4::Context->preference("QueryStemming")     || 0;
+       my $weight_fields = C4::Context->preference("QueryWeightFields") || 0;
+       my $fuzzy_enabled = C4::Context->preference("QueryFuzzy") || 0;
+
+    my $human_search_desc;      # a human-readable query
+    my $machine_search_desc;    #a machine-readable query
+       #warn "OPERATORS: >@operators< INDEXES: >@indexes< OPERANDS: >@operands< LIMITS: >@limits< SORTS: >@sort_by<";
+       my $query = $operands[0];
+# STEP I: determine if this is a form-based / simple query or if it's complex (if complex,
+# we can't handle field weighting or stemming until a formal query parser is written)
+
+# check if this is a known query language query, if it is, return immediately,
+# the user is responsible for constructing valid syntax:
+    if ( $query =~ /^ccl=/ ) {
+        return ( undef, $', $', $', 'ccl' );
+    }
+    if ( $query =~ /^cql=/ ) {
+        return ( undef, $', $', $', 'cql' );
      }
-    return ( \@results );
+    if ( $query =~ /^pqf=/ ) {
+        return ( undef, $', $', $', 'pqf' );
+    }
+    if ( $query =~ /(\(|\))/ ) {    # sorry, too complex, assume CCL
+        return ( undef, $query, $query, $query, 'ccl' );
+    }
+
+# form-based queries are limited to non-nested at a specific depth, so we can easily
+# modify the incoming query operands and indexes to do stemming and field weighting
+# Once we do so, we'll end up with a value in $query, just like if we had an
+# incoming $query from the user
+    else {
+        $query = ""; # clear it out so we can populate properly with field-weighted stemmed query
+        my $previous_operand;    # a flag used to keep track if there was a previous query
+                                                       # if there was, we can apply the current operator
+               # for every operand
+        for ( my $i = 0 ; $i <= @operands ; $i++ ) {
+
+                       # COMBINE OPERANDS, INDEXES AND OPERATORS
+                       if ( $operands[$i] ) {
+               my $operand = $operands[$i];
+               my $index   = $indexes[$i];
+
+                               # if there's no index, don't use one, it will throw a CCL error
+                               my $index_plus;# $index_plus = "$index:" if $index;
+                               my $index_plus_comma;# $index_plus_comma="$index," if $index;
+
+                               # Remove Stopwords      
+                               $operand = _remove_stopwords($operand,$index);
+                               #warn "OP_SW: $operand";
+                               # Handle Truncation
+                               my ($nontruncated,$righttruncated,$lefttruncated,$rightlefttruncated,$regexpr);
+                               ($nontruncated,$righttruncated,$lefttruncated,$rightlefttruncated,$regexpr) = _add_truncation($operand,$index);
+                               #warn "TRUNCATION: NON:@$nontruncated RIGHT:@$righttruncated LEFT:@$lefttruncated RIGHTLEFT:@$rightlefttruncated REGEX:@$regexpr";
+
+                               # Handle Stemming
+                       my $stemmed_operand;
+                               $stemmed_operand = _build_stemmed_operand($operand) if $stemming;
+
+                               # Handle Field Weighting
+                               my $weighted_operand;
+                $weighted_operand = _build_weighted_query($operand,$stemmed_operand,$index) if $weight_fields;
  
+                               # proves we're operating in multi-leaf mode
+                               # $weighted_operand = "$weighted_operand and $weighted_operand";
+                               $operand = $weighted_operand if $weight_fields;
+
+                # If there's a previous operand, we need to add an operator
+                if ($previous_operand) {
+                                       # user-specified operator
+                    if ( $operators[$i-1] ) {
+                                               $human_search_desc .="  $operators[$i-1] $index_plus $operands[$i]";
+                                               $query .= " $operators[$i-1] $index_plus $operand";
+                    }
+                    # the default operator is and
+                    else {
+                        $query             .= " and $index_plus $operand";
+                        $human_search_desc .= " and $index_plus $operands[$i]";
+                    }
+                }
+                               # There's no previous operand - FIXME: completely ignoring our $query, no field weighting, no stemming
+                               # FIXME: also, doesn't preserve original order
+                else { 
+                                       # if there are terms to fit with truncation
+                                       if (scalar(@$righttruncated)+scalar(@$lefttruncated)+scalar(@$rightlefttruncated)>0){
+                                               # add the non-truncated ones first
+                                               $query.= "$index_plus @$nontruncated " if (scalar(@$nontruncated)>0);
+                                               if (scalar(@$righttruncated)>0){
+                                                       $query .= "and $index_plus_comma"."rtrn:@$righttruncated ";
+                                               }            
+                                               if (scalar(@$lefttruncated)>0){
+                                                       $query .= "and $index_plus_comma"."ltrn:@$lefttruncated ";
+                                               }            
+                                               if (scalar(@$rightlefttruncated)>0){
+                                                       $query .= "and $index_plus_comma"."rltrn:@$rightlefttruncated ";
+                                               }
+                        $query=~s/^and//; # FIXME: this is cheating :-)
+                        $human_search_desc .= $query;
+                                       } else {           
+                        $query             .= " $index_plus $operand";
+                        $human_search_desc .= " $index_plus $operands[$i]";
+                                       }            
+                    $previous_operand = 1;
+                }
+            }    #/if $operands
+        }    # /for
+    }
+       #warn "QUERY:".$query;
+    # add limits
+    my $limit_query;
+    my $limit_search_desc;
+    foreach my $limit (@limits) {
+
+        # FIXME: not quite right yet ... will work on this soon -- JF
+        my $type = $1 if $limit =~ m/([^:]+):([^:]*)/;
+        if ( $limit =~ /available/ ) {
+            $limit_query .= " (($query and datedue=0000-00-00) or ($query and datedue=0000-00-00 not lost=1) or ($query and datedue=0000-00-00 not lost=2))";
+            #$limit_search_desc.=" and available";
+        }
+        elsif ( ($limit_query) && ( index( $limit_query, $type, 0 ) > 0 ) ) {
+            if ( $limit_query !~ /\(/ ) {
+                $limit_query =
+                    substr( $limit_query, 0, index( $limit_query, $type, 0 ) )
+                  . "("
+                  . substr( $limit_query, index( $limit_query, $type, 0 ) )
+                  . " or $limit )"
+                  if $limit;
+                $limit_search_desc =
+                  substr( $limit_search_desc, 0,
+                    index( $limit_search_desc, $type, 0 ) )
+                  . "("
+                  . substr( $limit_search_desc,
+                    index( $limit_search_desc, $type, 0 ) )
+                  . " or $limit )"
+                  if $limit;
+            }
+            else {
+                chop $limit_query;
+                chop $limit_search_desc;
+                $limit_query       .= " or $limit )" if $limit;
+                $limit_search_desc .= " or $limit )" if $limit;
+            }
+        }
+        elsif ( ($limit_query) && ( $limit =~ /mc/ ) ) {
+            $limit_query       .= " or $limit" if $limit;
+            $limit_search_desc .= " or $limit" if $limit;
+        }
+
+        # these are treated as AND
+        elsif ($limit_query) {
+           if ($limit =~ /branch/){
+                       $limit_query       .= " ) and ( $limit" if $limit;
+                       $limit_search_desc .= " ) and ( $limit" if $limit;
+               }else{
+                       $limit_query       .= " or $limit" if $limit;
+                       $limit_search_desc .= " or $limit" if $limit;
+               }
+        }
+
+        # otherwise, there is nothing but the limit
+        else {
+            $limit_query       .= "$limit" if $limit;
+            $limit_search_desc .= "$limit" if $limit;
+        }
+    }
+
+    # if there's also a query, we need to AND the limits to it
+    if ( ($limit_query) && ($query) ) {
+        $limit_query       = " and (" . $limit_query . ")";
+        $limit_search_desc = " and ($limit_search_desc)" if $limit_search_desc;
+
+    }
+       #warn "LIMIT: $limit_query";
+    $query             .= $limit_query;
+    $human_search_desc .= $limit_search_desc;
+
+    # now normalize the strings
+    $query =~ s/  / /g;    # remove extra spaces
+    $query =~ s/^ //g;     # remove any beginning spaces
+    $query =~ s/:/=/g;     # causes probs for server
+    $query =~ s/==/=/g;    # remove double == from query
+
+    my $federated_query = $human_search_desc;
+    $federated_query =~ s/  / /g;
+    $federated_query =~ s/^ //g;
+    $federated_query =~ s/:/=/g;
+    my $federated_query_opensearch = $federated_query;
+
+#     my $federated_query_RPN = new ZOOM::Query::CCL2RPN( $query , C4::Context->ZConn('biblioserver'));
+
+    $human_search_desc =~ s/  / /g;
+    $human_search_desc =~ s/^ //g;
+    my $koha_query = $query;
+
+    #warn "QUERY:".$koha_query;
+    #warn "SEARCHDESC:".$human_search_desc;
+    #warn "FEDERATED QUERY:".$federated_query;
+    return ( undef, $human_search_desc, $koha_query, $federated_query );
  }
  
-sub get_record {
+# searchResults( $searchdesc, $hits, $results_per_page, $offset, @marcresults ): decodes the USMARC records of @marcresults from index $offset on (at most $results_per_page of them, never past $hits) and returns a list of hashrefs, one per record, built with TransformMarcToKoha and enriched with itemtype image/description/summary, highlighted search terms, a row colour toggle, grouped item information (items_loop) and availability counters.
+# IMO this subroutine is pretty messy still -- it's responsible for building the HTML output for the template
+sub searchResults {
+    my ( $searchdesc, $hits, $results_per_page, $offset, @marcresults ) = @_;
+
+    my $dbh = C4::Context->dbh;
+    my $toggle;
+    my $even = 1;    # NOTE(review): never read in this sub
+    my @newresults;
+    my $span_terms_hashref;
+    for my $span_term ( split( / /, $searchdesc ) ) {
+        $span_term =~ s/(.*=|\)|\(|\+|\.)//g;
+        $span_terms_hashref->{$span_term}++;
+    }
+
+    # Build the branch names hash:
+    # read every branch from the branches table
+    # and map branchcode => branchname
+    my %branches;
+    my $bsth =
+      $dbh->prepare("SELECT branchcode,branchname FROM branches")
+      ;    # FIXME : use C4::Koha::GetBranches
+    $bsth->execute();
+    while ( my $bdata = $bsth->fetchrow_hashref ) {
+        $branches{ $bdata->{'branchcode'} } = $bdata->{'branchname'};
+    }
+
+    # Build the itemtype hash:
+    # itemtype => { description, imageurl, summary, notforloan } read from the itemtypes table
+    my %itemtypes;
+    $bsth =
+      $dbh->prepare("SELECT itemtype,description,imageurl,summary,notforloan FROM itemtypes");
+    $bsth->execute();
+    while ( my $bdata = $bsth->fetchrow_hashref ) {
+        $itemtypes{ $bdata->{'itemtype'} }->{description} =
+          $bdata->{'description'};
+        $itemtypes{ $bdata->{'itemtype'} }->{imageurl} = $bdata->{'imageurl'};
+        $itemtypes{ $bdata->{'itemtype'} }->{summary} = $bdata->{'summary'};
+        $itemtypes{ $bdata->{'itemtype'} }->{notforloan} = $bdata->{'notforloan'};
+    }
+
+    # look up the MARC tag mapped to items.itemnumber; fields with this tag are read as items further down
+    my $sth =
+      $dbh->prepare(
+"select tagfield from marc_subfield_structure where kohafield like 'items.itemnumber'"
+      );
+    $sth->execute;
+    my ($itemtag) = $sth->fetchrow;
+
+    ## map every column name of the items table to the MARC subfield code returned by GetMarcFromKohaField
+    my $sth2 = $dbh->prepare("SHOW COLUMNS from items");
+    $sth2->execute;
+    my %subfieldstosearch;
+    while ( ( my $column ) = $sth2->fetchrow ) {
+        my ( $tagfield, $tagsubfield ) =
+          &GetMarcFromKohaField( "items." . $column, "" );
+        $subfieldstosearch{$column} = $tagsubfield;
+    }
+    my $times;
  
-    # pass in an id (biblionumber at this stage) and get back a MARC record
-    my ($id) = @_;
-    my $q;
-    my $Zconn;
-    my $raw;
-    eval { $Zconn = new ZOOM::Connection( C4::Context->config("zebradb") ); };
-    if ($@) {
-        warn "Error ", $@->code(), ": ", $@->message(), "\n";
+    if ( $hits && $offset + $results_per_page <= $hits ) {
+        $times = $offset + $results_per_page;
+    }
+    else {
+        $times = $hits;
      }
-    $Zconn->option( cqlfile => C4::Context->config("intranetdir")
-          . "/zebra/pqf.properties" );
-    $Zconn->option( preferredRecordSyntax => "xml" );
-    my $string = "identifier=$id";
-    warn $string;
  
-        $q = new ZOOM::Query::CQL2RPN( $string, $Zconn);
-    eval {
-#        my $rs = $Zconn->search_pqf("\@attr 1=12 $id");
-       my $rs = $Zconn->search($q);
-        my $n  = $rs->size();
-        if ( $n > 0 ) {
-            $raw = $rs->record(0)->raw();
+    for ( my $i = $offset ; $i <= $times - 1 ; $i++ ) {
+        my $marcrecord;
+        $marcrecord = MARC::File::USMARC::decode( $marcresults[$i] );
+        my $oldbiblio = TransformMarcToKoha( $dbh, $marcrecord, '' );
+        # add image url if there is one: an imageurl starting with http: is used as is, any other non-empty value is prefixed with getitemtypeimagesrc()
+        if ( $itemtypes{ $oldbiblio->{itemtype} }->{imageurl} =~ /^http:/ ) {
+            $oldbiblio->{imageurl} =
+              $itemtypes{ $oldbiblio->{itemtype} }->{imageurl};
+            $oldbiblio->{description} =
+              $itemtypes{ $oldbiblio->{itemtype} }->{description};
+        }
+        else {
+            $oldbiblio->{imageurl} =
+              getitemtypeimagesrc() . "/"
+              . $itemtypes{ $oldbiblio->{itemtype} }->{imageurl}
+              if ( $itemtypes{ $oldbiblio->{itemtype} }->{imageurl} );
+            $oldbiblio->{description} =
+              $itemtypes{ $oldbiblio->{itemtype} }->{description};
+        }
+        #
+        # build summary if there is one: the summary template of the itemtypes table holds [tag*] / [tag+subfield code] placeholders that are filled from the record's fields; placeholders still in brackets afterwards are removed and newlines become <br>
+        #
+        if ($itemtypes{ $oldbiblio->{itemtype} }->{summary}) {
+            my $summary = $itemtypes{ $oldbiblio->{itemtype} }->{summary};
+            my @fields = $marcrecord->fields();
+            foreach my $field (@fields) {
+                my $tag = $field->tag();
+                my $tagvalue = $field->as_string();
+                $summary =~ s/\[(.?.?.?.?)$tag\*(.*?)]/$1$tagvalue$2\[$1$tag$2]/g;
+                unless ($tag<10) {
+                    my @subf = $field->subfields;
+                    for my $i (0..$#subf) {
+                        my $subfieldcode = $subf[$i][0];
+                        my $subfieldvalue = $subf[$i][1];
+                        my $tagsubf = $tag.$subfieldcode;
+                        $summary =~ s/\[(.?.?.?.?)$tagsubf(.*?)]/$1$subfieldvalue$2\[$1$tagsubf$2]/g;
+                    }
+                }
+            }
+            $summary =~ s/\[(.*?)]//g;
+            $summary =~ s/\n/<br>/g;
+            $oldbiblio->{summary} = $summary;
+        }
+        # add spans to search term in results for search term highlighting (only terms longer than 3 characters are highlighted)
+        foreach my $term ( keys %$span_terms_hashref ) {
+            my $old_term = $term;
+            if ( length($term) > 3 ) {
+                $term =~ s/(.*=|\)|\(|\+|\.|\?|\[|\])//g;
+                               $term =~ s/\\//g;
+                               $term =~ s/\*//g;
+
+                #FIXME: is there a better way to do this? ($term is interpolated into the patterns below as a regular expression)
+                $oldbiblio->{'title'} =~ s/$term/<span class=\"term\">$&<\/span>/gi;
+                $oldbiblio->{'subtitle'} =~
+                  s/$term/<span class=\"term\">$&<\/span>/gi;
+
+                $oldbiblio->{'author'} =~ s/$term/<span class=\"term\">$&<\/span>/gi;
+                $oldbiblio->{'publishercode'} =~ s/$term/<span class=\"term\">$&<\/span>/gi;
+                $oldbiblio->{'place'} =~ s/$term/<span class=\"term\">$&<\/span>/gi;
+                $oldbiblio->{'pages'} =~ s/$term/<span class=\"term\">$&<\/span>/gi;
+                $oldbiblio->{'notes'} =~ s/$term/<span class=\"term\">$&<\/span>/gi;
+                $oldbiblio->{'size'}  =~ s/$term/<span class=\"term\">$&<\/span>/gi;
+            }
+        }
+
+        if ( $i % 2 ) {
+            $toggle = "#ffffcc";
+        }
+        else {
+            $toggle = "white";
          }
-    };
-    if ($@) {
+        $oldbiblio->{'toggle'} = $toggle;
+        my @fields = $marcrecord->field($itemtag);
+        my @items_loop;
+        my $items;
+        my $ordered_count     = 0;    # NOTE(review): never incremented below, so orderedcount is always 0
+        my $onloan_count      = 0;
+        my $wthdrawn_count    = 0;
+        my $itemlost_count    = 0;
+        my $norequests        = 1;
+
+        #
+        # check the loan status of the item : 
+        # it is not stored in the MARC record, for pref (zebra reindexing)
+        # reason. Thus, we have to get the status from a specific SQL query
+        #
+        my $sth_issue = $dbh->prepare("
+            SELECT date_due,returndate 
+            FROM issues 
+            WHERE itemnumber=? AND returndate IS NULL");
+        my $items_count=scalar(@fields);
+        foreach my $field (@fields) {
+            my $item;
+            foreach my $code ( keys %subfieldstosearch ) {
+                $item->{$code} = $field->subfield( $subfieldstosearch{$code} );
+            }
+            $sth_issue->execute($item->{itemnumber});
+            $item->{due_date} = format_date($sth_issue->fetchrow);
+            $item->{onloan} = 1 if $item->{due_date};
+            # at least one item can be reserved : suppose no -- NOTE(review): this reset runs for every item, so only the last item decides the value kept after the loop; confirm this is intended
+            $norequests = 1;
+            if ( $item->{wthdrawn} ) {
+                $wthdrawn_count++;
+                $items->{ $item->{'homebranch'}.'--'.$item->{'itemcallnumber'} }->{unavailable}=1;
+                $items->{ $item->{'homebranch'}.'--'.$item->{'itemcallnumber'} }->{wthdrawn}=1;
+            }
+            elsif ( $item->{itemlost} ) {
+                $itemlost_count++;
+                $items->{ $item->{'homebranch'}.'--'.$item->{'itemcallnumber'} }->{unavailable}=1;
+                $items->{ $item->{'homebranch'}.'--'.$item->{'itemcallnumber'} }->{itemlost}=1;
+            }
+            unless ( $item->{notforloan}) {
+                # OK, this one can be issued, so at least one can be reserved
+                $norequests = 0;
+            }
+            if ( ( $item->{onloan} ) && ( $item->{onloan} != '0000-00-00' ) )    # NOTE(review): numeric != applied to a date string
+            {
+                $items->{ $item->{'homebranch'}.'--'.$item->{'itemcallnumber'} }->{unavailable}=1;
+                $items->{ $item->{'homebranch'}.'--'.$item->{'itemcallnumber'} }->{onloancount} = 1;
+                $items->{ $item->{'homebranch'}.'--'.$item->{'itemcallnumber'} }->{due_date} = $item->{due_date};
+                $onloan_count++;
+            }
+            if ( $item->{'homebranch'} ) {
+                $items->{ $item->{'homebranch'}.'--'.$item->{'itemcallnumber'} }->{count}++;
+            }
+
+            # Last resort: count under the holdingbranch key -- NOTE(review): the three assignments after this branch still use the homebranch--itemcallnumber key
+            elsif ( $item->{'holdingbranch'} ) {
+                $items->{ $item->{'holdingbranch'} }->{count}++;
+            }
+            $items->{ $item->{'homebranch'}.'--'.$item->{'itemcallnumber'} }->{itemcallnumber} =                $item->{itemcallnumber};
+            $items->{ $item->{'homebranch'}.'--'.$item->{'itemcallnumber'} }->{location} =                $item->{location};
+            $items->{ $item->{'homebranch'}.'--'.$item->{'itemcallnumber'} }->{branchcode} =               $item->{homebranch};
+        }    # notforloan, item level and biblioitem level
+
+        # last check for norequest : if itemtype is notforloan, it can't be reserved either, whatever the items
+        $norequests = 1 if $itemtypes{$oldbiblio->{itemtype}}->{notforloan};
  
-        print "Error ", $@->code(), ": ", $@->message(), "\n";
+        for my $key ( sort keys %$items ) {
+            my $this_item = {
+                branchname     => $branches{$items->{$key}->{branchcode}},
+                branchcode     => $items->{$key}->{branchcode},
+                count          => $items->{$key}->{count},
+                itemcallnumber => $items->{$key}->{itemcallnumber},
+                location => $items->{$key}->{location},
+                onloancount      => $items->{$key}->{onloancount},
+                due_date         => $items->{$key}->{due_date},
+                wthdrawn      => $items->{$key}->{wthdrawn},
+                lost         => $items->{$key}->{itemlost},
+            };
+            push @items_loop, $this_item;
+        }
+        $oldbiblio->{norequests}    = $norequests;
+        $oldbiblio->{items_count}    = $items_count;
+        $oldbiblio->{items_loop}    = \@items_loop;
+        $oldbiblio->{onloancount}   = $onloan_count;
+        $oldbiblio->{wthdrawncount} = $wthdrawn_count;
+        $oldbiblio->{itemlostcount} = $itemlost_count;
+        $oldbiblio->{orderedcount}  = $ordered_count;
+        $oldbiblio->{isbn}          =~ s/-//g; # deleting - in isbn to enable amazon content 
+        push( @newresults, $oldbiblio );
      }
-    ###$raw
-    my $record = MARC::Record->new_from_xml($raw);
-    ###$record
-    return ($record);
+    return @newresults;
  }
  
-1;
-__END__
+
+
+#----------------------------------------------------------------------
+#
+# Non-Zebra GetRecords#
+#----------------------------------------------------------------------
+
+=head2 NZgetRecords
+
+  my ( $error, $results_hashref, $facets ) = NZgetRecords(
+      $koha_query,     $federated_query,  $sort_by_ref,
+      $servers_ref,    $results_per_page, $offset,
+      $expanded_facet, $branches,         $query_type,
+      $scan
+  );
+
+NZgetRecords has the same API as the Zebra getRecords, even if some parameters
+are not managed: only $koha_query, the first entry of $sort_by_ref,
+$results_per_page and $offset are used.
+
+The query is resolved by NZanalyse and the hits are ordered by NZorder. The
+first and third returned values are always undef; the second one is whatever
+NZorder returns.
+
+=cut
+
+sub NZgetRecords {
+    my (
+        $koha_query,     $federated_query,  $sort_by_ref,
+        $servers_ref,    $results_per_page, $offset,
+        $expanded_facet, $branches,         $query_type,
+        $scan
+    ) = @_;
+
+    # Only the first sort criterion is honoured. Read it as a single element
+    # (not as a one-element slice) and tolerate a missing sort list.
+    my $ordering = $sort_by_ref ? $sort_by_ref->[0] : undef;
+
+    my $result = NZanalyse($koha_query);
+    return ( undef, NZorder( $result, $ordering, $results_per_page, $offset ), undef );
+}
+
+=head2 NZanalyse
+
+  my $results = NZanalyse( $string, $server );
+
+NZanalyse gets a query string as parameter and returns the matching entries as
+one string. The entries are separated by ";" and are expected to look like
+biblionumber,title-weight (this is what the nozebra table stores).
+The list is built from the inverted index in the nozebra SQL table.
+Note that title is here only for convenience : the sorting will be very fast
+when requested on title. If the sorting is requested on something else, we
+will have to reread all results, and that may be longer.
+
+$server is the nozebra server to search on; it defaults to biblioserver.
+
+The string is split on its last " and ", " or " or " not " operator (upper or
+lower case) and both sides are analysed recursively. A string without such an
+operator is a leaf: it is either "index operator value" (operators >=, <=, >,
+< and =) or a list of words searched on all indexes. Inside a leaf, all words
+must match (AND).
+
+Returns undef (or an empty string) when nothing matches.
+
+=cut
+
+sub NZanalyse {
+    my ( $string, $server ) = @_;
+
+    # $server contains biblioserver or authorities, depending on what we search on.
+    #warn "querying : $string on $server";
+    $server = 'biblioserver' unless $server;
+    $string = '' unless defined $string;
+
+    # if we have a ", replace the content to discard temporarily any and/or/not inside
+    # (only the first quoted part is protected)
+    my $commacontent;
+    if ( $string =~ s/"(.*?)"/__X__/ ) {
+        $commacontent = $1;
+    }
+
+    # split the query string in 3 parts : X AND Y means : $left="X", $operand="AND" and $right="Y"
+    # then, call again NZanalyse with $left and $right
+    # (recursive until we find a leaf (=> something without and/or/not)
+    # The captures are read only when the match succeeded: after a failed
+    # match $1..$3 still hold the values of an earlier successful match.
+    my ( $left, $operand, $right );
+    if ( $string =~ /(.*)( and | or | not | AND | OR | NOT )(.*)/ ) {
+        ( $left, $operand, $right ) = ( $1, lc($2), $3 );
+    }
+
+    # it's not a leaf, we have a and/or/not
+    if ($operand) {
+
+        # reintroduce comma content if needed
+        $right =~ s/__X__/"$commacontent"/ if defined $commacontent;
+        $left  =~ s/__X__/"$commacontent"/ if defined $commacontent;
+
+        #warn "node : $left / $operand / $right\n";
+        my $leftresult  = NZanalyse( $left,  $server );
+        my $rightresult = NZanalyse( $right, $server );
+        $leftresult = '' unless defined $leftresult;
+
+        # OK, we have the results for right and left part of the query
+        # depending of operand, intersect, union or exclude both lists
+        # to get a result list
+        if ( $operand eq ' and ' ) {
+            my $finalresult;
+
+            # parse the left results, and if the biblionumber exist in the right result, save it in finalresult
+            # the result is stored twice, to have the same weight for AND than OR.
+            # example : TWO : 61,61,64,121 (two is twice in the biblio #61) / TOWER : 61,64,130
+            # result : 61,61,61,61,64,64 for two AND tower : 61 has more weight than 64
+            foreach my $entry ( split /;/, $leftresult ) {
+                $finalresult .= "$entry;$entry;"
+                  if _NZhasEntry( $rightresult, $entry );
+            }
+            return $finalresult;
+        }
+        elsif ( $operand eq ' or ' ) {
+
+            # just merge the 2 strings
+            return $leftresult . ( defined $rightresult ? $rightresult : '' );
+        }
+        elsif ( $operand eq ' not ' ) {
+            my $finalresult;
+            foreach my $entry ( split /;/, $leftresult ) {
+                $finalresult .= "$entry;"
+                  unless _NZhasEntry( $rightresult, $entry );
+            }
+            return $finalresult;
+        }
+        else {
+
+            # this error is impossible, because of the regexp that isolate the operand, but just in case...
+            die "error : operand unknown : $operand for $string";
+        }
+    }
+
+    # it's a leaf, do the real SQL query and return the result
+    $string =~ s/__X__/"$commacontent"/ if defined $commacontent;
+    $string =~ s/-|\.|\?|,|;|!|'|\(|\)|\[|\]|{|}|"|&|\+|\*|\// /g;
+
+    #warn "leaf : $string\n";
+    # parse the string in in operator/operand/value again
+    # (two-character operators first, so that ">=" is not read as ">")
+    my ( $index, $operator, $value_part );
+    if ( $string =~ /(.*)(>=|<=)(.*)/ ) {
+        ( $index, $operator, $value_part ) = ( $1, $2, $3 );
+    }
+    elsif ( $string =~ /(.*)(>|<|=)(.*)/ ) {
+        ( $index, $operator, $value_part ) = ( $1, $2, $3 );
+    }
+
+    # automatic replace for short operators
+    if ( defined $index ) {
+        $index = 'title'            if $index =~ /^ti/;
+        $index = 'author'           if $index =~ /^au/;
+        $index = 'publisher'        if $index =~ /^pb/;
+        $index = 'subject'          if $index =~ /^su/;
+        $index = 'koha-Auth-Number' if $index =~ /^an/;
+        $index = 'keyword'          if $index =~ /^kw/;
+    }
+
+    my $results;
+    my $dbh = C4::Context->dbh;
+
+    # $first_word tells "no word processed yet" apart from "the words processed
+    # so far matched nothing": in the second case the result must stay empty
+    # instead of being replaced by the hits of the next word.
+    my $first_word = 1;
+    if ($operator) {
+
+        #do a specific search
+        # $operator can only be one of >=, <=, >, <, = or LIKE here, so it is
+        # safe to put it in the SQL text; the values are bound.
+        $operator = 'LIKE' if $operator eq '=' and $value_part =~ /%/;
+        my $sth = $dbh->prepare("SELECT biblionumbers,value FROM nozebra WHERE server=? AND indexname=? AND value $operator ?");
+
+        #warn "$index / $operator / $value_part\n";
+        # split each word, query the DB and build the biblionumbers result
+        foreach my $word ( split / /, $value_part ) {
+            next unless $word;
+
+            #warn "EXECUTE : $server, $index, $word";
+            $sth->execute( $server, $index, $word );
+            my $biblionumbers;
+            while ( my ( $line, $value ) = $sth->fetchrow ) {
+
+                # if we are dealing with a numeric value, use only numeric results (in case of >=, <=, > or <)
+                # otherwise, fill the result
+                $biblionumbers .= $line
+                  unless ( $value_part =~ /\d/ && $value =~ /\D/ );
+            }
+
+            # do a AND with existing list if there is one, otherwise, use the biblionumbers list as 1st result list
+            if ($first_word) {
+                $results    = $biblionumbers;
+                $first_word = 0;
+            }
+            else {
+                $results = _NZintersectLeaf( $results, $biblionumbers );
+            }
+        }
+    }
+    else {
+
+        #do a complete search (all indexes)
+        my $sth = $dbh->prepare("SELECT biblionumbers FROM nozebra WHERE server=? AND value LIKE ?");
+
+        # split each word, query the DB and build the biblionumbers result
+        foreach my $word ( split / /, $string ) {
+            next if C4::Context->stopwords->{ uc($word) };    # skip if stopword
+            next unless $word;
+
+            #warn "search on all indexes on $word";
+            $sth->execute( $server, $word );
+            my $biblionumbers;
+            while ( my $line = $sth->fetchrow ) {
+                $biblionumbers .= $line;
+            }
+
+            # do a AND with existing list if there is one, otherwise, use the biblionumbers list as 1st result list
+            if ($first_word) {
+                $results    = $biblionumbers;
+                $first_word = 0;
+            }
+            else {
+                $results = _NZintersectLeaf( $results, $biblionumbers );
+            }
+        }
+    }
+
+    #warn "return : $results for LEAF : $string";
+    return $results;
+}
+
+# _NZhasEntry( $list, $entry ) : true when $entry is one complete entry of the
+# ";"-terminated $list. The comparison is literal and anchored on the entry
+# separators, so "1,x" is not found inside "61,x" and titles containing regexp
+# metacharacters are harmless.
+sub _NZhasEntry {
+    my ( $list, $entry ) = @_;
+    return 0 unless defined $list && defined $entry && length $entry;
+    return index( ";$list", ";$entry;" ) >= 0 ? 1 : 0;
+}
+
+# _NZintersectLeaf( $results, $biblionumbers ) : AND of the running leaf result
+# with the entries found for one more word. An entry of $biblionumbers is kept
+# (twice, to increase its weight) when $results holds an entry starting with
+# the same text once the trailing "-weight" is removed. Returns undef when
+# nothing is common.
+sub _NZintersectLeaf {
+    my ( $results, $biblionumbers ) = @_;
+    return unless defined $results && defined $biblionumbers;
+    my $merged;
+    foreach my $entry ( split /;/, $biblionumbers ) {
+
+        # remove weight at the end
+        my $cleaned = $entry;
+        $cleaned =~ s/-\d*$//;
+        next unless length $cleaned;
+
+        # if the entry is already in the list, take it & increase weight
+        $merged .= "$entry;$entry;"
+          if index( ";$results", ";$cleaned" ) >= 0;
+    }
+    return $merged;
+}
+
+=head2 NZorder
+
+  $finalresult = NZorder($biblionumbers, $ordering,$results_per_page,$offset);
+  
+  TODO :: Description
+
+=cut
+
+
+sub NZorder {
+    my ($biblionumbers, $ordering,$results_per_page,$offset) = @_;
+    # order title asc by default
+#     $ordering = '1=36 <i' unless $ordering;
+    $results_per_page=20 unless $results_per_page;
+    $offset = 0 unless $offset;
+    my $dbh = C4::Context->dbh;
+    #
+    # order by POPULARITY
+    #
+    if ($ordering =~ /popularity/) {
+        my %result;
+        my %popularity;
+        # popularity is not in MARC record, it's builded from a specific query
+        my $sth = $dbh->prepare("select sum(issues) from items where biblionumber=?");
+        foreach (split /;/,$biblionumbers) {
+            my ($biblionumber,$title) = split /,/,$_;
+            $result{$biblionumber}=GetMarcBiblio($biblionumber);
+            $sth->execute($biblionumber);
+            my $popularity= $sth->fetchrow ||0;
+            # hint : the key is popularity.title because we can have
+            # many results with the same popularity. In this cas, sub-ordering is done by title
+            # we also have biblionumber to avoid bug for 2 biblios with the same title & popularity
+            # (un-frequent, I agree, but we won't forget anything that way ;-)
+            $popularity{sprintf("%10d",$popularity).$title.$biblionumber} = $biblionumber;
+        }
+        # sort the hash and return the same structure as GetRecords (Zebra querying)
+        my $result_hash;
+        my $numbers=0;
+        if ($ordering eq 'popularity_dsc') { # sort popularity DESC
+            foreach my $key (sort {$b cmp $a} (keys %popularity)) {
+                $result_hash->{'RECORDS'}[$numbers++] = $result{$popularity{$key}}->as_usmarc();
+            }
+        } else { # sort popularity ASC
+            foreach my $key (sort (keys %popularity)) {
+                $result_hash->{'RECORDS'}[$numbers++] = $result{$popularity{$key}}->as_usmarc();
+            }
+        }
+        my $finalresult=();
+        $result_hash->{'hits'} = $numbers;
+        $finalresult->{'biblioserver'} = $result_hash;
+        return $finalresult;
+    #
+    # ORDER BY author
+    #
+    } elsif ($ordering =~/author/){
+        my %result;
+        foreach (split /;/,$biblionumbers) {
+            my ($biblionumber,$title) = split /,/,$_;
+            my $record=GetMarcBiblio($biblionumber);
+            my $author;
+            if (C4::Context->preference('marcflavour') eq 'UNIMARC') {
+                $author=$record->subfield('200','f');
+                $author=$record->subfield('700','a') unless $author;
+            } else {
+                $author=$record->subfield('100','a');
+            }
+            # hint : the result is sorted by title.biblionumber because we can have X biblios with the same title
+            # and we don't want to get only 1 result for each of them !!!
+            $result{$author.$biblionumber}=$record;
+        }
+        # sort the hash and return the same structure as GetRecords (Zebra querying)
+        my $result_hash;
+        my $numbers=0;
+        if ($ordering eq 'author_za') { # sort by author desc
+            foreach my $key (sort (keys %result)) {
+                $result_hash->{'RECORDS'}[$numbers++] = $result{$key}->as_usmarc();
+            }
+        } else { # sort by author ASC
+            foreach my $key (sort { $a cmp $b } (keys %result)) {
+                $result_hash->{'RECORDS'}[$numbers++] = $result{$key}->as_usmarc();
+            }
+        }
+        my $finalresult=();
+        $result_hash->{'hits'} = $numbers;
+        $finalresult->{'biblioserver'} = $result_hash;
+        return $finalresult;
+    #
+    # ORDER BY callnumber
+    #
+    } elsif ($ordering =~/callnumber/){
+        my %result;
+        foreach (split /;/,$biblionumbers) {
+            my ($biblionumber,$title) = split /,/,$_;
+            my $record=GetMarcBiblio($biblionumber);
+            my $callnumber;
+            my ($callnumber_tag,$callnumber_subfield)=GetMarcFromKohaField($dbh,'items.itemcallnumber');
+            ($callnumber_tag,$callnumber_subfield)= GetMarcFromKohaField('biblioitems.callnumber') unless $callnumber_tag;
+            if (C4::Context->preference('marcflavour') eq 'UNIMARC') {
+                $callnumber=$record->subfield('200','f');
+            } else {
+                $callnumber=$record->subfield('100','a');
+            }
+            # hint : the result is sorted by title.biblionumber because we can have X biblios with the same title
+            # and we don't want to get only 1 result for each of them !!!
+            $result{$callnumber.$biblionumber}=$record;
+        }
+        # sort the hash and return the same structure as GetRecords (Zebra querying)
+        my $result_hash;
+        my $numbers=0;
+        if ($ordering eq 'call_number_dsc') { # sort by title desc
+            foreach my $key (sort (keys %result)) {
+                $result_hash->{'RECORDS'}[$numbers++] = $result{$key}->as_usmarc();
+            }
+        } else { # sort by title ASC
+            foreach my $key (sort { $a cmp $b } (keys %result)) {
+                $result_hash->{'RECORDS'}[$numbers++] = $result{$key}->as_usmarc();
+            }
+        }
+        my $finalresult=();
+        $result_hash->{'hits'} = $numbers;
+        $finalresult->{'biblioserver'} = $result_hash;
+        return $finalresult;
+    } elsif ($ordering =~ /pubdate/){ #pub year
+        my %result;
+        foreach (split /;/,$biblionumbers) {
+            my ($biblionumber,$title) = split /,/,$_;
+            my $record=GetMarcBiblio($biblionumber);
+            my ($publicationyear_tag,$publicationyear_subfield)=GetMarcFromKohaField($dbh,'biblioitems.publicationyear');
+            my $publicationyear=$record->subfield($publicationyear_tag,$publicationyear_subfield);
+            # hint : the result is keyed by publicationyear.biblionumber because several biblios can share the same publication year
+            # and we don't want to keep only 1 result for each of them !!!
+            $result{$publicationyear.$biblionumber}=$record;
+        }
+        # sort the hash and return the same structure as GetRecords (Zebra querying)
+        my $result_hash;
+        my $numbers=0;
+        if ($ordering eq 'pubdate_dsc') { # sort by pubyear desc
+            foreach my $key (sort (keys %result)) {
+                $result_hash->{'RECORDS'}[$numbers++] = $result{$key}->as_usmarc();
+            }
+        } else { # sort by pub year ASC
+            foreach my $key (sort { $b cmp $a } (keys %result)) {
+                $result_hash->{'RECORDS'}[$numbers++] = $result{$key}->as_usmarc();
+            }
+        }
+        my $finalresult=();
+        $result_hash->{'hits'} = $numbers;
+        $finalresult->{'biblioserver'} = $result_hash;
+        return $finalresult;
+    #
+    # ORDER BY title
+    #
+    } elsif ($ordering =~ /title/) { 
+        # the title is in the biblionumbers string, so we just need to build a hash, sort it and return
+        my %result;
+        foreach (split /;/,$biblionumbers) {
+            my ($biblionumber,$title) = split /,/,$_;
+            # hint : the result is sorted by title.biblionumber because we can have X biblios with the same title
+            # and we don't want to get only 1 result for each of them !!!
+            # hint & speed improvement : we can order without reading the record
+            # so order, and read records only for the requested page !
+            $result{$title.$biblionumber}=$biblionumber;
+        }
+        # sort the hash and return the same structure as GetRecords (Zebra querying)
+        my $result_hash;
+        my $numbers=0;
+        if ($ordering eq 'title_za') { # sort by title desc
+            foreach my $key (sort (keys %result)) {
+                $result_hash->{'RECORDS'}[$numbers++] = $result{$key};
+            }
+        } else { # sort by title ASC
+            foreach my $key (sort { $b cmp $a } (keys %result)) {
+                $result_hash->{'RECORDS'}[$numbers++] = $result{$key};
+            }
+        }
+        # limit the $results_per_page to result size if it's more
+        $results_per_page = $numbers-1 if $numbers < $results_per_page;
+        # for the requested page, replace biblionumber by the complete record
+        # speed improvement : avoid reading too much things
+        for (my $counter=$offset;$counter<=$offset+$results_per_page;$counter++) {
+            $result_hash->{'RECORDS'}[$counter] = GetMarcBiblio($result_hash->{'RECORDS'}[$counter])->as_usmarc;
+        }
+        my $finalresult=();
+        $result_hash->{'hits'} = $numbers;
+        $finalresult->{'biblioserver'} = $result_hash;
+        return $finalresult;
+    } else {
+    #
+    # order by ranking
+    #
+        # we need 2 hashes to order by ranking : the 1st one to count the ranking, the 2nd to order by ranking
+        my %result;
+        my %count_ranking;
+        foreach (split /;/,$biblionumbers) {
+            my ($biblionumber,$title) = split /,/,$_;
+            $title =~ /(.*)-(\d)/;
+            # get weight 
+            my $ranking =$2;
+            # note that we + the ranking because ranking is calculated on weight of EACH term requested.
+            # if we ask for "two towers", and "two" has weight 2 in biblio N, and "towers" has weight 4 in biblio N
+            # biblio N has ranking = 6
+            $count_ranking{$biblionumber} += $ranking;
+        }
+        # build the result by "inverting" the count_ranking hash
+        # hint : as usual, we don't order by ranking only, to avoid having only 1 result for each rank. We build a hash on concat(ranking,biblionumber) instead
+#         warn "counting";
+        foreach (keys %count_ranking) {
+            $result{sprintf("%10d",$count_ranking{$_}).'-'.$_} = $_;
+        }
+        # sort the hash and return the same structure as GetRecords (Zebra querying)
+        my $result_hash;
+        my $numbers=0;
+            foreach my $key (sort {$b cmp $a} (keys %result)) {
+                $result_hash->{'RECORDS'}[$numbers++] = $result{$key};
+            }
+        # limit the $results_per_page to result size if it's more
+        $results_per_page = $numbers-1 if $numbers < $results_per_page;
+        # for the requested page, replace biblionumber by the complete record
+        # speed improvement : avoid reading too much things
+        for (my $counter=$offset;$counter<=$offset+$results_per_page;$counter++) {
+            $result_hash->{'RECORDS'}[$counter] = GetMarcBiblio($result_hash->{'RECORDS'}[$counter])->as_usmarc;
+        }
+        my $finalresult=();
+        $result_hash->{'hits'} = $numbers;
+        $finalresult->{'biblioserver'} = $result_hash;
+        return $finalresult;
+    }
+}
+=head2 ModBiblios
+
+($countchanged,$listunchanged) = ModBiblios($listbiblios, $tagsubfield,$initvalue,$targetvalue,$test);
+
+This function replaces every value matching $initvalue in subfield $tag$subfield of each record in $listbiblios.
+If the $test parameter is set, the changes are not written to the database.
+
+=over 2
+
+=item C<input arg:>
+
+    * $listbiblios is an array ref to marcrecords to be changed
+    * $tagsubfield is the reference of the subfield to change.
+    * $initvalue is the value to search the record for
+    * $targetvalue is the value to set the subfield to
+    * $test, when set, prevents the changes from being written to the database.
+
+=item C<Output arg:>
+    * $countchanged counts all the changes performed.
+    * $listunchanged contains the list of all the biblionumbers of records unchanged.
+
+=item C<usage in the script:>
  
  =back
  
+my ($countchanged, $listunchanged) = ModBiblios($results->{RECORD}, $tagsubfield,$initvalue,$targetvalue);
+#To display the unchanged records, fetch the biblio for each biblionumber in @$listunchanged
+$template->param(countchanged => $countchanged, loopunchanged=>$listunchanged);
+
+=cut
+
+# ModBiblios - replace (or remove) a value in a given MARC tag/subfield across
+# a list of records.
+#
+# Parameters:
+#   $listbiblios - array ref; each entry is either a USMARC blob or, when it
+#                  cannot be decoded as USMARC, an identifier: an itemnumber
+#                  if the requested tag is the item tag, a biblionumber otherwise.
+#   $tagsubfield - tag optionally followed by one subfield code (e.g. "200f").
+#   $initvalue   - value to look for; it is interpolated as a regular expression.
+#   $targetvalue - replacement value; when empty, a matching subfield is only
+#                  deleted.
+#   $test        - when true, nothing is written to the database.
+#
+# Returns ($countmatched, \@unmatched): the number of changes performed and an
+# array ref of the biblionumbers of the records left unchanged.
+sub ModBiblios{
+  my ($listbiblios,$tagsubfield,$initvalue,$targetvalue,$test)=@_;
+  my $countmatched=0;
+  my @unmatched;
+  # "my ... if ..." has undefined behaviour in Perl: declare first, assign after.
+  my ($tag,$subfield);
+  if (defined $tagsubfield && $tagsubfield=~/^(\d{1,3})([a-z0-9A-Z@])?$/){
+    ($tag,$subfield)=($1,$2);
+  }
+  # a short tag followed by a digit is really a longer tag, not tag + subfield
+  if (defined $tag && length($tag)<3 && defined $subfield && $subfield=~/^[0-9]$/){
+    $tag=$tag.$subfield;
+    undef $subfield;
+  }
+  # "0" is a valid subfield code and a valid target value, so test for
+  # definedness/length rather than plain truth
+  my $has_subfield=(defined $subfield && length $subfield);
+  my $has_target=(defined $targetvalue && length $targetvalue);
+  # compile the search pattern once instead of once per field
+  my $match=qr($initvalue);
+  my ($bntag,$bnsubf) = GetMarcFromKohaField('biblio.biblionumber');
+  my ($itemtag) = GetMarcFromKohaField('items.itemnumber');
+  foreach my $usmarc (@$listbiblios){
+    my $record=eval{MARC::Record->new_from_usmarc($usmarc)};
+    my $decode_error=$@;    # capture immediately, $@ is a global
+    my $biblionumber;
+    if ($decode_error || !$record){
+      # not a valid usmarc: it may be an itemnumber or a biblionumber
+      if (defined $tag && defined $itemtag && $tag eq $itemtag){
+        my $bib=GetBiblioFromItemNumber($usmarc);
+        $biblionumber=$bib->{'biblionumber'};
+        $record=GetMarcItem($biblionumber,$usmarc);
+      } else {
+        $biblionumber=$usmarc;
+        $record=GetMarcBiblio($usmarc);
+      }
+    } elsif (defined $bntag && $bntag >= 10){
+      # decimal 10, not 010 (octal 8): tags 001-009 are control fields
+      $biblionumber=$record->subfield($bntag,$bnsubf);
+    } else {
+      my $bnfield=defined $bntag ? $record->field($bntag) : undef;
+      $biblionumber=$bnfield->data if $bnfield;
+    }
+    #GetBiblionumber is to be written.
+    #Could be replaced by TransformMarcToKoha (But Would be longer)
+    unless ($record && defined $tag && $record->field($tag)){
+      # record could not be loaded, or it does not contain the requested tag
+      push @unmatched, $biblionumber;
+      next;
+    }
+    my $modify=0;
+    foreach my $field ($record->field($tag)){
+      if ($has_subfield){
+        if ($field->delete_subfield('code'=>$subfield,'match'=>$match)){
+          $countmatched++;
+          $modify=1;
+          $field->update($subfield,$targetvalue) if ($has_target);
+        }
+      } elsif ($tag >= 10){
+        # no subfield requested on a data field: the whole field is removed.
+        # delete_field is a MARC::Record method, not a MARC::Field one.
+        if ($record->delete_field($field)){
+          $countmatched++;
+          $modify=1;
+        }
+      } elsif ($field->data=~$match){
+        # control field: data() is not assignable, update() takes the new data
+        $field->update(defined $targetvalue ? $targetvalue : '');
+        $countmatched++;
+        $modify=1;
+      }
+    }
+#       warn $record->as_formatted;
+    if ($modify){
+      # NOTE(review): when the tag is the item tag, $record comes from
+      # GetMarcItem and is still saved through ModBiblio - confirm this is intended
+      ModBiblio($record,$biblionumber,GetFrameworkCode($biblionumber)) unless ($test);
+    } else {
+      push @unmatched, $biblionumber;
+    }
+  }
+  return ($countmatched,\@unmatched);
+}
+
+END { }    # intentionally empty placeholder: module clean-up code goes here (global destructor)
+
+1;    # a Perl module must end with a true value so that use/require succeeds
+__END__
+
  =head1 AUTHOR
  
  Koha Development team <info@koha.org>
  
  =cut
-