3 # This file is part of Koha.
5 # Koha is free software; you can redistribute it and/or modify it under the
6 # terms of the GNU General Public License as published by the Free Software
7 # Foundation; either version 2 of the License, or (at your option) any later
10 # Koha is distributed in the hope that it will be useful, but WITHOUT ANY
11 # WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR
12 # A PARTICULAR PURPOSE. See the GNU General Public License for more details.
14 # You should have received a copy of the GNU General Public License along with
15 # Koha; if not, write to the Free Software Foundation, Inc., 59 Temple Place,
16 # Suite 330, Boston, MA 02111-1307 USA
19 #use warnings; FIXME - Bug 2505
22 use C4::Biblio; # GetMarcFromKohaField, GetBiblioData
23 use C4::Koha; # getFacets
25 use C4::Search::PazPar2;
27 use C4::Dates qw(format_date);
28 use C4::Members qw(GetHideLostItemsPreference);
31 use C4::Reserves; # CheckReserves
39 use vars qw($VERSION @ISA @EXPORT @EXPORT_OK %EXPORT_TAGS $DEBUG);
41 # set the version for version checking
44 $DEBUG = ($ENV{DEBUG}) ? 1 : 0;
49 C4::Search - Functions for searching the Koha catalog.
53 See opac/opac-search.pl or catalogue/search.pl for example of usage
57 This module provides searching functions for Koha's bibliographic databases
74 &enabled_staff_search_views
76 #FIXME: i had to add BiblioAddAuthorities here because in Biblios.pm it caused circular dependencies (C4::Search uses C4::Biblio, and BiblioAddAuthorities uses SimpleSearch from C4::Search)
78 # make all your functions, whether exported or not;
82 ($biblionumber,$biblionumber,$title) = FindDuplicate($record);
84 This function attempts to find duplicate records using a hard-coded, fairly simplistic algorithm
# FindDuplicate: look for catalogue records that may duplicate the MARC record
# passed in. A CCL query is built from the record's ISBN or from its title
# (plus itemtype and author when present), run through SimpleSearch, and the
# biblionumber and title of every hit are pushed onto @results.
90 my $dbh = C4::Context->dbh;
# $result is used below as a hashref keyed by Koha field name (isbn, title, itemtype, author).
91 my $result = TransformMarcToKoha( $dbh, $record, '' );
96 my ( $biblionumber, $title );
98 # search duplicate on ISBN, easy and fast..
100 if ( $result->{isbn} ) {
# Drop everything from the first "(" onward, then any trailing whitespace.
101 $result->{isbn} =~ s/\(.*$//;
102 $result->{isbn} =~ s/\s+$//;
103 $query = "isbn=$result->{isbn}";
# Title-based query; presumably the fallback branch when no ISBN is present -- TODO confirm.
# Backslashes, double quotes and parentheses are stripped from the title before it is used in the query.
106 $result->{title} =~ s /\\//g;
107 $result->{title} =~ s /\"//g;
108 $result->{title} =~ s /\(//g;
109 $result->{title} =~ s /\)//g;
111 # FIXME: instead of removing operators, could just do
112 # quotes around the value
# NOTE(review): this pattern has no word boundaries, so the letter sequences
# "and", "or" and "not" are also removed from inside longer words.
113 $result->{title} =~ s/(and|or|not)//g;
114 $query = "ti,ext=$result->{title}";
115 $query .= " and itemtype=$result->{itemtype}"
116 if ( $result->{itemtype} );
117 if ( $result->{author} ) {
# Same clean-up as for the title.
118 $result->{author} =~ s /\\//g;
119 $result->{author} =~ s /\"//g;
120 $result->{author} =~ s /\(//g;
121 $result->{author} =~ s /\)//g;
123 # remove valid operators
# NOTE(review): same unanchored pattern as for the title above.
124 $result->{author} =~ s/(and|or|not)//g;
125 $query .= " and au,ext=$result->{author}";
# Run the query with SimpleSearch's defaults; the hit count (third return value) is discarded.
129 my ( $error, $searchresults, undef ) = SimpleSearch($query); # FIXME :: hardcoded !
# Only walk the hits when the search itself did not report an error.
131 if (!defined $error) {
132 foreach my $possible_duplicate_record (@{$searchresults}) {
# Each hit is decoded from USMARC; presumably the result is assigned to $marcrecord -- TODO confirm.
134 MARC::Record->new_from_usmarc($possible_duplicate_record);
135 my $result = TransformMarcToKoha( $dbh, $marcrecord, '' );
137 # FIXME :: why 2 $biblionumber ?
# @results is a flat list: biblionumber, title, biblionumber, title, ...
139 push @results, $result->{'biblionumber'};
140 push @results, $result->{'title'};
149 ( $error, $results, $total_hits ) = SimpleSearch( $query, $offset, $max_results, [@servers] );
151 This function provides a simple search API on the bibliographic catalog
157 * $query can be a simple keyword or a complete CCL query
158 * @servers is optional. Defaults to biblioserver as found in koha-conf.xml
159 * $offset - If present, represents the number of records at the beginning to omit. Defaults to 0
160 * $max_results - if present, determines the maximum number of records to fetch. undef is All. defaults to undef.
165 Returns an array consisting of three elements
166 * $error is undefined unless an error is detected
167 * $results is a reference to an array of records.
168 * $total_hits is the number of hits that would have been returned with no limit
170 If an error is returned the two other return elements are undefined. If error itself is undefined
171 the other two elements are always defined
173 =item C<usage in the script:>
177 my ( $error, $marcresults, $total_hits ) = SimpleSearch($query);
179 if (defined $error) {
180 $template->param(query_error => $error);
181 warn "error: ".$error;
182 output_html_with_http_headers $input, $cookie, $template->output;
186 my $hits = @{$marcresults};
189 for my $r ( @{$marcresults} ) {
190 my $marcrecord = MARC::File::USMARC::decode($r);
191 my $biblio = TransformMarcToKoha(C4::Context->dbh,$marcrecord,q{});
193 #build the array of hashes for the template.
195 title => $biblio->{'title'},
196 subtitle => $biblio->{'subtitle'},
197 biblionumber => $biblio->{'biblionumber'},
198 author => $biblio->{'author'},
199 publishercode => $biblio->{'publishercode'},
200 publicationyear => $biblio->{'publicationyear'},
205 $template->param(result=>\@results);
# SimpleSearch: run $query on each server and return ( $error, $results, $total_hits ).
#   $query       - the search string; it is compiled with ZOOM::Query::CCL2RPN below
#   $offset      - number of leading records to skip (optional)
#   $max_results - maximum number of records to fetch per server (optional)
#   $servers     - array ref of server names; defaults to ( 'biblioserver' )
# On failure the first element is an error string and the other two are undef.
210 my ( $query, $offset, $max_results, $servers ) = @_;
# NoZebra installations: the search is delegated to NZanalyse/NZorder and only
# the 'biblioserver' result set is used.
212 if ( C4::Context->preference('NoZebra') ) {
213 my $result = NZorder( NZanalyse($query) )->{'biblioserver'};
216 && $result->{hits} > 0 ? $result->{'RECORDS'} : [] );
217 return ( undef, $search_result, scalar($result->{hits}) );
# An empty (or otherwise false) query is reported as an error rather than searched.
220 return ( 'No query entered', undef, undef ) unless $query;
221 # FIXME hardcoded value. See catalog/search.pl & opac-search.pl too.
222 my @servers = defined ( $servers ) ? @$servers : ( 'biblioserver' );
229 # Initialize & Search Zebra
# One connection, one compiled query and one result set per server, kept in
# parallel arrays indexed by $i.
230 for ( my $i = 0 ; $i < @servers ; $i++ ) {
232 $zconns[$i] = C4::Context->Zconn( $servers[$i], 1 );
233 $zoom_queries[$i] = new ZOOM::Query::CCL2RPN( $query, $zconns[$i]);
234 $tmpresults[$i] = $zconns[$i]->search( $zoom_queries[$i] );
238 $zconns[$i]->errmsg() . " ("
239 . $zconns[$i]->errcode() . ") "
240 . $zconns[$i]->addinfo() . " "
241 . $zconns[$i]->diagset();
# A non-zero error code on the connection aborts the whole search.
243 return ( $error, undef, undef ) if $zconns[$i]->errcode();
247 # caught a ZOOM::Exception
251 . $@->addinfo() . " "
254 return ( $error, undef, undef );
# Event loop: the value returned by ZOOM::event is used as a 1-based index
# into @zconns, hence the "$i - 1" below; 0 ends the loop.
257 while ( ( my $i = ZOOM::event( \@zconns ) ) != 0 ) {
258 my $event = $zconns[ $i - 1 ]->last_event();
259 if ( $event == ZOOM::Event::ZEND ) {
# $first_record and $last_record are 1-based and inclusive.
261 my $first_record = defined( $offset ) ? $offset+1 : 1;
262 my $hits = $tmpresults[ $i - 1 ]->size();
263 $total_hits += $hits;
264 my $last_record = $hits;
# NOTE(review): when $max_results is given without $offset, $offset is undef
# here and counts as 0 in the arithmetic.
265 if ( defined $max_results && $offset + $max_results < $hits ) {
266 $last_record = $offset + $max_results;
# The range is empty when $first_record exceeds $last_record, so nothing is fetched.
269 for my $j ( $first_record..$last_record ) {
270 my $record = $tmpresults[ $i - 1 ]->record( $j-1 )->raw(); # 0 indexed
271 push @{$results}, $record;
# Clean-up of the per-server result sets and compiled queries.
276 foreach my $result (@tmpresults) {
279 foreach my $zoom_query (@zoom_queries) {
280 $zoom_query->destroy();
283 return ( undef, $results, $total_hits );
289 ( undef, $results_hashref, \@facets_loop ) = getRecords (
291 $koha_query, $simple_query, $sort_by_ref, $servers_ref,
292 $results_per_page, $offset, $expanded_facet, $branches,
296 The all singing, all dancing, multi-server, asynchronous, scanning,
297 searching, record nabbing, facet-building
299 See verbose embedded documentation.
# getRecords: run a search (or an index scan) on every server in $servers_ref,
# collect one page of raw records per server into $results_hashref, and build
# the facet list from the biblioserver's result set.
# Returns ( undef, $results_hashref, \@facets_loop ).
305 $koha_query, $simple_query, $sort_by_ref, $servers_ref,
306 $results_per_page, $offset, $expanded_facet, $branches,
310 my @servers = @$servers_ref;
311 my @sort_by = @$sort_by_ref;
313 # Initialize variables for the ZOOM connection and results object
317 my $results_hashref = ();
319 # Initialize variables for the faceted results objects
320 my $facets_counter = ();
321 my $facets_info = ();
322 my $facets = getFacets();
# At most this many records are inspected when counting facet values (default 20).
323 my $facets_maxrecs = C4::Context->preference('maxRecordsForFacets')||20;
325 my @facets_loop; # stores the ref to array of hashes for template facets loop
327 ### LOOP THROUGH THE SERVERS
328 for ( my $i = 0 ; $i < @servers ; $i++ ) {
329 $zconns[$i] = C4::Context->Zconn( $servers[$i], 1 );
331 # perform the search, create the results objects
332 # if this is a local search, use the $koha-query, if it's a federated one, use the federated-query
333 my $query_to_use = ($servers[$i] =~ /biblioserver/) ? $koha_query : $simple_query;
335 #$query_to_use = $simple_query if $scan;
336 warn $simple_query if ( $scan and $DEBUG );
338 # Check if we've got a query_type defined, if so, use it
# $query_type selects the ZOOM query class by prefix: ccl, cql or pqf.
341 if ($query_type =~ /^ccl/) {
342 $query_to_use =~ s/\:/\=/g; # change : to = last minute (FIXME)
343 $results[$i] = $zconns[$i]->search(new ZOOM::Query::CCL2RPN($query_to_use, $zconns[$i]));
344 } elsif ($query_type =~ /^cql/) {
345 $results[$i] = $zconns[$i]->search(new ZOOM::Query::CQL($query_to_use, $zconns[$i]));
346 } elsif ($query_type =~ /^pqf/) {
347 $results[$i] = $zconns[$i]->search(new ZOOM::Query::PQF($query_to_use, $zconns[$i]));
349 warn "Unknown query_type '$query_type'. Results undetermined.";
# Without a query_type the query goes through CCL2RPN, either as an index
# scan or as a plain search; presumably chosen by $scan -- TODO confirm.
352 $results[$i] = $zconns[$i]->scan( new ZOOM::Query::CCL2RPN($query_to_use, $zconns[$i]));
354 $results[$i] = $zconns[$i]->search(new ZOOM::Query::CCL2RPN($query_to_use, $zconns[$i]));
358 warn "WARNING: query problem with $query_to_use " . $@;
361 # Concatenate the sort_by limits and pass them to the results object
362 # Note: sort will override rank
# Each recognised sort keyword appends a "1=<attribute> <i" or "1=<attribute> >i"
# fragment to $sort_by.
364 foreach my $sort (@sort_by) {
365 if ( $sort eq "author_az" || $sort eq "author_asc" ) {
366 $sort_by .= "1=1003 <i ";
368 elsif ( $sort eq "author_za" || $sort eq "author_dsc" ) {
369 $sort_by .= "1=1003 >i ";
371 elsif ( $sort eq "popularity_asc" ) {
372 $sort_by .= "1=9003 <i ";
374 elsif ( $sort eq "popularity_dsc" ) {
375 $sort_by .= "1=9003 >i ";
377 elsif ( $sort eq "call_number_asc" ) {
378 $sort_by .= "1=8007 <i ";
380 elsif ( $sort eq "call_number_dsc" ) {
381 $sort_by .= "1=8007 >i ";
383 elsif ( $sort eq "pubdate_asc" ) {
384 $sort_by .= "1=31 <i ";
386 elsif ( $sort eq "pubdate_dsc" ) {
387 $sort_by .= "1=31 >i ";
389 elsif ( $sort eq "acqdate_asc" ) {
390 $sort_by .= "1=32 <i ";
392 elsif ( $sort eq "acqdate_dsc" ) {
393 $sort_by .= "1=32 >i ";
395 elsif ( $sort eq "title_az" || $sort eq "title_asc" ) {
396 $sort_by .= "1=4 <i ";
398 elsif ( $sort eq "title_za" || $sort eq "title_dsc" ) {
399 $sort_by .= "1=4 >i ";
# NOTE(review): the warning is conditional on $sort_by already holding
# something, so an unrecognised keyword that comes first is ignored silently.
402 warn "Ignoring unrecognized sort '$sort' requested" if $sort_by;
# Sorting is applied only to searches, never to index scans.
405 if ($sort_by && !$scan) {
406 if ( $results[$i]->sort( "yaz", $sort_by ) < 0 ) {
407 warn "WARNING sort $sort_by failed";
410 } # finished looping through servers
412 # The big moment: asynchronously retrieve results from all servers
# The value returned by ZOOM::event is used as a 1-based index into @zconns
# and @results (hence "$i - 1"); 0 ends the loop.
413 while ( ( my $i = ZOOM::event( \@zconns ) ) != 0 ) {
414 my $ev = $zconns[ $i - 1 ]->last_event();
415 if ( $ev == ZOOM::Event::ZEND ) {
416 next unless $results[ $i - 1 ];
417 my $size = $results[ $i - 1 ]->size();
421 # loop through the results
422 $results_hash->{'hits'} = $size;
# $times is the exclusive upper bound of the page; the branch that handles a
# short final page is not visible here -- presumably it caps $times at $size.
424 if ( $offset + $results_per_page <= $size ) {
425 $times = $offset + $results_per_page;
# RECORDS is indexed by absolute position $j, so slots below $offset are not filled in by this loop.
430 for ( my $j = $offset ; $j < $times ; $j++ ) {
434 ## Check if it's an index scan
436 my ( $term, $occ ) = $results[ $i - 1 ]->term($j);
438 # here we create a minimal MARC record and hand it off to the
439 # template just like a normal result ... perhaps not ideal, but
441 my $tmprecord = MARC::Record->new();
442 $tmprecord->encoding('UTF-8');
446 # the minimal record in author/title (depending on MARC flavour)
# UNIMARC: term and occurrence count both go into field 200 ($a and $f).
# Otherwise: the term goes into 245$a and the count into 100$a.
447 if (C4::Context->preference("marcflavour") eq "UNIMARC") {
448 $tmptitle = MARC::Field->new('200',' ',' ', a => $term, f => $occ);
449 $tmprecord->append_fields($tmptitle);
451 $tmptitle = MARC::Field->new('245',' ',' ', a => $term,);
452 $tmpauthor = MARC::Field->new('100',' ',' ', a => $occ,);
453 $tmprecord->append_fields($tmptitle);
454 $tmprecord->append_fields($tmpauthor);
456 $results_hash->{'RECORDS'}[$j] = $tmprecord->as_usmarc();
# Not a scan: store the raw record as returned by the server.
461 $record = $results[ $i - 1 ]->record($j)->raw();
463 # warn "RECORD $j:".$record;
464 $results_hash->{'RECORDS'}[$j] = $record;
468 $results_hashref->{ $servers[ $i - 1 ] } = $results_hash;
470 # Fill the facets while we're looping, but only for the biblioserver and not for a scan
471 if ( !$scan && $servers[ $i - 1 ] =~ /biblioserver/ ) {
# Facets are counted over the first $jmax records of the result set (from
# record 0), independently of the page selected by $offset.
473 my $jmax = $size>$facets_maxrecs? $facets_maxrecs: $size;
# NOTE(review): "<=" runs one index past the end of @$facets; the "or next"
# guard on the following line skips that undefined element.
475 for ( my $k = 0 ; $k <= @$facets ; $k++ ) {
476 ($facets->[$k]) or next;
477 my @fcodes = @{$facets->[$k]->{'tags'}};
478 my $sfcode = $facets->[$k]->{'subfield'};
480 for ( my $j = 0 ; $j < $jmax ; $j++ ) {
481 my $render_record = $results[ $i - 1 ]->record($j)->render();
# The rendered record is parsed as text: a line starting with the tag gives
# the field, and "$<code> value" runs within it give the subfield values.
484 foreach my $fcode (@fcodes) {
487 my $field_pattern = '\n'.$fcode.' ([^\n]+)';
488 my @field_tokens = ( $render_record =~ /$field_pattern/g ) ;
490 foreach my $field_token (@field_tokens) {
491 my $subfield_pattern = '\$'.$sfcode.' ([^\$]+)';
492 my @subfield_values = ( $field_token =~ /$subfield_pattern/g );
494 foreach my $subfield_value (@subfield_values) {
496 my $data = $subfield_value;
497 $data =~ s/^\s+//; # trim left
498 $data =~ s/\s+$//; # trim right
# A value is counted only if it is not already in @used_datas; where that
# list is reset is not visible here -- presumably once per record.
# NOTE(review): smartmatch (~~) is experimental/deprecated in newer Perls.
500 unless ( $data ~~ @used_datas ) {
501 $facets_counter->{ $facets->[$k]->{'link_value'} }->{$data}++;
502 push @used_datas, $data;
509 $facets_info->{ $facets->[$k]->{'link_value'} }->{'label_value'} = $facets->[$k]->{'label_value'};
510 $facets_info->{ $facets->[$k]->{'link_value'} }->{'expanded'} = $facets->[$k]->{'expanded'};
516 # warn "connection ", $i-1, ": $size hits";
517 # warn $results[$i-1]->record(0)->render() if $size > 0;
# Turn the counters into the structure returned as \@facets_loop.
520 if ( $servers[ $i - 1 ] =~ /biblioserver/ ) {
# NOTE(review): the values of %$facets_counter are hash refs (see the ++
# above), so this numeric comparison orders facet types by reference address.
522 sort { $facets_counter->{$b} <=> $facets_counter->{$a} }
523 keys %$facets_counter )
526 my $number_of_facets;
527 my @this_facets_array;
# Values of one facet type, most frequent first.
530 $facets_counter->{$link_value}->{$b}
531 <=> $facets_counter->{$link_value}->{$a}
532 } keys %{ $facets_counter->{$link_value} }
# A value is listed while $number_of_facets is below 6, or unconditionally
# when this facet type is the expanded one or is flagged 'expanded'.
536 if ( ( $number_of_facets < 6 )
537 || ( $expanded_facet eq $link_value )
538 || ( $facets_info->{$link_value}->{'expanded'} ) )
541 # Sanitize the link value ), ( will cause errors with CCL,
542 my $facet_link_value = $one_facet;
543 $facet_link_value =~ s/(\(|\))/ /g;
545 # fix the length that will display in the label,
546 my $facet_label_value = $one_facet;
547 my $facet_max_length =
548 C4::Context->preference('FacetLabelTruncationLength') || 20;
550 substr( $one_facet, 0, $facet_max_length ) . "..."
551 if length($facet_label_value) > $facet_max_length;
553 # if it's a branch, label by the name, not the code,
554 if ( $link_value =~ /branch/ ) {
555 if (defined $branches
556 && ref($branches) eq "HASH"
557 && defined $branches->{$one_facet}
558 && ref ($branches->{$one_facet}) eq "HASH")
561 $branches->{$one_facet}->{'branchname'};
# Presumably the fallback label when the branch code is not in $branches -- TODO confirm.
564 $facet_label_value = "*";
568 # but we're down with the whole label being in the link's title.
569 push @this_facets_array, {
570 facet_count => $facets_counter->{$link_value}->{$one_facet},
571 facet_label_value => $facet_label_value,
572 facet_title_value => $one_facet,
573 facet_link_value => $facet_link_value,
574 type_link_value => $link_value,
579 # handle expanded option
580 unless ( $facets_info->{$link_value}->{'expanded'} ) {
582 if ( ( $number_of_facets > 6 )
583 && ( $expanded_facet ne $link_value ) );
586 type_link_value => $link_value,
587 type_id => $link_value . "_id",
588 "type_label_" . $facets_info->{$link_value}->{'label_value'} => 1,
589 facets => \@this_facets_array,
590 expandable => $expandable,
591 expand => $link_value,
# The facet whose label matches /Libraries/ is left out in singleBranchMode.
592 } unless ( ($facets_info->{$link_value}->{'label_value'} =~ /Libraries/) and (C4::Context->preference('singleBranchMode')) );
597 return ( undef, $results_hashref, \@facets_loop );
# pazGetRecords: grouped search through a PazPar2 service. Takes the same
# leading arguments as getRecords, but only $simple_query, $offset and
# $results_per_page are used in the visible code.
# Returns ( undef, $results_hashref, \@facets_loop ); the hits are stored as
# groups under $results_hashref->{'biblioserver'}->{'GROUPS'}.
602 $koha_query, $simple_query, $sort_by_ref, $servers_ref,
603 $results_per_page, $offset, $expanded_facet, $branches,
607 my $paz = C4::Search::PazPar2->new(C4::Context->config('pazpar2url'));
609 $paz->search($simple_query);
610 sleep 1; # FIXME: WHY?
613 my $results_hashref = {};
# Both responses are parsed with XMLin; forcearray makes every element of the
# "show" response an array ref, hence the ->[0] accesses below.
614 my $stats = XMLin($paz->stat);
615 my $results = XMLin($paz->show($offset, $results_per_page, 'work-title:1'), forcearray => 1);
617 # for a grouped search result, the number of hits
618 # is the number of groups returned; 'bib_hits' will have
619 # the total number of bibs.
620 $results_hashref->{'biblioserver'}->{'hits'} = $results->{'merged'}->[0];
621 $results_hashref->{'biblioserver'}->{'bib_hits'} = $stats->{'hits'};
# One result group per <hit> element.
623 HIT: foreach my $hit (@{ $results->{'hit'} }) {
624 my $recid = $hit->{recid}->[0];
626 my $work_title = $hit->{'md-work-title'}->[0];
628 if (exists $hit->{'md-work-author'}) {
629 $work_author = $hit->{'md-work-author'}->[0];
# Label is "title / author" when an author is available, otherwise the title alone.
631 my $group_label = (defined $work_author) ? "$work_title / $work_author" : $work_title;
633 my $result_group = {};
634 $result_group->{'group_label'} = $group_label;
635 $result_group->{'group_merge_key'} = $recid;
# $count comes from the hit's <count> element when it has one; its initial
# value is not visible here.
638 if (exists $hit->{count}) {
639 $count = $hit->{count}->[0];
641 $result_group->{'group_count'} = $count;
# Fetch every record of the group individually, by record id and position.
643 for (my $i = 0; $i < $count; $i++) {
644 # FIXME -- may need to worry about diacritics here
645 my $rec = $paz->record($recid, $i);
646 push @{ $result_group->{'RECORDS'} }, $rec;
649 push @{ $results_hashref->{'biblioserver'}->{'GROUPS'} }, $result_group;
652 # pass through facets
# The author/subject term list is fetched and parsed, but the code that would
# copy it into @facets_loop is commented out in the visible lines.
653 my $termlist_xml = $paz->termlist('author,subject');
654 my $terms = XMLin($termlist_xml, forcearray => 1);
655 my @facets_loop = ();
656 #die Dumper($results);
657 # foreach my $list (sort keys %{ $terms->{'list'} }) {
659 # foreach my $facet (sort @{ $terms->{'list'}->{$list}->{'term'} } ) {
661 # facet_label_value => $facet->{'name'}->[0],
664 # push @facets_loop, ( {
665 # type_label => $list,
666 # facets => \@facets,
670 return ( undef, $results_hashref, \@facets_loop );
# Remove stopwords from a search operand.
#
# Parameters:
#   $operand - the search terms
#   $index   - the index qualifier the operand is searched in (may be undef)
#
# Returns a two-element list: the operand with every removed stopword (and the
# delimiters around it) replaced by a single space, and a reference to an
# array of the stopwords that were removed.
#
# Operands for phrase- or exact-qualified indexes are returned untouched, and
# the boolean operators and/or/not are never treated as stopwords.
sub _remove_stopwords {
    my ( $operand, $index ) = @_;
    my @stopwords_removed;

    # phrase and exact-qualified indexes shouldn't have stopwords removed
    return ( $operand, \@stopwords_removed )
      if defined $index && $index =~ m/phr|ext/;

    # A stopword only counts when it is delimited by something that is not a
    # Unicode alphanumeric. We use the Unicode definition to deal correctly
    # with diacritics: otherwise a French word like "leçon" would be split
    # into "le" and "çon"; "le" is a stopword, we'd be left with "çon" and
    # wouldn't find anything...
    my $delimiter = qr/[^\p{IsAlnum}]/;

    foreach my $stopword ( keys %{ C4::Context->stopwords } ) {
        next unless length $stopword;

        # don't remove operators; whole-word test, so that e.g. "for" is not
        # mistaken for "or"
        next if $stopword =~ /\A(?:and|or|not)\z/i;

        # Remove every delimited occurrence in one pass. As before, at least
        # one adjacent delimiter is required, so an operand consisting of
        # nothing but the stopword is left alone.
        my $quoted  = quotemeta $stopword;
        my $removed = ( $operand =~
              s/(?:$delimiter$quoted(?:$delimiter|\z)|\A$quoted$delimiter)/ /gi );
        push @stopwords_removed, $stopword if $removed;
    }
    return ( $operand, \@stopwords_removed );
}
# Sort the words of an operand into buckets according to where they carry the
# truncation wildcard "*".
#
# Parameters:
#   $operand - the search terms, separated by whitespace
#   $index   - accepted for symmetry with the other helpers; not used here
#
# Returns five array references, in this order:
#   words without any "*",
#   right-truncated words   ("foo*",  stored as "foo"),
#   left-truncated words    ("*foo",  stored as "foo"),
#   words truncated on both sides ("*foo*", stored as "foo"),
#   words with "*" anywhere else (stored unchanged).
sub _detect_truncation {
    my ( $operand, $index ) = @_;
    my ( @nontruncated, @righttruncated, @lefttruncated,
        @rightlefttruncated, @regexpr );

    $operand = q{} unless defined $operand;

    # split ' ' skips leading whitespace and treats runs of whitespace as one
    # separator, so no empty "words" end up in the non-truncated bucket.
    foreach my $word ( split ' ', $operand ) {
        if ( $word =~ s/^\*([^\*]+)\*$/$1/ ) {
            push @rightlefttruncated, $word;
        }
        elsif ( $word =~ s/^\*([^\*]+)$/$1/ ) {
            push @lefttruncated, $word;
        }
        elsif ( $word =~ s/^([^\*]+)\*$/$1/ ) {
            push @righttruncated, $word;
        }
        elsif ( index( $word, "*" ) < 0 ) {
            push @nontruncated, $word;
        }
        else {
            push @regexpr, $word;
        }
    }
    return (
        \@nontruncated,       \@righttruncated, \@lefttruncated,
        \@rightlefttruncated, \@regexpr
    );
}
# Build the stemmed form of an operand.
#
# Parameters:
#   $operand - the search terms, separated by single spaces
#   $lang    - language code handed to Lingua::Stem::Snowball
#
# Returns the operand unchanged when it contains a digit; otherwise a string
# in which every word is replaced by its stem, followed by "?" (unless the
# stem is one of the operators and/or/not or is shorter than three
# characters) and a space.
sub _build_stemmed_operand {
    my ( $operand, $lang ) = @_;

    # If operand contains a digit, it is almost certainly an identifier, and should
    # not be stemmed. This is particularly relevant for ISBNs and ISSNs, which
    # can contain the letter "X" - for example, _build_stemmed_operand would reduce
    # "014100018X" to "x ", which for a MARC21 database would bring up irrelevant
    # results (e.g., "23 x 29 cm." from the 300$c). Bug 2098.
    return $operand if $operand =~ /\d/;

    # Only load the stemmer once we know it is needed.
    require Lingua::Stem::Snowball;

    # FIXME: the locale should be set based on the user's language and/or search choice
    my $stemmer = Lingua::Stem::Snowball->new(
        lang     => $lang,
        encoding => "UTF-8"
    );

    my @words = split( / /, $operand );
    my @stems = $stemmer->stem( \@words );

    my $stemmed_operand = q{};
    for my $stem (@stems) {
        $stemmed_operand .= $stem;

        # Whole-word test for the operators: a stem that merely ends in
        # "and"/"or"/"not" (e.g. "author") still gets its "?".
        $stemmed_operand .= "?"
          unless ( $stem =~ /\A(?:and|or|not)\z/ ) || ( length($stem) < 3 );
        $stemmed_operand .= " ";
    }
    warn "STEMMED OPERAND: $stemmed_operand" if $DEBUG;
    return $stemmed_operand;
}
# Wrap an operand in a ranked ("rk") CCL expression.
#
# FIELD WEIGHTING - this is largely experimental. It works reasonably well
# but would work much better with a smarter query parser.
#
# Parameters:
#   $operand         - the search terms
#   $stemmed_operand - stemmed form of the operand (may be empty)
#   $index           - index qualifier; empty or 'kw' means keyword search
#
# Returns the string "(rk=(...))" holding the clauses for that index.
sub _build_weighted_query {
    my ( $operand, $stemmed_operand, $index ) = @_;

    my $use_stemming = C4::Context->preference("QueryStemming")     || 0;
    my $use_weights  = C4::Context->preference("QueryWeightFields") || 0;    # read, but not consulted below
    my $use_fuzzy    = C4::Context->preference("QueryFuzzy")        || 0;

    my $quoted = "\"$operand\"";
    my $clauses;

    # Keyword, or, no index specified
    if ( !$index || $index eq 'kw' ) {
        my @parts = (
            "Title-cover,ext,r1=$quoted",    # exact title-cover
            "ti,ext,r2=$quoted",             # exact title
            "ti,phr,r3=$quoted",             # phrase title
        );

        # add fuzzy, word list
        push @parts, "wrdl,fuzzy,r8=$quoted" if $use_fuzzy;

        # add stemming, right truncation
        push @parts, "wrdl,right-Truncation,r9=\"$stemmed_operand\""
          if ( $use_stemming and $stemmed_operand );

        push @parts, "wrdl,r9=$quoted";
        $clauses = join ' or ', @parts;
    }

    # Barcode and authority-number searches should skip this process
    elsif ( $index eq 'bc' || $index eq 'an' ) {
        $clauses = "$index=$quoted";
    }

    # If the index already has more than one qualifier, wrap the operand
    # in quotes and pass it back (assumption is that the user knows what they
    # are doing and won't appreciate us mucking up their query)
    elsif ( $index =~ ',' ) {
        $clauses = " $index=$quoted";
    }

    #TODO: build better cases based on specific search indexes
    else {
        $clauses = join ' or ',
          " $index,ext,r1=$quoted",       # exact index
          "$index,phr,r3=$quoted",        # phrase index
          "$index,rt,wrdl,r3=$quoted";    # word list index
    }

    # "rk" specifies that we're applying rank
    return "(rk=($clauses))";
}
822 Return an array with available indexes.
# Names of the search indexes returned by getIndexes. Within this file the
# list is compared, lower-cased, against index prefixes found in a query.
844 'Author-personal-bibliography',
854 'Chronological-subdivision',
864 'Conference-name-heading',
865 'Conference-name-see',
866 'Conference-name-seealso',
871 'Corporate-name-heading',
872 'Corporate-name-see',
873 'Corporate-name-seealso',
875 'date-entered-on-file',
876 'Date-of-acquisition',
877 'Date-of-publication',
878 'Dewey-classification',
885 'Geographic-subdivision',
888 'Heading-use-main-or-added-entry',
# NOTE(review): the next entry ends with a space inside the quotes, so it can
# never equal an index name captured from a query -- looks like a typo; confirm and fix.
889 'Heading-use-series-added-entry ',
890 'Heading-use-subject-added-entry',
908 'Local-classification',
911 'Match-heading-see-from',
919 'Name-geographic-heading',
920 'Name-geographic-see',
921 'Name-geographic-seealso',
929 'Personal-name-heading',
931 'Personal-name-seealso',
938 'Record-control-number',
949 'Subject-heading-thesaurus',
950 'Subject-name-personal',
951 'Subject-subdivision',
961 'Term-genre-form-heading',
962 'Term-genre-form-see',
963 'Term-genre-form-seealso',
970 'Title-uniform-heading',
972 'Title-uniform-seealso',
982 'classification-source',
984 'coded-location-qualifier',
# NOTE(review): 'Local-classification' already appears earlier in this list; the duplicate is harmless but redundant.
995 'Local-classification',
998 'materials-specified',
1007 'replacementpricedate',
1025 $simple_query, $query_cgi,
1026 $query_desc, $limit,
1027 $limit_cgi, $limit_desc,
1028 $stopwords_removed, $query_type ) = buildQuery ( $operators, $operands, $indexes, $limits, $sort_by, $scan, $lang);
1030 Build queries and limits in CCL, CGI, Human,
1031 handle truncation, stemming, field weighting, stopwords, fuzziness, etc.
1033 See verbose embedded documentation.
1039 my ( $operators, $operands, $indexes, $limits, $sort_by, $scan, $lang) = @_;
1041 warn "---------\nEnter buildQuery\n---------" if $DEBUG;
1044 my @operators = $operators ? @$operators : ();
1045 my @indexes = $indexes ? @$indexes : ();
1046 my @operands = $operands ? @$operands : ();
1047 my @limits = $limits ? @$limits : ();
1048 my @sort_by = $sort_by ? @$sort_by : ();
1050 my $stemming = C4::Context->preference("QueryStemming") || 0;
1051 my $auto_truncation = C4::Context->preference("QueryAutoTruncate") || 0;
1052 my $weight_fields = C4::Context->preference("QueryWeightFields") || 0;
1053 my $fuzzy_enabled = C4::Context->preference("QueryFuzzy") || 0;
1054 my $remove_stopwords = C4::Context->preference("QueryRemoveStopwords") || 0;
1056 # no stemming/weight/fuzzy in NoZebra
1057 if ( C4::Context->preference("NoZebra") ) {
1061 $auto_truncation = 0;
1064 my $query = $operands[0];
1065 my $simple_query = $operands[0];
1067 # initialize the variables we're passing back
1076 my $stopwords_removed; # flag to determine if stopwords have been removed
1079 my $cclindexes = getIndexes();
1080 if ( $query !~ /\s*ccl=/ ) {
1081 while ( !$cclq && $query =~ /(?:^|\W)([\w-]+)(,[\w-]+)*[:=]/g ) {
1083 $cclq = grep { lc($_) eq $dx } @$cclindexes;
1085 $query = "ccl=$query" if $cclq;
1088 # for handling ccl, cql, pqf queries in diagnostic mode, skip the rest of the steps
1090 if ( $query =~ /^ccl=/ ) {
1092 # This is needed otherwise ccl= and &limit won't work together, and
1093 # this happens when selecting a subject on the opac-detail page
1095 $q .= ' and '.join(' and ', @limits);
1097 return ( undef, $q, $q, "q=ccl=$q", $q, '', '', '', '', 'ccl' );
1099 if ( $query =~ /^cql=/ ) {
1100 return ( undef, $', $', "q=cql=$'", $', '', '', '', '', 'cql' );
1102 if ( $query =~ /^pqf=/ ) {
1103 return ( undef, $', $', "q=pqf=$'", $', '', '', '', '', 'pqf' );
1106 # pass nested queries directly
1107 # FIXME: need better handling of some of these variables in this case
1108 # Nested queries aren't handled well and this implementation is flawed and causes users to be
1109 # unable to search for anything containing () commenting out, will be rewritten for 3.4.0
1110 # if ( $query =~ /(\(|\))/ ) {
1112 # undef, $query, $simple_query, $query_cgi,
1113 # $query, $limit, $limit_cgi, $limit_desc,
1114 # $stopwords_removed, 'ccl'
1118 # Form-based queries are non-nested and fixed depth, so we can easily modify the incoming
1119 # query operands and indexes and add stemming, truncation, field weighting, etc.
1120 # Once we do so, we'll end up with a value in $query, just like if we had an
1121 # incoming $query from the user
1124 ; # clear it out so we can populate properly with field-weighted, stemmed, etc. query
1125 my $previous_operand
1126 ; # a flag used to keep track if there was a previous query
1127 # if there was, we can apply the current operator
1129 for ( my $i = 0 ; $i <= @operands ; $i++ ) {
1131 # COMBINE OPERANDS, INDEXES AND OPERATORS
1132 if ( $operands[$i] ) {
1133 $operands[$i]=~s/^\s+//;
1135 # A flag to determine whether or not to add the index to the query
1138 # If the user is sophisticated enough to specify an index, turn off field weighting, stemming, and stopword handling
1139 if ( $operands[$i] =~ /\w(:|=)/ || $scan ) {
1142 $remove_stopwords = 0;
1144 $operands[$i] =~ s/\?/{?}/g; # need to escape question marks
1146 my $operand = $operands[$i];
1147 my $index = $indexes[$i];
1149 # Add index-specific attributes
1150 # Date of Publication
1151 if ( $index eq 'yr' ) {
1152 $index .= ",st-numeric";
1154 $stemming = $auto_truncation = $weight_fields = $fuzzy_enabled = $remove_stopwords = 0;
1157 # Date of Acquisition
1158 elsif ( $index eq 'acqdate' ) {
1159 $index .= ",st-date-normalized";
1161 $stemming = $auto_truncation = $weight_fields = $fuzzy_enabled = $remove_stopwords = 0;
1163 # ISBN,ISSN,Standard Number, don't need special treatment
1164 elsif ( $index eq 'nb' || $index eq 'ns' ) {
1166 $stemming, $auto_truncation,
1167 $weight_fields, $fuzzy_enabled,
1169 ) = ( 0, 0, 0, 0, 0 );
1177 # Set default structure attribute (word list)
1178 my $struct_attr = q{};
1179 unless ( $indexes_set || !$index || $index =~ /(st-|phr|ext|wrdl|nb|ns)/ ) {
1180 $struct_attr = ",wrdl";
1183 # Some helpful index variants
1184 my $index_plus = $index . $struct_attr . ':';
1185 my $index_plus_comma = $index . $struct_attr . ',';
1188 if ($remove_stopwords) {
1189 ( $operand, $stopwords_removed ) =
1190 _remove_stopwords( $operand, $index );
1191 warn "OPERAND w/out STOPWORDS: >$operand<" if $DEBUG;
1192 warn "REMOVED STOPWORDS: @$stopwords_removed"
1193 if ( $stopwords_removed && $DEBUG );
1196 if ($auto_truncation){
1197 unless ( $index =~ /(st-|phr|ext)/ ) {
1198 #FIXME only valid with LTR scripts
1199 $operand=join(" ",map{
1200 (index($_,"*")>0?"$_":"$_*")
1201 }split (/\s+/,$operand));
1202 warn $operand if $DEBUG;
1207 my $truncated_operand;
1208 my( $nontruncated, $righttruncated, $lefttruncated,
1209 $rightlefttruncated, $regexpr
1210 ) = _detect_truncation( $operand, $index );
1212 "TRUNCATION: NON:>@$nontruncated< RIGHT:>@$righttruncated< LEFT:>@$lefttruncated< RIGHTLEFT:>@$rightlefttruncated< REGEX:>@$regexpr<"
1217 scalar(@$righttruncated) + scalar(@$lefttruncated) +
1218 scalar(@$rightlefttruncated) > 0 )
1221 # Don't field weight or add the index to the query, we do it here
1223 undef $weight_fields;
1224 my $previous_truncation_operand;
1225 if (scalar @$nontruncated) {
1226 $truncated_operand .= "$index_plus @$nontruncated ";
1227 $previous_truncation_operand = 1;
1229 if (scalar @$righttruncated) {
1230 $truncated_operand .= "and " if $previous_truncation_operand;
1231 $truncated_operand .= $index_plus_comma . "rtrn:@$righttruncated ";
1232 $previous_truncation_operand = 1;
1234 if (scalar @$lefttruncated) {
1235 $truncated_operand .= "and " if $previous_truncation_operand;
1236 $truncated_operand .= $index_plus_comma . "ltrn:@$lefttruncated ";
1237 $previous_truncation_operand = 1;
1239 if (scalar @$rightlefttruncated) {
1240 $truncated_operand .= "and " if $previous_truncation_operand;
1241 $truncated_operand .= $index_plus_comma . "rltrn:@$rightlefttruncated ";
1242 $previous_truncation_operand = 1;
1245 $operand = $truncated_operand if $truncated_operand;
1246 warn "TRUNCATED OPERAND: >$truncated_operand<" if $DEBUG;
1249 my $stemmed_operand;
1250 $stemmed_operand = _build_stemmed_operand($operand, $lang)
1253 warn "STEMMED OPERAND: >$stemmed_operand<" if $DEBUG;
1255 # Handle Field Weighting
1256 my $weighted_operand;
1257 if ($weight_fields) {
1258 $weighted_operand = _build_weighted_query( $operand, $stemmed_operand, $index );
1259 $operand = $weighted_operand;
1263 warn "FIELD WEIGHTED OPERAND: >$weighted_operand<" if $DEBUG;
1265 # If there's a previous operand, we need to add an operator
1266 if ($previous_operand) {
1268 # User-specified operator
1269 if ( $operators[ $i - 1 ] ) {
1270 $query .= " $operators[$i-1] ";
1271 $query .= " $index_plus " unless $indexes_set;
1272 $query .= " $operand";
1273 $query_cgi .= "&op=$operators[$i-1]";
1274 $query_cgi .= "&idx=$index" if $index;
1275 $query_cgi .= "&q=$operands[$i]" if $operands[$i];
1277 " $operators[$i-1] $index_plus $operands[$i]";
1280 # Default operator is and
1283 $query .= "$index_plus " unless $indexes_set;
1284 $query .= "$operand";
1285 $query_cgi .= "&op=and&idx=$index" if $index;
1286 $query_cgi .= "&q=$operands[$i]" if $operands[$i];
1287 $query_desc .= " and $index_plus $operands[$i]";
1291 # There isn't a previous operand, don't need an operator
1294 # Field-weighted queries already have indexes set
1295 $query .= " $index_plus " unless $indexes_set;
1297 $query_desc .= " $index_plus $operands[$i]";
1298 $query_cgi .= "&idx=$index" if $index;
1299 $query_cgi .= "&q=$operands[$i]" if $operands[$i];
1300 $previous_operand = 1;
1305 warn "QUERY BEFORE LIMITS: >$query<" if $DEBUG;
1308 my $group_OR_limits;
1309 my $availability_limit;
1310 foreach my $this_limit (@limits) {
1311 if ( $this_limit =~ /available/ ) {
1313 ## 'available' is defined as (items.onloan is NULL) and (items.itemlost = 0)
1315 ## all records not indexed in the onloan register (zebra) and all records with a value of lost equal to 0
1316 $availability_limit .=
1317 "( ( allrecords,AlwaysMatches='' not onloan,AlwaysMatches='') and (lost,st-numeric=0) )"; #or ( allrecords,AlwaysMatches='' not lost,AlwaysMatches='')) )";
1318 $limit_cgi .= "&limit=available";
1322 # group_OR_limits, prefixed by mc-
1323 # OR every member of the group
1324 elsif ( $this_limit =~ /mc/ ) {
1326 if ( $this_limit =~ /mc-ccode:/ ) {
1327 # in case the mc-ccode value has complicating chars like ()'s inside it we wrap in quotes
1328 $this_limit =~ tr/"//d;
1329 my ($k,$v) = split(/:/, $this_limit,2);
1330 $this_limit = $k.":\"".$v."\"";
1333 $group_OR_limits .= " or " if $group_OR_limits;
1334 $limit_desc .= " or " if $group_OR_limits;
1335 $group_OR_limits .= "$this_limit";
1336 $limit_cgi .= "&limit=$this_limit";
1337 $limit_desc .= " $this_limit";
1340 # Regular old limits
1342 $limit .= " and " if $limit || $query;
1343 $limit .= "$this_limit";
1344 $limit_cgi .= "&limit=$this_limit";
1345 if ($this_limit =~ /^branch:(.+)/) {
1346 my $branchcode = $1;
1347 my $branchname = GetBranchName($branchcode);
1348 if (defined $branchname) {
1349 $limit_desc .= " branch:$branchname";
1351 $limit_desc .= " $this_limit";
1354 $limit_desc .= " $this_limit";
1358 if ($group_OR_limits) {
1359 $limit .= " and " if ( $query || $limit );
1360 $limit .= "($group_OR_limits)";
1362 if ($availability_limit) {
1363 $limit .= " and " if ( $query || $limit );
1364 $limit .= "($availability_limit)";
1367 # Normalize the query and limit strings
1368 # This is flawed , means we can't search anything with : in it
1369 # if user wants to do ccl or cql, start the query with that
1370 # $query =~ s/:/=/g;
1371 $query =~ s/(?<=(ti|au|pb|su|an|kw|mc|nb|ns)):/=/g;
1372 $query =~ s/(?<=(wrdl)):/=/g;
1373 $query =~ s/(?<=(trn|phr)):/=/g;
1375 for ( $query, $query_desc, $limit, $limit_desc ) {
1376 s/ +/ /g; # remove extra spaces
1377 s/^ //g; # remove any beginning spaces
1378 s/ $//g; # remove any ending spaces
1379 s/==/=/g; # remove double == from query
1381 $query_cgi =~ s/^&//; # remove unnecessary & from beginning of the query cgi
1383 for ($query_cgi,$simple_query) {
1386 # append the limit to the query
1387 $query .= " " . $limit;
1391 warn "QUERY:" . $query;
1392 warn "QUERY CGI:" . $query_cgi;
1393 warn "QUERY DESC:" . $query_desc;
1394 warn "LIMIT:" . $limit;
1395 warn "LIMIT CGI:" . $limit_cgi;
1396 warn "LIMIT DESC:" . $limit_desc;
1397 warn "---------\nLeave buildQuery\n---------";
1400 undef, $query, $simple_query, $query_cgi,
1401 $query_desc, $limit, $limit_cgi, $limit_desc,
1402 $stopwords_removed, $query_type
1406 =head2 searchResults
1408 my @search_results = searchResults($search_context, $searchdesc, $hits,
1409 $results_per_page, $offset, $scan,
1410 \@marcresults);
1412 Format results in a form suitable for passing to the template
1416 # IMO this subroutine is pretty messy still -- it's responsible for
1417 # building the HTML output for the template
1419 my ( $search_context, $searchdesc, $hits, $results_per_page, $offset, $scan, $marcresults ) = @_;
1420 my $dbh = C4::Context->dbh;
1423 $search_context = 'opac' if !$search_context || $search_context ne 'intranet';
1424 my ($is_opac, $hidelostitems);
1425 if ($search_context eq 'opac') {
1426 $hidelostitems = C4::Context->preference('hidelostitems');
1430 #Build branchnames hash
1432 #get branch information.....
1434 my $bsth =$dbh->prepare("SELECT branchcode,branchname FROM branches"); # FIXME : use C4::Branch::GetBranches
1436 while ( my $bdata = $bsth->fetchrow_hashref ) {
1437 $branches{ $bdata->{'branchcode'} } = $bdata->{'branchname'};
1439 # FIXME - We build an authorised values hash here, using the default framework
1440 # though it is possible to have different authvals for different fws.
1442 my $shelflocations =GetKohaAuthorisedValues('items.location','');
1444 # get notforloan authorised value list (see $shelflocations FIXME)
1445 my $notforloan_authorised_value = GetAuthValCode('items.notforloan','');
1447 #Build itemtype hash
1448 #find itemtype & itemtype image
1452 "SELECT itemtype,description,imageurl,summary,notforloan FROM itemtypes"
1455 while ( my $bdata = $bsth->fetchrow_hashref ) {
1456 foreach (qw(description imageurl summary notforloan)) {
1457 $itemtypes{ $bdata->{'itemtype'} }->{$_} = $bdata->{$_};
1461 #search item field code
1464 "SELECT tagfield FROM marc_subfield_structure WHERE kohafield LIKE 'items.itemnumber'"
1467 my ($itemtag) = $sth->fetchrow;
1469 ## find column names of items related to MARC
1470 my $sth2 = $dbh->prepare("SHOW COLUMNS FROM items");
1472 my %subfieldstosearch;
1473 while ( ( my $column ) = $sth2->fetchrow ) {
1474 my ( $tagfield, $tagsubfield ) =
1475 &GetMarcFromKohaField( "items." . $column, "" );
1476 $subfieldstosearch{$column} = $tagsubfield;
1479 # handle which records to actually retrieve
1481 if ( $hits && $offset + $results_per_page <= $hits ) {
1482 $times = $offset + $results_per_page;
1485 $times = $hits; # FIXME: if $hits is undefined, why do we want to equal it?
1488 my $marcflavour = C4::Context->preference("marcflavour");
1489 # We get the biblionumber position in MARC
1490 my ($bibliotag,$bibliosubf)=GetMarcFromKohaField('biblio.biblionumber','');
1492 # loop through all of the records we've retrieved
1493 for ( my $i = $offset ; $i <= $times - 1 ; $i++ ) {
1494 my $marcrecord = MARC::File::USMARC::decode( $marcresults->[$i] );
1498 ? GetFrameworkCode($marcrecord->field($bibliotag)->data)
1499 : GetFrameworkCode($marcrecord->subfield($bibliotag,$bibliosubf));
1500 my $oldbiblio = TransformMarcToKoha( $dbh, $marcrecord, $fw );
1501 $oldbiblio->{subtitle} = GetRecordValue('subtitle', $marcrecord, $fw);
1502 $oldbiblio->{result_number} = $i + 1;
1504 # add imageurl to itemtype if there is one
1505 $oldbiblio->{imageurl} = getitemtypeimagelocation( $search_context, $itemtypes{ $oldbiblio->{itemtype} }->{imageurl} );
1507 $oldbiblio->{'authorised_value_images'} = ($search_context eq 'opac' && C4::Context->preference('AuthorisedValueImages')) || ($search_context eq 'intranet' && C4::Context->preference('StaffAuthorisedValueImages')) ? C4::Items::get_authorised_value_images( C4::Biblio::get_biblio_authorised_values( $oldbiblio->{'biblionumber'}, $marcrecord ) ) : [];
1508 $oldbiblio->{normalized_upc} = GetNormalizedUPC( $marcrecord,$marcflavour);
1509 $oldbiblio->{normalized_ean} = GetNormalizedEAN( $marcrecord,$marcflavour);
1510 $oldbiblio->{normalized_oclc} = GetNormalizedOCLCNumber($marcrecord,$marcflavour);
1511 $oldbiblio->{normalized_isbn} = GetNormalizedISBN(undef,$marcrecord,$marcflavour);
1512 $oldbiblio->{content_identifier_exists} = 1 if ($oldbiblio->{normalized_isbn} or $oldbiblio->{normalized_oclc} or $oldbiblio->{normalized_ean} or $oldbiblio->{normalized_upc});
1514 # edition information, if any
1515 $oldbiblio->{edition} = $oldbiblio->{editionstatement};
1516 $oldbiblio->{description} = $itemtypes{ $oldbiblio->{itemtype} }->{description};
1517 # Build summary if there is one (the summary is defined in the itemtypes table)
1518 # FIXME: is this used anywhere, I think it can be commented out? -- JF
1519 if ( $itemtypes{ $oldbiblio->{itemtype} }->{summary} ) {
1520 my $summary = $itemtypes{ $oldbiblio->{itemtype} }->{summary};
1521 my @fields = $marcrecord->fields();
1524 foreach my $line ( "$summary\n" =~ /(.*)\n/g ){
1526 foreach my $tag ( $line =~ /\[(\d{3}[\w|\d])\]/ ) {
1527 $tag =~ /(.{3})(.)/;
1528 if($marcrecord->field($1)){
1529 my @abc = $marcrecord->field($1)->subfield($2);
1530 $tags->{$tag} = $#abc + 1 ;
1534 # We catch how many times to repeat this line
1536 foreach my $tag (keys(%$tags)){
1537 $max = $tags->{$tag} if($tags->{$tag} > $max);
1540 # we replace, and repeat each line
1541 for (my $i = 0 ; $i < $max ; $i++){
1542 my $newline = $line;
1544 foreach my $tag ( $newline =~ /\[(\d{3}[\w|\d])\]/g ) {
1545 $tag =~ /(.{3})(.)/;
1547 if($marcrecord->field($1)){
1548 my @repl = $marcrecord->field($1)->subfield($2);
1549 my $subfieldvalue = $repl[$i];
1551 if (! utf8::is_utf8($subfieldvalue)) {
1552 utf8::decode($subfieldvalue);
1555 $newline =~ s/\[$tag\]/$subfieldvalue/g;
1558 $newsummary .= "$newline\n";
1562 $newsummary =~ s/\[(.*?)]//g;
1563 $newsummary =~ s/\n/<br\/>/g;
1564 $oldbiblio->{summary} = $newsummary;
1567 # Pull out the items fields
1568 my @fields = $marcrecord->field($itemtag);
1569 my $marcflavor = C4::Context->preference("marcflavour");
1570 # adding linked items that belong to host records
1571 my $analyticsfield = '773';
1572 if ($marcflavor eq 'MARC21' || $marcflavor eq 'NORMARC') {
1573 $analyticsfield = '773';
1574 } elsif ($marcflavor eq 'UNIMARC') {
1575 $analyticsfield = '461';
1577 foreach my $hostfield ( $marcrecord->field($analyticsfield)) {
1578 my $hostbiblionumber = $hostfield->subfield("0");
1579 my $linkeditemnumber = $hostfield->subfield("9");
1580 if(!$hostbiblionumber eq undef){
1581 my $hostbiblio = GetMarcBiblio($hostbiblionumber, 1);
1582 my ($itemfield, undef) = GetMarcFromKohaField( 'items.itemnumber', GetFrameworkCode($hostbiblionumber) );
1583 if(!$hostbiblio eq undef){
1584 my @hostitems = $hostbiblio->field($itemfield);
1585 foreach my $hostitem (@hostitems){
1586 if ($hostitem->subfield("9") eq $linkeditemnumber){
1587 my $linkeditem =$hostitem;
1588 # append linked items if they exist
1589 if (!$linkeditem eq undef){
1590 push (@fields, $linkeditem);}
1597 # Setting item statuses for display
1598 my @available_items_loop;
1599 my @onloan_items_loop;
1600 my @other_items_loop;
1602 my $available_items;
1606 my $ordered_count = 0;
1607 my $available_count = 0;
1608 my $onloan_count = 0;
1609 my $longoverdue_count = 0;
1610 my $other_count = 0;
1611 my $wthdrawn_count = 0;
1612 my $itemlost_count = 0;
1613 my $hideatopac_count = 0;
1614 my $itembinding_count = 0;
1615 my $itemdamaged_count = 0;
1616 my $item_in_transit_count = 0;
1617 my $can_place_holds = 0;
1618 my $item_onhold_count = 0;
1619 my $items_count = scalar(@fields);
1620 my $maxitems_pref = C4::Context->preference('maxItemsinSearchResults');
1621 my $maxitems = $maxitems_pref ? $maxitems_pref - 1 : 1;
1623 # loop through every item
1625 foreach my $field (@fields) {
1628 # populate the items hash
1629 foreach my $code ( keys %subfieldstosearch ) {
1630 $item->{$code} = $field->subfield( $subfieldstosearch{$code} );
1635 my @hi = GetHiddenItemnumbers($item);
1636 $item->{'hideatopac'} = @hi;
1637 push @hiddenitems, @hi;
1640 my $hbranch = C4::Context->preference('HomeOrHoldingBranch') eq 'homebranch' ? 'homebranch' : 'holdingbranch';
1641 my $otherbranch = C4::Context->preference('HomeOrHoldingBranch') eq 'homebranch' ? 'holdingbranch' : 'homebranch';
1643 # set item's branch name, use HomeOrHoldingBranch syspref first, fall back to the other one
1644 if ($item->{$hbranch}) {
1645 $item->{'branchname'} = $branches{$item->{$hbranch}};
1647 elsif ($item->{$otherbranch}) { # Last resort
1648 $item->{'branchname'} = $branches{$item->{$otherbranch}};
1651 my $prefix = $item->{$hbranch} . '--' . $item->{location} . $item->{itype} . $item->{itemcallnumber};
1652 # For each grouping of items (onloan, available, unavailable), we build a key to store relevant info about that item
1653 my $userenv = C4::Context->userenv;
1654 if ( $item->{onloan} && !(C4::Members::GetHideLostItemsPreference($userenv->{'number'}) && $item->{itemlost}) ) {
1656 my $key = $prefix . $item->{onloan} . $item->{barcode};
1657 $onloan_items->{$key}->{due_date} = format_date($item->{onloan});
1658 $onloan_items->{$key}->{count}++ if $item->{$hbranch};
1659 $onloan_items->{$key}->{branchname} = $item->{branchname};
1660 $onloan_items->{$key}->{location} = $shelflocations->{ $item->{location} };
1661 $onloan_items->{$key}->{itemcallnumber} = $item->{itemcallnumber};
1662 $onloan_items->{$key}->{imageurl} = getitemtypeimagelocation( $search_context, $itemtypes{ $item->{itype} }->{imageurl} );
1663 # if something's checked out and lost, mark it as 'long overdue'
1664 if ( $item->{itemlost} ) {
1665 $onloan_items->{$prefix}->{longoverdue}++;
1666 $longoverdue_count++;
1667 } else { # can place holds as long as item isn't lost
1668 $can_place_holds = 1;
1672 # items not on loan, but still unavailable ( lost, withdrawn, damaged )
1676 if ( $item->{notforloan} == -1 ) {
1680 # is item in transit?
1681 my $transfertwhen = '';
1682 my ($transfertfrom, $transfertto);
1684 # is item on the reserve shelf?
1685 my $reservestatus = '';
1688 unless ($item->{wthdrawn}
1689 || $item->{itemlost}
1691 || $item->{notforloan}
1692 || $items_count > 20) {
1694 # A couple heuristics to limit how many times
1695 # we query the database for item transfer information, sacrificing
1696 # accuracy in some cases for speed;
1698 # 1. don't query if item has one of the other statuses
1699 # 2. don't check transit status if the bib has
1700 # more than 20 items
1702 # FIXME: to avoid having the query the database like this, and to make
1703 # the in transit status count as unavailable for search limiting,
1704 # should map transit status to record indexed in Zebra.
1706 ($transfertwhen, $transfertfrom, $transfertto) = C4::Circulation::GetTransfers($item->{itemnumber});
1707 ($reservestatus, $reserveitem, undef) = C4::Reserves::CheckReserves($item->{itemnumber});
1710 # item is withdrawn, lost, damaged, not for loan, reserved or in transit
1711 if ( $item->{wthdrawn}
1712 || $item->{itemlost}
1714 || $item->{notforloan} > 0
1715 || $item->{hideatopac}
1716 || $reservestatus eq 'Waiting'
1717 || ($transfertwhen ne ''))
1719 $wthdrawn_count++ if $item->{wthdrawn};
1720 $itemlost_count++ if $item->{itemlost};
1721 $itemdamaged_count++ if $item->{damaged};
1722 $hideatopac_count++ if $item->{hideatopac};
1723 $item_in_transit_count++ if $transfertwhen ne '';
1724 $item_onhold_count++ if $reservestatus eq 'Waiting';
1725 $item->{status} = $item->{wthdrawn} . "-" . $item->{itemlost} . "-" . $item->{damaged} . "-" . $item->{notforloan};
1727 # can place hold on item ?
1728 if ((!$item->{damaged} || C4::Context->preference('AllowHoldsOnDamagedItems'))
1729 && !$item->{itemlost}
1730 && !$item->{withdrawn}
1732 $can_place_holds = 1;
1737 my $key = $prefix . $item->{status};
1738 foreach (qw(wthdrawn itemlost damaged branchname itemcallnumber hideatopac)) {
1739 $other_items->{$key}->{$_} = $item->{$_};
1741 $other_items->{$key}->{intransit} = ( $transfertwhen ne '' ) ? 1 : 0;
1742 $other_items->{$key}->{onhold} = ($reservestatus) ? 1 : 0;
1743 $other_items->{$key}->{notforloan} = GetAuthorisedValueDesc('','',$item->{notforloan},'','',$notforloan_authorised_value) if $notforloan_authorised_value;
1744 $other_items->{$key}->{count}++ if $item->{$hbranch};
1745 $other_items->{$key}->{location} = $shelflocations->{ $item->{location} };
1746 $other_items->{$key}->{imageurl} = getitemtypeimagelocation( $search_context, $itemtypes{ $item->{itype} }->{imageurl} );
1750 $can_place_holds = 1;
1752 $available_items->{$prefix}->{count}++ if $item->{$hbranch};
1753 foreach (qw(branchname itemcallnumber hideatopac)) {
1754 $available_items->{$prefix}->{$_} = $item->{$_};
1756 $available_items->{$prefix}->{location} = $shelflocations->{ $item->{location} };
1757 $available_items->{$prefix}->{imageurl} = getitemtypeimagelocation( $search_context, $itemtypes{ $item->{itype} }->{imageurl} );
1760 } # notforloan, item level and biblioitem level
1761 if ($items_count > 0) {
1762 next if $is_opac && $hideatopac_count >= $items_count;
1763 next if $hidelostitems && $itemlost_count >= $items_count;
1765 my ( $availableitemscount, $onloanitemscount, $otheritemscount );
1766 for my $key ( sort keys %$onloan_items ) {
1767 (++$onloanitemscount > $maxitems) and last;
1768 push @onloan_items_loop, $onloan_items->{$key};
1770 for my $key ( sort keys %$other_items ) {
1771 (++$otheritemscount > $maxitems) and last;
1772 push @other_items_loop, $other_items->{$key};
1774 for my $key ( sort keys %$available_items ) {
1775 (++$availableitemscount > $maxitems) and last;
1776 push @available_items_loop, $available_items->{$key}
1779 # XSLT processing of some stuff
1781 SetUTF8Flag($marcrecord);
1782 $debug && warn $marcrecord->as_formatted;
1783 my $interface = $search_context eq 'opac' ? 'OPAC' : '';
1784 if (!$scan && C4::Context->preference($interface . "XSLTResultsDisplay")) {
1785 $oldbiblio->{XSLTResultsRecord} = XSLTParse4Display($oldbiblio->{biblionumber}, $marcrecord, 'Results',
1786 $search_context, 1, \@hiddenitems);
1787 # the last parameter tells Koha to clean up the problematic ampersand entities that Zebra outputs
1790 # if biblio level itypes are used and itemtype is notforloan, it can't be reserved either
1791 if (!C4::Context->preference("item-level_itypes")) {
1792 if ($itemtypes{ $oldbiblio->{itemtype} }->{notforloan}) {
1793 $can_place_holds = 0;
1796 $oldbiblio->{norequests} = 1 unless $can_place_holds;
1797 $oldbiblio->{itemsplural} = 1 if $items_count > 1;
1798 $oldbiblio->{items_count} = $items_count;
1799 $oldbiblio->{available_items_loop} = \@available_items_loop;
1800 $oldbiblio->{onloan_items_loop} = \@onloan_items_loop;
1801 $oldbiblio->{other_items_loop} = \@other_items_loop;
1802 $oldbiblio->{availablecount} = $available_count;
1803 $oldbiblio->{availableplural} = 1 if $available_count > 1;
1804 $oldbiblio->{onloancount} = $onloan_count;
1805 $oldbiblio->{onloanplural} = 1 if $onloan_count > 1;
1806 $oldbiblio->{othercount} = $other_count;
1807 $oldbiblio->{otherplural} = 1 if $other_count > 1;
1808 $oldbiblio->{wthdrawncount} = $wthdrawn_count;
1809 $oldbiblio->{itemlostcount} = $itemlost_count;
1810 $oldbiblio->{damagedcount} = $itemdamaged_count;
1811 $oldbiblio->{intransitcount} = $item_in_transit_count;
1812 $oldbiblio->{onholdcount} = $item_onhold_count;
1813 $oldbiblio->{orderedcount} = $ordered_count;
1814 # deleting - in isbn to enable amazon content
1815 $oldbiblio->{isbn} =~ s/-//g;
1817 if (C4::Context->preference("AlternateHoldingsField") && $items_count == 0) {
1818 my $fieldspec = C4::Context->preference("AlternateHoldingsField");
1819 my $subfields = substr $fieldspec, 3;
1820 my $holdingsep = C4::Context->preference("AlternateHoldingsSeparator") || ' ';
1821 my @alternateholdingsinfo = ();
1822 my @holdingsfields = $marcrecord->field(substr $fieldspec, 0, 3);
1823 my $alternateholdingscount = 0;
1825 for my $field (@holdingsfields) {
1826 my %holding = ( holding => '' );
1827 my $havesubfield = 0;
1828 for my $subfield ($field->subfields()) {
1829 if ((index $subfields, $$subfield[0]) >= 0) {
1830 $holding{'holding'} .= $holdingsep if (length $holding{'holding'} > 0);
1831 $holding{'holding'} .= $$subfield[1];
1835 if ($havesubfield) {
1836 push(@alternateholdingsinfo, \%holding);
1837 $alternateholdingscount++;
1841 $oldbiblio->{'ALTERNATEHOLDINGS'} = \@alternateholdingsinfo;
1842 $oldbiblio->{'alternateholdings_count'} = $alternateholdingscount;
1845 push( @newresults, $oldbiblio );
1851 =head2 SearchAcquisitions
1852 Search for acquisitions
# SearchAcquisitions( $datebegin, $dateend, \@itemtypes, $criteria, $orderby )
#
# Lists the records that have items accessioned between two dates, grouped
# into "buckets". One SQL statement is prepared once and executed once per
# bucket value, with that value bound to the statement's last placeholder.
#
# Parameters:
#   $datebegin, $dateend - objects answering ->output("iso"); their output is
#                          bound to "dateaccessioned BETWEEN ? AND ?".
#   $itemtypes           - array reference of item type codes (may be empty).
#                          When $criteria is not exactly "itemtype" and the
#                          list is non-empty, it restricts every bucket.
#                          NOTE: when $criteria matches /itemtype/ and the list
#                          is empty, the caller's array is filled with every
#                          key returned by GetItemTypes() (historic behaviour,
#                          kept for compatibility).
#   $criteria            - bucket mode: /itemtype/ gives one bucket per item
#                          type; /itemcallnumber/ gives one bucket per call
#                          number prefix "AA".."ZZ" plus the empty prefix;
#                          anything else gives one bucket per title prefix.
#   $orderby             - /date_desc/ sorts by dateaccessioned DESC,
#                          anything else sorts by title.
#
# Returns an array reference of hashes { title, titlecode, loopdata } where
# loopdata is an array reference of { summary => GetBiblioSummary(marcxml) }.
# Buckets without any row are left out, and so are buckets whose query failed
# (a warning is emitted for those).
sub SearchAcquisitions{
    my ($datebegin, $dateend, $itemtypes,$criteria, $orderby) = @_;

    # Tolerate omitted optional arguments instead of dying on a deref/match.
    $itemtypes ||= [];
    $criteria = '' unless defined $criteria;
    $orderby  = '' unless defined $orderby;

    my $dbh = C4::Context->dbh;

    # The item type lives on the item or on the biblioitem, depending on the
    # item-level_itypes system preference.
    my $itype_column = C4::Context->preference("item-level_itypes")
      ? 'items.itype'
      : 'biblioitems.itemtype';

    my $str = qq|
    SELECT marcxml
    FROM biblio
    LEFT JOIN biblioitems ON biblioitems.biblionumber=biblio.biblionumber
    LEFT JOIN items ON items.biblionumber=biblio.biblionumber
    WHERE dateaccessioned BETWEEN ? AND ?
    |;

    my @params = ( $datebegin->output("iso"), $dateend->output("iso") );
    my @loopcriteria;

    # Global item type restriction (not used when bucketing by item type,
    # where each bucket already binds exactly one type).
    if ( @$itemtypes and $criteria ne "itemtype" ) {
        $str .= "AND $itype_column IN ("
          . join( ',', ('?') x scalar @$itemtypes ) . ") ";
        push @params, @$itemtypes;
    }

    if ( $criteria =~ /itemtype/ ) {
        $str .= "AND $itype_column=? ";

        # No explicit list given: bucket on every known item type.
        push @$itemtypes, keys %{ GetItemTypes() } unless @$itemtypes;
        @loopcriteria = @$itemtypes;
    }
    elsif ( $criteria =~ /itemcallnumber/ ) {
        $str .= "AND (items.itemcallnumber LIKE CONCAT(?,'%')
                 OR items.itemcallnumber is NULL
                 OR items.itemcallnumber = '')";
        @loopcriteria = ( "AA" .. "ZZ", "" );
    }
    else {
        $str .= "AND biblio.title LIKE CONCAT(?,'%') ";
        @loopcriteria = ( "A" .. "z" );
    }

    $str .= ( $orderby =~ /date_desc/ )
      ? " ORDER BY dateaccessioned DESC"
      : " ORDER BY title";

    my $qdataacquisitions = $dbh->prepare($str);

    my @loopacquisitions;
    foreach my $value (@loopcriteria) {

        # The bucket value is always the last placeholder; pass it directly
        # rather than pushing/popping it on the shared parameter list.
        eval { $qdataacquisitions->execute( @params, $value ); };
        if ($@) {
            warn "recentacquisitions Error :$@";
            next;    # nothing to fetch; previously this fell through to a deref of undef
        }

        my @loopdata;
        while ( my $data = $qdataacquisitions->fetchrow_hashref ) {
            push @loopdata, { "summary" => GetBiblioSummary( $data->{'marcxml'} ) };
        }
        next unless @loopdata;    # empty buckets are not reported

        push @loopacquisitions,
          { title => $value, titlecode => $value, loopdata => \@loopdata };
    }
    $qdataacquisitions->finish;
    return \@loopacquisitions;
}
1939 #----------------------------------------------------------------------
1941 # Non-Zebra GetRecords#
1942 #----------------------------------------------------------------------
1946 NZgetRecords has the same API as the Zebra getRecords, even if some parameters are not managed
1952 $query, $simple_query, $sort_by_ref, $servers_ref,
1953 $results_per_page, $offset, $expanded_facet, $branches,
1956 warn "query =$query" if $DEBUG;
1957 my $result = NZanalyse($query);
1958 warn "results =$result" if $DEBUG;
1960 NZorder( $result, @$sort_by_ref[0], $results_per_page, $offset ),
1966 NZanalyse : get a CQL string as parameter, and returns a list of biblionumber;title,biblionumber;title,...
1967 the list is built from an inverted index in the nozebra SQL table
1968 note that title is here only for convenience : the sorting will be very fast when requested on title
1969 if the sorting is requested on something else, we will have to reread all results, and that may be longer.
1974 my ( $string, $server ) = @_;
1975 # warn "---------" if $DEBUG;
1976 warn " NZanalyse" if $DEBUG;
1977 # warn "---------" if $DEBUG;
1979 # $server contains biblioserver or authorities, depending on what we search on.
1980 #warn "querying : $string on $server";
1981 $server = 'biblioserver' unless $server;
1983 # if we have a ", replace the content to discard temporarily any and/or/not inside
1985 if ( $string =~ /"/ ) {
1986 $string =~ s/"(.*?)"/__X__/;
1988 warn "commacontent : $commacontent" if $DEBUG;
1991 # split the query string in 3 parts : X AND Y means : $left="X", $operand="AND" and $right="Y"
1992 # then, call again NZanalyse with $left and $right
1993 # (recursive until we find a leaf (=> something without and/or/not)
1994 # delete repeated operator... Would then go in infinite loop
1995 while ( $string =~ s/( and| or| not| AND| OR| NOT)\1/$1/g ) {
1998 #process parenthesis before.
1999 if ( $string =~ /^\s*\((.*)\)(( and | or | not | AND | OR | NOT )(.*))?/ ) {
2002 my $operator = lc($3); # FIXME: and/or/not are operators, not operands
2004 "dealing w/parenthesis before recursive sub call. left :$left operator:$operator right:$right"
2006 my $leftresult = NZanalyse( $left, $server );
2008 my $rightresult = NZanalyse( $right, $server );
2010 # OK, we have the results for right and left part of the query
2011 # depending of operand, intersect, union or exclude both lists
2012 # to get a result list
2013 if ( $operator eq ' and ' ) {
2014 return NZoperatorAND($leftresult,$rightresult);
2016 elsif ( $operator eq ' or ' ) {
2018 # just merge the 2 strings
2019 return $leftresult . $rightresult;
2021 elsif ( $operator eq ' not ' ) {
2022 return NZoperatorNOT($leftresult,$rightresult);
2026 # this error is impossible, because of the regexp that isolate the operand, but just in case...
2030 warn "string :" . $string if $DEBUG;
2034 if ($string =~ /(.*?)( and | or | not | AND | OR | NOT )(.*)/) {
2037 $operator = lc($2); # FIXME: and/or/not are operators, not operands
2039 warn "no parenthesis. left : $left operator: $operator right: $right"
2042 # it's not a leaf, we have a and/or/not
2045 # reintroduce comma content if needed
2046 $right =~ s/__X__/"$commacontent"/ if $commacontent;
2047 $left =~ s/__X__/"$commacontent"/ if $commacontent;
2048 warn "node : $left / $operator / $right\n" if $DEBUG;
2049 my $leftresult = NZanalyse( $left, $server );
2050 my $rightresult = NZanalyse( $right, $server );
2051 warn " leftresult : $leftresult" if $DEBUG;
2052 warn " rightresult : $rightresult" if $DEBUG;
2053 # OK, we have the results for right and left part of the query
2054 # depending of operand, intersect, union or exclude both lists
2055 # to get a result list
2056 if ( $operator eq ' and ' ) {
2057 return NZoperatorAND($leftresult,$rightresult);
2059 elsif ( $operator eq ' or ' ) {
2061 # just merge the 2 strings
2062 return $leftresult . $rightresult;
2064 elsif ( $operator eq ' not ' ) {
2065 return NZoperatorNOT($leftresult,$rightresult);
2069 # this error is impossible, because of the regexp that isolate the operand, but just in case...
2070 die "error : operand unknown : $operator for $string";
2073 # it's a leaf, do the real SQL query and return the result
2076 $string =~ s/__X__/"$commacontent"/ if $commacontent;
2077 $string =~ s/-|\.|\?|,|;|!|'|\(|\)|\[|\]|{|}|"|&|\+|\*|\// /g;
2078 #remove leading blank at the beginning
2080 warn "leaf:$string" if $DEBUG;
2082 # parse the string into operator/operand/value again
2086 if ($string =~ /(.*)(>=|<=)(.*)/) {
2093 # warn "handling leaf... left:$left operator:$operator right:$right"
2095 unless ($operator) {
2096 if ($string =~ /(.*)(>|<|=)(.*)/) {
2101 "handling unless (operator)... left:$left operator:$operator right:$right"
2109 # strip adv, zebra keywords, currently not handled in nozebra: wrdl, ext, phr...
2112 # automatic replace for short operators
2113 $left = 'title' if $left =~ '^ti$';
2114 $left = 'author' if $left =~ '^au$';
2115 $left = 'publisher' if $left =~ '^pb$';
2116 $left = 'subject' if $left =~ '^su$';
2117 $left = 'koha-Auth-Number' if $left =~ '^an$';
2118 $left = 'keyword' if $left =~ '^kw$';
2119 $left = 'itemtype' if $left =~ '^mc$'; # Fix for Bug 2599 - Search limits not working for NoZebra
2120 warn "handling leaf... left:$left operator:$operator right:$right" if $DEBUG;
2121 my $dbh = C4::Context->dbh;
2122 if ( $operator && $left ne 'keyword' ) {
2123 #do a specific search
2124 $operator = 'LIKE' if $operator eq '=' and $right =~ /%/;
2125 my $sth = $dbh->prepare(
2126 "SELECT biblionumbers,value FROM nozebra WHERE server=? AND indexname=? AND value $operator ?"
2128 warn "$left / $operator / $right\n" if $DEBUG;
2130 # split each word, query the DB and build the biblionumbers result
2131 #sanitizing leftpart
2132 $left =~ s/^\s+|\s+$//;
2133 foreach ( split / /, $right ) {
2135 $_ =~ s/^\s+|\s+$//;
2137 warn "EXECUTE : $server, $left, $_" if $DEBUG;
2138 $sth->execute( $server, $left, $_ )
2139 or warn "execute failed: $!";
2140 while ( my ( $line, $value ) = $sth->fetchrow ) {
2142 # if we are dealing with a numeric value, use only numeric results (in case of >=, <=, > or <)
2143 # otherwise, fill the result
2144 $biblionumbers .= $line
2145 unless ( $right =~ /^\d+$/ && $value =~ /\D/ );
2146 warn "result : $value "
2147 . ( $right =~ /\d/ ) . "=="
2148 . ( $value =~ /\D/?$line:"" ) if $DEBUG; #= $line";
2151 # do a AND with existing list if there is one, otherwise, use the biblionumbers list as 1st result list
2153 warn "NZAND" if $DEBUG;
2154 $results = NZoperatorAND($biblionumbers,$results);
2156 $results = $biblionumbers;
2161 #do a complete search (all indexes), if index='kw' do complete search too.
2162 my $sth = $dbh->prepare(
2163 "SELECT biblionumbers FROM nozebra WHERE server=? AND value LIKE ?"
2166 # split each word, query the DB and build the biblionumbers result
2167 foreach ( split / /, $string ) {
2168 next if C4::Context->stopwords->{ uc($_) }; # skip if stopword
2169 warn "search on all indexes on $_" if $DEBUG;
2172 $sth->execute( $server, $_ );
2173 while ( my $line = $sth->fetchrow ) {
2174 $biblionumbers .= $line;
2177 # do a AND with existing list if there is one, otherwise, use the biblionumbers list as 1st result list
2179 $results = NZoperatorAND($biblionumbers,$results);
2182 warn "NEW RES for $_ = $biblionumbers" if $DEBUG;
2183 $results = $biblionumbers;
2187 warn "return : $results for LEAF : $string" if $DEBUG;
2190 warn "---------\nLeave NZanalyse\n---------" if $DEBUG;
# NZoperatorAND( $rightresult, $leftresult )
#
# Intersects two NoZebra result lists. Each list is a string of
# ';'-terminated entries of the form "<value>-<count>".
#
# Every entry of $leftresult whose <value> also appears as a whole entry in
# $rightresult is kept. It is written twice, carrying the smaller of the two
# counts, so that an AND hit weighs as much as the same hit reached by OR.
# Example:
#   TWO   : 61-2;64-1;121-1;
#   TOWER : 61-1;64-1;130-1;
#   result: 61-1;61-1;64-1;64-1;
#
# Returns the resulting list string, or undef when nothing is common.
sub NZoperatorAND{
    my ($rightresult, $leftresult)=@_;

    my @leftresult = split /;/, $leftresult;
    warn " @leftresult / $rightresult \n" if $DEBUG;

    my $finalresult;
    foreach my $entry (@leftresult) {

        # Separate the trailing "-<count>" from the value, when present.
        my ( $value, $countvalue ) = ($entry);
        ( $value, $countvalue ) = ( $1, $2 ) if $entry =~ /(.*)-(\d+)$/;

        # The value must match a whole entry: anchor on the start of the list
        # or on the previous ';' so that "1,x" is not found inside "61,x".
        next unless $rightresult =~ /(?:\A|;)\Q$value\E-(\d+);/;
        my $othercount = $1;

        # Keep the smaller count; fall back to the other side's count when
        # this entry carried none, instead of emitting a malformed "value-;".
        $countvalue = $othercount
          if !defined $countvalue || $othercount < $countvalue;

        $finalresult .= "$value-$countvalue;$value-$countvalue;";
    }
    warn "NZAND DONE : $finalresult \n" if $DEBUG;
    return $finalresult;
}
# NZoperatorOR( $rightresult, $leftresult )
#
# Union of two NoZebra result lists: the two list strings are simply glued
# together, first argument first. Entries present in both lists therefore
# appear twice in the returned string.
sub NZoperatorOR{
    my ( $first_list, $second_list ) = @_;
    return join '', $first_list, $second_list;
}
# NZoperatorNOT( $leftresult, $rightresult )
#
# Difference of two NoZebra result lists ("left NOT right"). Each list is a
# string of ';'-separated entries of the form "<value>-<count>".
#
# Returns the entries of $leftresult (unchanged, each followed by ';') whose
# <value> does not occur as an entry of $rightresult, or undef when every
# entry is excluded.
sub NZoperatorNOT{
    my ($leftresult, $rightresult)=@_;

    my $finalresult;
    foreach my $entry ( split /;/, $leftresult ) {

        # Compare on the value only, ignoring the trailing "-<count>".
        my $value = $entry;
        $value = $1 if $value =~ m/(.*)-\d+$/;

        # Match literally (\Q..\E: the value contains free text such as a
        # title) and only at an entry boundary, so "1,x" does not exclude
        # itself because "61,x" is present on the right-hand side.
        next if $rightresult =~ /(?:\A|;)\Q$value\E-/;

        $finalresult .= "$entry;";
    }
    return $finalresult;
}
2244 $finalresult = NZorder($biblionumbers, $ordering,$results_per_page,$offset);
2251 my ( $biblionumbers, $ordering, $results_per_page, $offset ) = @_;
2252 warn "biblionumbers = $biblionumbers and ordering = $ordering\n" if $DEBUG;
2254 # order title asc by default
2255 # $ordering = '1=36 <i' unless $ordering;
2256 $results_per_page = 20 unless $results_per_page;
2257 $offset = 0 unless $offset;
2258 my $dbh = C4::Context->dbh;
2261 # order by POPULARITY
2263 if ( $ordering =~ /popularity/ ) {
2267 # popularity is not in the MARC record, it's built from a specific query
2269 $dbh->prepare("select sum(issues) from items where biblionumber=?");
2270 foreach ( split /;/, $biblionumbers ) {
2271 my ( $biblionumber, $title ) = split /,/, $_;
2272 $result{$biblionumber} = GetMarcBiblio($biblionumber);
2273 $sth->execute($biblionumber);
2274 my $popularity = $sth->fetchrow || 0;
2276 # hint : the key is popularity.title because we can have
2277 # many results with the same popularity. In this case, sub-ordering is done by title
2278 # we also have biblionumber to avoid bug for 2 biblios with the same title & popularity
2279 # (un-frequent, I agree, but we won't forget anything that way ;-)
2280 $popularity{ sprintf( "%10d", $popularity ) . $title
2281 . $biblionumber } = $biblionumber;
2284 # sort the hash and return the same structure as GetRecords (Zebra querying)
2287 if ( $ordering eq 'popularity_dsc' ) { # sort popularity DESC
2288 foreach my $key ( sort { $b cmp $a } ( keys %popularity ) ) {
2289 $result_hash->{'RECORDS'}[ $numbers++ ] =
2290 $result{ $popularity{$key} }->as_usmarc();
2293 else { # sort popularity ASC
2294 foreach my $key ( sort ( keys %popularity ) ) {
2295 $result_hash->{'RECORDS'}[ $numbers++ ] =
2296 $result{ $popularity{$key} }->as_usmarc();
2299 my $finalresult = ();
2300 $result_hash->{'hits'} = $numbers;
2301 $finalresult->{'biblioserver'} = $result_hash;
2302 return $finalresult;
2308 elsif ( $ordering =~ /author/ ) {
2310 foreach ( split /;/, $biblionumbers ) {
2311 my ( $biblionumber, $title ) = split /,/, $_;
2312 my $record = GetMarcBiblio($biblionumber);
2314 if ( C4::Context->preference('marcflavour') eq 'UNIMARC' ) {
2315 $author = $record->subfield( '200', 'f' );
2316 $author = $record->subfield( '700', 'a' ) unless $author;
2319 $author = $record->subfield( '100', 'a' );
2322 # hint : the result is sorted by title.biblionumber because we can have X biblios with the same title
2323 # and we don't want to get only 1 result for each of them !!!
2324 $result{ $author . $biblionumber } = $record;
2327 # sort the hash and return the same structure as GetRecords (Zebra querying)
2330 if ( $ordering eq 'author_za' || $ordering eq 'author_dsc' ) { # sort by author desc
2331 foreach my $key ( sort { $b cmp $a } ( keys %result ) ) {
2332 $result_hash->{'RECORDS'}[ $numbers++ ] =
2333 $result{$key}->as_usmarc();
2336 else { # sort by author ASC
2337 foreach my $key ( sort ( keys %result ) ) {
2338 $result_hash->{'RECORDS'}[ $numbers++ ] =
2339 $result{$key}->as_usmarc();
2342 my $finalresult = ();
2343 $result_hash->{'hits'} = $numbers;
2344 $finalresult->{'biblioserver'} = $result_hash;
2345 return $finalresult;
2348 # ORDER BY callnumber
2351 elsif ( $ordering =~ /callnumber/ ) {
2353 foreach ( split /;/, $biblionumbers ) {
2354 my ( $biblionumber, $title ) = split /,/, $_;
2355 my $record = GetMarcBiblio($biblionumber);
2357 my $frameworkcode = GetFrameworkCode($biblionumber);
2358 my ( $callnumber_tag, $callnumber_subfield ) = GetMarcFromKohaField( 'items.itemcallnumber', $frameworkcode);
2359 ( $callnumber_tag, $callnumber_subfield ) = GetMarcFromKohaField('biblioitems.callnumber', $frameworkcode)
2360 unless $callnumber_tag;
2361 if ( C4::Context->preference('marcflavour') eq 'UNIMARC' ) {
2362 $callnumber = $record->subfield( '200', 'f' );
2364 $callnumber = $record->subfield( '100', 'a' );
2367 # hint : the result is sorted by title.biblionumber because we can have X biblios with the same title
2368 # and we don't want to get only 1 result for each of them !!!
2369 $result{ $callnumber . $biblionumber } = $record;
2372 # sort the hash and return the same structure as GetRecords (Zebra querying)
2375 if ( $ordering eq 'call_number_dsc' ) { # sort by title desc
2376 foreach my $key ( sort { $b cmp $a } ( keys %result ) ) {
2377 $result_hash->{'RECORDS'}[ $numbers++ ] =
2378 $result{$key}->as_usmarc();
2381 else { # sort by title ASC
2382 foreach my $key ( sort { $a cmp $b } ( keys %result ) ) {
2383 $result_hash->{'RECORDS'}[ $numbers++ ] =
2384 $result{$key}->as_usmarc();
2387 my $finalresult = ();
2388 $result_hash->{'hits'} = $numbers;
2389 $finalresult->{'biblioserver'} = $result_hash;
2390 return $finalresult;
2392 elsif ( $ordering =~ /pubdate/ ) { #pub year
2394 foreach ( split /;/, $biblionumbers ) {
2395 my ( $biblionumber, $title ) = split /,/, $_;
2396 my $record = GetMarcBiblio($biblionumber);
2397 my ( $publicationyear_tag, $publicationyear_subfield ) =
2398 GetMarcFromKohaField( 'biblioitems.publicationyear', '' );
2399 my $publicationyear =
2400 $record->subfield( $publicationyear_tag,
2401 $publicationyear_subfield );
2403 # hint : the result is sorted by title.biblionumber because we can have X biblios with the same title
2404 # and we don't want to get only 1 result for each of them !!!
2405 $result{ $publicationyear . $biblionumber } = $record;
2408 # sort the hash and return the same structure as GetRecords (Zebra querying)
2411 if ( $ordering eq 'pubdate_dsc' ) { # sort by pubyear desc
2412 foreach my $key ( sort { $b cmp $a } ( keys %result ) ) {
2413 $result_hash->{'RECORDS'}[ $numbers++ ] =
2414 $result{$key}->as_usmarc();
2417 else { # sort by pub year ASC
2418 foreach my $key ( sort ( keys %result ) ) {
2419 $result_hash->{'RECORDS'}[ $numbers++ ] =
2420 $result{$key}->as_usmarc();
2423 my $finalresult = ();
2424 $result_hash->{'hits'} = $numbers;
2425 $finalresult->{'biblioserver'} = $result_hash;
2426 return $finalresult;
2432 elsif ( $ordering =~ /title/ ) {
2434 # the title is in the biblionumbers string, so we just need to build a hash, sort it and return
2436 foreach ( split /;/, $biblionumbers ) {
2437 my ( $biblionumber, $title ) = split /,/, $_;
2439 # hint : the result is sorted by title.biblionumber because we can have X biblios with the same title
2440 # and we don't want to get only 1 result for each of them !!!
2441 # hint & speed improvement : we can order without reading the record
2442 # so order, and read records only for the requested page !
2443 $result{ $title . $biblionumber } = $biblionumber;
2446 # sort the hash and return the same structure as GetRecords (Zebra querying)
2449 if ( $ordering eq 'title_az' ) { # sort by title desc
2450 foreach my $key ( sort ( keys %result ) ) {
2451 $result_hash->{'RECORDS'}[ $numbers++ ] = $result{$key};
2454 else { # sort by title ASC
2455 foreach my $key ( sort { $b cmp $a } ( keys %result ) ) {
2456 $result_hash->{'RECORDS'}[ $numbers++ ] = $result{$key};
2460 # limit the $results_per_page to result size if it's more
2461 $results_per_page = $numbers - 1 if $numbers < $results_per_page;
2463 # for the requested page, replace biblionumber by the complete record
2464 # speed improvement : avoid reading too much things
2466 my $counter = $offset ;
2467 $counter <= $offset + $results_per_page ;
2471 $result_hash->{'RECORDS'}[$counter] =
2472 GetMarcBiblio( $result_hash->{'RECORDS'}[$counter] )->as_usmarc;
2474 my $finalresult = ();
2475 $result_hash->{'hits'} = $numbers;
2476 $finalresult->{'biblioserver'} = $result_hash;
2477 return $finalresult;
2484 # we need 2 hashes to order by ranking : the 1st one to count the ranking, the 2nd to order by ranking
2487 foreach ( split /;/, $biblionumbers ) {
2488 my ( $biblionumber, $title ) = split /,/, $_;
2489 $title =~ /(.*)-(\d)/;
2494 # note that we + the ranking because ranking is calculated on weight of EACH term requested.
2495 # if we ask for "two towers", and "two" has weight 2 in biblio N, and "towers" has weight 4 in biblio N
2496 # biblio N has ranking = 6
2497 $count_ranking{$biblionumber} += $ranking;
2500 # build the result by "inverting" the count_ranking hash
2501 # hing : as usual, we don't order by ranking only, to avoid having only 1 result for each rank. We build an hash on concat(ranking,biblionumber) instead
2503 foreach ( keys %count_ranking ) {
2504 $result{ sprintf( "%10d", $count_ranking{$_} ) . '-' . $_ } = $_;
2507 # sort the hash and return the same structure as GetRecords (Zebra querying)
2510 foreach my $key ( sort { $b cmp $a } ( keys %result ) ) {
2511 $result_hash->{'RECORDS'}[ $numbers++ ] = $result{$key};
2514 # limit the $results_per_page to result size if it's more
2515 $results_per_page = $numbers - 1 if $numbers < $results_per_page;
2517 # for the requested page, replace biblionumber by the complete record
2518 # speed improvement : avoid reading too much things
2520 my $counter = $offset ;
2521 $counter <= $offset + $results_per_page ;
2525 $result_hash->{'RECORDS'}[$counter] =
2526 GetMarcBiblio( $result_hash->{'RECORDS'}[$counter] )->as_usmarc
2527 if $result_hash->{'RECORDS'}[$counter];
2529 my $finalresult = ();
2530 $result_hash->{'hits'} = $numbers;
2531 $finalresult->{'biblioserver'} = $result_hash;
2532 return $finalresult;
2536 =head2 enabled_staff_search_views
2538 %hash = enabled_staff_search_views()
2540 This function returns a hash that contains three flags obtained from the system
2541 preferences, used to determine whether a particular staff search results view is enabled.
2546 =item C<Output arg:>
2548 * $hash{can_view_MARC} is true only if the MARC view is enabled
2549 * $hash{can_view_ISBD} is true only if the ISBD view is enabled
2550 * $hash{can_view_labeledMARC} is true only if the Labeled MARC view is enabled
2552 =item C<usage in the script:>
2556 $template->param ( C4::Search::enabled_staff_search_views );
# Returns a flat key/value list (suitable for assigning to a hash or passing
# to $template->param) with one flag per optional staff search result view.
# Each flag holds the value of the matching system preference:
#   can_view_MARC        - 'viewMARC'
#   can_view_ISBD        - 'viewISBD'
#   can_view_labeledMARC - 'viewLabeledMARC'
sub enabled_staff_search_views {

    # Each lookup is forced into scalar context: inside a key/value list a
    # call that returned an empty list would silently shift every following
    # pair and corrupt the resulting hash.
    return (
        can_view_MARC        => scalar( C4::Context->preference('viewMARC') ),           # 1 if the staff search allows the MARC view
        can_view_ISBD        => scalar( C4::Context->preference('viewISBD') ),           # 1 if the staff search allows the ISBD view
        can_view_labeledMARC => scalar( C4::Context->preference('viewLabeledMARC') ),    # 1 if the staff search allows the Labeled MARC view
    );
}
# Records one search in the search_history table and returns the id of the
# inserted row as reported by the database handle.
#   $borrowernumber - stored in the userid column
#   $session        - stored in the sessionid column
#   $query_desc     - stored in the query_desc column
#   $query_cgi      - stored in the query_cgi column
#   $total          - stored in the total column
# The time column is filled in by the database (NOW()).
sub AddSearchHistory {
    my ( $borrowernumber, $session, $query_desc, $query_cgi, $total ) = @_;

    my $dbh    = C4::Context->dbh;
    my $insert = $dbh->prepare(
        "INSERT INTO search_history(userid, sessionid, query_desc, query_cgi, total, time) VALUES(?, ?, ?, ?, ?, NOW())"
    );
    $insert->execute( $borrowernumber, $session, $query_desc, $query_cgi, $total );

    return $dbh->last_insert_id( undef, 'search_history', undef, undef, undef );
}
# Fetches the stored searches that belong either to the given borrower or to
# the given session.
#   $borrowernumber - matched against the userid column
#   $session        - matched against the sessionid column
# Returns a reference to an array of hash references, one per search_history
# row, keyed by column name.
sub GetSearchHistory {
    my ( $borrowernumber, $session ) = @_;
    my $dbh = C4::Context->dbh;

    # The previous statement had no select list ("SELECT FROM ..."), which is
    # not valid SQL, so this function could never return rows.
    my $query = "SELECT * FROM search_history WHERE (userid=? OR sessionid=?)";
    my $sth   = $dbh->prepare($query);
    $sth->execute( $borrowernumber, $session );

    # fetchall_hashref() requires a key field and rejects a hash reference;
    # fetchall_arrayref({}) is the DBI call that returns every row as a hash.
    return $sth->fetchall_arrayref( {} );
}
2591 =head2 z3950_search_args
2593 $arrayref = z3950_search_args($matchpoints)
2595 This function returns an array reference that contains the search parameters to be
2596 passed to the Z39.50 search script (z3950_search.pl). The array elements
2597 are hash refs whose keys are name, value and encvalue, and whose values are the
2598 name of a search parameter, the value of that search parameter and the URL encoded
2599 value of that parameter.
2601 The search parameter names are lccn, isbn, issn, title, author, dewey and subject.
2603 The search parameter values are obtained from the bibliographic record whose
2604 data is in a hash reference in $matchpoints, as returned by Biblio::GetBiblioData().
2606 If $matchpoints is a scalar, it is assumed to be an unnamed query descriptor, e.g.
2607 a general purpose search argument. In this case, the returned array contains only
2608 one entry: its name is 'isbn' when $matchpoints is a valid ISBN and 'title' otherwise, and its value and encvalue are derived from $matchpoints.
2610 If a search parameter value is undefined or empty, it is not included in the returned
2613 The returned array reference may be passed directly to the template parameters.
2617 =item C<Output arg:>
2619 * $array containing hash refs as described above
2621 =item C<usage in the script:>
2625 $data = Biblio::GetBiblioData($bibno);
2626 $template->param ( MYLOOP => C4::Search::z3950_search_args($data) )
2630 $template->param ( MYLOOP => C4::Search::z3950_search_args($searchscalar) )
# Builds the parameter list handed to the Z39.50 search script.
#   $bibrec - either a hash reference of bibliographic data (keys such as
#             lccn, isbn, issn, title, author, dewey, subject) or a plain
#             scalar holding a free-form search term.
# A plain scalar is wrapped into a one-entry record: under the key 'isbn'
# when Business::ISBN accepts it as a valid ISBN, under 'title' otherwise.
# Returns a reference to an array of hash references, each with the keys
# name, value and encvalue (the URL-escaped value). Fields whose value is
# undefined or empty are left out, as the function's documentation states.
sub z3950_search_args {
    my $bibrec = shift;

    if ( !ref $bibrec ) {

        # Only a scalar can be an ISBN candidate; a record hash is never parsed.
        my $isbn = defined $bibrec ? Business::ISBN->new($bibrec) : undef;
        my $key  = ( defined $isbn && $isbn->is_valid ) ? 'isbn' : 'title';
        $bibrec = { $key => $bibrec };
    }

    my $array = [];
    for my $field (qw/ lccn isbn issn title author dewey subject /) {
        my $value = $bibrec->{$field};

        # Skip before escaping so that undef is never passed to uri_escape_utf8.
        next unless defined $value && length $value;

        push @$array,
          {
            name     => $field,
            value    => $value,
            encvalue => URI::Escape::uri_escape_utf8($value),
          };
    }
    return $array;
}
2654 =head2 BiblioAddAuthorities
2656 ( $countlinked, $countcreated ) = BiblioAddAuthorities($record, $frameworkcode);
2658 this function finds the authorities linked to the biblio
2659 * search in the authority DB for the same authid (in $9 of the biblio)
2660 * search in the authority DB for the same 001 (in $3 of the biblio in UNIMARC)
2661 * search in the authority DB for the same values (exactly) (in all subfields of the biblio)
2662 OR adds a new authority record
2668 * $record is the MARC record in question (marc blob)
2669 * $frameworkcode is the bibliographic framework to use (if it is "" it uses the default framework)
2671 =item C<Output arg:>
2673 * $countlinked is the number of authority records that were linked to this biblio
2677 * I had to add this to Search.pm (instead of the logical Biblio.pm) because of a circular dependency (this sub uses SimpleSearch, and Search.pm uses Biblio.pm)
2684 sub BiblioAddAuthorities{
# For every field of $record whose tag has an authority type configured in
# marc_subfield_structure for $frameworkcode, tries to add a $9 subfield that
# points at an authority record: the single match when the authority search
# returns exactly one hit, or (per the inline comments below) a freshly
# created authority when nothing matches.
# Returns the pair ($countlinked, $countcreated).
# NOTE(review): several original lines are not visible in this view (closing
# braces, the body of the error branch, the counter updates); the comments
# added here describe only the statements that are visible.
2685 my ( $record, $frameworkcode ) = @_;
2686 my $dbh=C4::Context->dbh;
# Select the (authtypecode, tagfield) pairs that have a non-empty authority type.
2687 my $query=$dbh->prepare(qq|
2688 SELECT authtypecode,tagfield
2689 FROM marc_subfield_structure
2690 WHERE frameworkcode=?
2691 AND (authtypecode IS NOT NULL AND authtypecode<>\"\")|);
2692 # SELECT authtypecode,tagfield
2693 # FROM marc_subfield_structure
2694 # WHERE frameworkcode=?
2695 # AND (authtypecode IS NOT NULL OR authtypecode<>\"\")|);
2696 $query->execute($frameworkcode);
2697 my ($countcreated,$countlinked);
2698 while (my $data=$query->fetchrow_hashref){
2699 foreach my $field ($record->field($data->{tagfield})){
# Fields that already carry a $3 or $9 subfield are left untouched.
2700 next if ($field->subfield('3')||$field->subfield('9'));
2701 # No authorities id in the tag.
2702 # Search if there is any authorities to link to.
# NOTE(review): this lexical $query shadows the statement handle of the same
# name declared above for the rest of the loop body.
2703 my $query='at='.$data->{authtypecode}.' ';
# Adds one 'he,ext' clause per subfield whose code matches /[A-z]/.
# NOTE(review): the range A-z also matches the ASCII characters between 'Z'
# and 'a' ([ \ ] ^ _ `); [A-Za-z] was presumably intended. The subfield value
# is interpolated between double quotes without any escaping.
2704 map {$query.= ' and he,ext="'.$_->[1].'"' if ($_->[0]=~/[A-z]/)} $field->subfields();
# Run the query against the authority server only.
2705 my ($error, $results, $total_hits)=SimpleSearch( $query, undef, undef, [ "authorityserver" ] );
2706 # there is only 1 result
# NOTE(review): the condition guarding this warning is not visible in this view.
2708 warn "BIBLIOADDSAUTHORITIES: $error";
# Exactly one hit: decode it and copy its 001 into a new $9 of the biblio field.
2711 if ( @{$results} == 1 ) {
2712 my $marcrecord = MARC::File::USMARC::decode($results->[0]);
2713 $field->add_subfields('9'=>$marcrecord->field('001')->data);
# Several hits: no visible statement links anything (the code below is commented out).
2715 } elsif ( @{$results} > 1 ) {
2716 #More than One result
2717 #This can comes out of a lack of a subfield.
2718 # my $marcrecord = MARC::File::USMARC::decode($results->[0]);
2719 # $record->field($data->{tagfield})->add_subfields('9'=>$marcrecord->field('001')->data);
2722 #There are no results, build authority record, add it to Authorities, get authid and add it to 9
2723 ###NOTICE : This is only valid if a subfield is linked to one and only one authtypecode
2724 ###NOTICE : This can be a problem. We should also look into other types and rejected forms.
# Skip the field when the authority type cannot be looked up.
2725 my $authtypedata=C4::AuthoritiesMarc::GetAuthType($data->{authtypecode});
2726 next unless $authtypedata;
2727 my $marcrecordauth=MARC::Record->new();
# The heading field uses the tag given by auth_tag_to_report; it starts with
# subfield a of the biblio field (stringified), then receives every other
# subfield whose code matches /[A-z]/ (same range caveat as above).
2728 my $authfield=MARC::Field->new($authtypedata->{auth_tag_to_report},'','',"a"=>"".$field->subfield('a'));
2729 map { $authfield->add_subfields($_->[0]=>$_->[1]) if ($_->[0]=~/[A-z]/ && $_->[0] ne "a" )} $field->subfields();
2730 $marcrecordauth->insert_fields_ordered($authfield);
2732 # bug 2317: ensure new authority knows it's using UTF-8; currently
2733 # only need to do this for MARC21, as MARC::Record->as_xml_record() handles
2734 # automatically for UNIMARC (by not transcoding)
2735 # FIXME: AddAuthority() instead should simply explicitly require that the MARC::Record
2736 # use UTF-8, but as of 2008-08-05, did not want to introduce that kind
2737 # of change to a core API just before the 3.0 release.
2738 if (C4::Context->preference('marcflavour') eq 'MARC21') {
2739 SetMarcUnicodeFlag($marcrecordauth, 'MARC21');
2742 # warn "AUTH RECORD ADDED : ".$marcrecordauth->as_formatted;
# Store the new authority and put the returned id into $9 of the biblio field.
2744 my $authid=AddAuthority($marcrecordauth,'',$data->{authtypecode});
2746 $field->add_subfields('9'=>$authid);
# NOTE(review): the statements that update these two counters are not visible
# in this view; both are declared without an initial value.
2750 return ($countlinked,$countcreated);
2753 =head2 GetDistinctValues($field);
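2755 C<$fieldname> is either a C<table.column> name, whose distinct values and their counts are read from the database, or a search index name that is looked up on the biblio and authority Zebra servers. The optional C<$string> restricts the values to those starting with it.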
2759 sub GetDistinctValues {
# Collects the distinct values of a field together with their counts, as
# hashes with the keys 'value' and 'cnt'.
#   $fieldname - "table.column" selects the database path; the remaining
#                visible code builds a Zebra query from it instead
#   $string    - optional prefix (database path) / term (Zebra query)
# NOTE(review): several original lines are not visible in this view (the
# execute call, the return statements, the branch separating the two paths);
# the comments added here describe only the statements that are visible.
2760 my ($fieldname,$string)=@_;
2761 # returns a reference to a hash of references to branches...
# NOTE(review): the comment above does not match the visible code, which
# works with arrays of {value, cnt} hashes.
2762 if ($fieldname=~/\./){
# Split "table.column" into its two parts.
2763 my ($table,$column)=split /\./, $fieldname;
2764 my $dbh = C4::Context->dbh;
# NOTE(review): this debug message ("group by lib", no LIKE filter) differs
# from the statement that is actually prepared on the next line.
2765 warn "select DISTINCT($column) as value, count(*) as cnt from $table group by lib order by $column " if $DEBUG;
# NOTE(review): $table, $column and $string are interpolated directly into
# the SQL text (no placeholders), so they must come from trusted input. When
# $string is set there is no space between the closing quote of the LIKE
# pattern and "group by".
2766 my $sth = $dbh->prepare("select DISTINCT($column) as value, count(*) as cnt from $table ".($string?" where $column like \"$string%\"":"")."group by value order by $column ");
# Every row is fetched as a hash keyed by the column aliases value and cnt.
2768 my $elements=$sth->fetchall_arrayref({});
# Zebra path: one connection per server name, and a CCL query made of
# "$fieldname $string" converted to RPN for that connection.
2773 my @servers=qw<biblioserver authorityserver>;
2774 my (@zconns,@results);
2775 for ( my $i = 0 ; $i < @servers ; $i++ ) {
2776 $zconns[$i] = C4::Context->Zconn( $servers[$i], 1 );
2779 ZOOM::Query::CCL2RPN->new( qq"$fieldname $string", $zconns[$i])
2782 # The big moment: asynchronously retrieve results from all servers
# ZOOM::event returns the 1-based index of the connection that has an event
# (hence the "$i - 1" subscripts); the loop stops when it returns 0.
2784 while ( ( my $i = ZOOM::event( \@zconns ) ) != 0 ) {
2785 my $ev = $zconns[ $i - 1 ]->last_event();
# Only the ZEND event of a connection that has a result object is processed.
2786 if ( $ev == ZOOM::Event::ZEND ) {
2787 next unless $results[ $i - 1 ];
2788 my $size = $results[ $i - 1 ]->size();
# Each term is stored as a {value, cnt} hash taken from display_term($j).
2790 for (my $j=0;$j<$size;$j++){
2792 @hashscan{qw(value cnt)}=$results[ $i - 1 ]->display_term($j);
2793 push @elements, \%hashscan;
# Empty END block: no clean-up code is run for this module.
2803 END { } # module clean-up code here (global destructor)
2810 Koha Development Team <http://koha-community.org/>