3 # This file is part of Koha.
5 # Koha is free software; you can redistribute it and/or modify it under the
6 # terms of the GNU General Public License as published by the Free Software
7 # Foundation; either version 2 of the License, or (at your option) any later
10 # Koha is distributed in the hope that it will be useful, but WITHOUT ANY
11 # WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR
12 # A PARTICULAR PURPOSE. See the GNU General Public License for more details.
14 # You should have received a copy of the GNU General Public License along with
15 # Koha; if not, write to the Free Software Foundation, Inc., 59 Temple Place,
16 # Suite 330, Boston, MA 02111-1307 USA
19 # use warnings; # FIXME
22 use C4::Biblio; # GetMarcFromKohaField
23 use C4::Koha; # getFacets
25 use C4::Search::PazPar2;
27 use C4::Dates qw(format_date);
31 use vars qw($VERSION @ISA @EXPORT @EXPORT_OK %EXPORT_TAGS $DEBUG);
33 # set the version for version checking
36 $DEBUG = ($ENV{DEBUG}) ? 1 : 0;
41 C4::Search - Functions for searching the Koha catalog.
45 See opac/opac-search.pl or catalogue/search.pl for example of usage
49 This module provides searching functions for Koha's bibliographic databases
67 # make all your functions, whether exported or not;
69 =head2 findseealso($dbh,$fields);
71 C<$dbh> is a link to the DB handler.
74 my $dbh =C4::Context->dbh;
76 C<$fields> is a reference to the fields array
78 This function modifies the @$fields array and adds related fields to search on.
80 FIXME: this function is probably deprecated in Koha 3
85 my ( $dbh, $fields ) = @_;
86 my $tagslib = GetMarcStructure(1);
87 for ( my $i = 0 ; $i <= $#{$fields} ; $i++ ) {
88 my ($tag) = substr( @$fields[$i], 1, 3 );
89 my ($subfield) = substr( @$fields[$i], 4, 1 );
90 @$fields[$i] .= ',' . $tagslib->{$tag}->{$subfield}->{seealso}
91 if ( $tagslib->{$tag}->{$subfield}->{seealso} );
97 ($biblionumber,$biblionumber,$title) = FindDuplicate($record);
99 This function attempts to find duplicate records using a hard-coded, fairly simplistic algorithm
105 my $dbh = C4::Context->dbh;
106 my $result = TransformMarcToKoha( $dbh, $record, '' );
111 my ( $biblionumber, $title );
113 # search duplicate on ISBN, easy and fast..
114 # ... normalize first
115 if ( $result->{isbn} ) {
116 $result->{isbn} =~ s/\(.*$//;
117 $result->{isbn} =~ s/\s+$//;
118 $query = "isbn=$result->{isbn}";
121 $result->{title} =~ s /\\//g;
122 $result->{title} =~ s /\"//g;
123 $result->{title} =~ s /\(//g;
124 $result->{title} =~ s /\)//g;
126 # FIXME: instead of removing operators, could just do
127 # quotes around the value
128 $result->{title} =~ s/(and|or|not)//g;
129 $query = "ti,ext=$result->{title}";
130 $query .= " and itemtype=$result->{itemtype}"
131 if ( $result->{itemtype} );
132 if ( $result->{author} ) {
133 $result->{author} =~ s /\\//g;
134 $result->{author} =~ s /\"//g;
135 $result->{author} =~ s /\(//g;
136 $result->{author} =~ s /\)//g;
138 # remove valid operators
139 $result->{author} =~ s/(and|or|not)//g;
140 $query .= " and au,ext=$result->{author}";
144 # FIXME: add error handling
145 my ( $error, $searchresults ) = SimpleSearch($query); # FIXME :: hardcoded !
147 foreach my $possible_duplicate_record (@$searchresults) {
149 MARC::Record->new_from_usmarc($possible_duplicate_record);
150 my $result = TransformMarcToKoha( $dbh, $marcrecord, '' );
152 # FIXME :: why 2 $biblionumber ?
154 push @results, $result->{'biblionumber'};
155 push @results, $result->{'title'};
163 ( $error, $results, $total_hits ) = SimpleSearch( $query, $offset, $max_results, [@servers] );
165 This function provides a simple search API on the bibliographic catalog
171 * $query can be a simple keyword or a complete CCL query
172 * @servers is optional. Defaults to biblioserver as found in koha-conf.xml
173 * $offset - If present, represents the number of records at the beggining to omit. Defaults to 0
174 * $max_results - if present, determines the maximum number of records to fetch. undef is All. defaults to undef.
179 * $error is a empty unless an error is detected
180 * \@results is an array of records.
181 * $total_hits is the number of hits that would have been returned with no limit
183 =item C<usage in the script:>
187 my ( $error, $marcresults, $total_hits ) = SimpleSearch($query);
189 if (defined $error) {
190 $template->param(query_error => $error);
191 warn "error: ".$error;
192 output_html_with_http_headers $input, $cookie, $template->output;
196 my $hits = scalar @$marcresults;
199 for my $i (0..$hits) {
201 my $marcrecord = MARC::File::USMARC::decode($marcresults->[$i]);
202 my $biblio = TransformMarcToKoha(C4::Context->dbh,$marcrecord,'');
204 #build the hash for the template.
205 $resultsloop{highlight} = ($i % 2)?(1):(0);
206 $resultsloop{title} = $biblio->{'title'};
207 $resultsloop{subtitle} = $biblio->{'subtitle'};
208 $resultsloop{biblionumber} = $biblio->{'biblionumber'};
209 $resultsloop{author} = $biblio->{'author'};
210 $resultsloop{publishercode} = $biblio->{'publishercode'};
211 $resultsloop{publicationyear} = $biblio->{'publicationyear'};
213 push @results, \%resultsloop;
216 $template->param(result=>\@results);
221 my ( $query, $offset, $max_results, $servers ) = @_;
223 if ( C4::Context->preference('NoZebra') ) {
224 my $result = NZorder( NZanalyse($query) )->{'biblioserver'};
227 && $result->{hits} > 0 ? $result->{'RECORDS'} : [] );
228 return ( undef, $search_result, scalar($search_result) );
231 # FIXME hardcoded value. See catalog/search.pl & opac-search.pl too.
232 my @servers = defined ( $servers ) ? @$servers : ( "biblioserver" );
238 return ( "No query entered", undef, undef ) unless $query;
240 # Initialize & Search Zebra
241 for ( my $i = 0 ; $i < @servers ; $i++ ) {
243 $zconns[$i] = C4::Context->Zconn( $servers[$i], 1 );
244 $zoom_queries[$i] = new ZOOM::Query::CCL2RPN( $query, $zconns[$i]);
245 $tmpresults[$i] = $zconns[$i]->search( $zoom_queries[$i] );
249 $zconns[$i]->errmsg() . " ("
250 . $zconns[$i]->errcode() . ") "
251 . $zconns[$i]->addinfo() . " "
252 . $zconns[$i]->diagset();
254 return ( $error, undef, undef ) if $zconns[$i]->errcode();
258 # caught a ZOOM::Exception
262 . $@->addinfo() . " "
265 return ( $error, undef, undef );
268 while ( ( my $i = ZOOM::event( \@zconns ) ) != 0 ) {
269 my $event = $zconns[ $i - 1 ]->last_event();
270 if ( $event == ZOOM::Event::ZEND ) {
272 my $first_record = defined( $offset ) ? $offset+1 : 1;
273 my $hits = $tmpresults[ $i - 1 ]->size();
274 $total_hits += $hits;
275 my $last_record = $hits;
276 if ( defined $max_results && $offset + $max_results < $hits ) {
277 $last_record = $offset + $max_results;
280 for my $j ( $first_record..$last_record ) {
281 my $record = $tmpresults[ $i - 1 ]->record( $j-1 )->raw(); # 0 indexed
282 push @results, $record;
287 foreach my $result (@tmpresults) {
290 foreach my $zoom_query (@zoom_queries) {
291 $zoom_query->destroy();
294 return ( undef, \@results, $total_hits );
300 ( undef, $results_hashref, \@facets_loop ) = getRecords (
302 $koha_query, $simple_query, $sort_by_ref, $servers_ref,
303 $results_per_page, $offset, $expanded_facet, $branches,
307 The all singing, all dancing, multi-server, asynchronous, scanning,
308 searching, record nabbing, facet-building
310 See verbse embedded documentation.
316 $koha_query, $simple_query, $sort_by_ref, $servers_ref,
317 $results_per_page, $offset, $expanded_facet, $branches,
321 my @servers = @$servers_ref;
322 my @sort_by = @$sort_by_ref;
324 # Initialize variables for the ZOOM connection and results object
328 my $results_hashref = ();
330 # Initialize variables for the faceted results objects
331 my $facets_counter = ();
332 my $facets_info = ();
333 my $facets = getFacets();
336 ; # stores the ref to array of hashes for template facets loop
338 ### LOOP THROUGH THE SERVERS
339 for ( my $i = 0 ; $i < @servers ; $i++ ) {
340 $zconns[$i] = C4::Context->Zconn( $servers[$i], 1 );
342 # perform the search, create the results objects
343 # if this is a local search, use the $koha-query, if it's a federated one, use the federated-query
344 my $query_to_use = ($servers[$i] =~ /biblioserver/) ? $koha_query : $simple_query;
346 #$query_to_use = $simple_query if $scan;
347 warn $simple_query if ( $scan and $DEBUG );
349 # Check if we've got a query_type defined, if so, use it
353 if ( $query_type =~ /^ccl/ ) {
355 s/\:/\=/g; # change : to = last minute (FIXME)
358 new ZOOM::Query::CCL2RPN( $query_to_use, $zconns[$i] )
361 elsif ( $query_type =~ /^cql/ ) {
364 new ZOOM::Query::CQL( $query_to_use, $zconns[$i] ) );
366 elsif ( $query_type =~ /^pqf/ ) {
369 new ZOOM::Query::PQF( $query_to_use, $zconns[$i] ) );
376 new ZOOM::Query::CCL2RPN( $query_to_use, $zconns[$i] )
382 new ZOOM::Query::CCL2RPN( $query_to_use, $zconns[$i] )
388 warn "WARNING: query problem with $query_to_use " . $@;
391 # Concatenate the sort_by limits and pass them to the results object
392 # Note: sort will override rank
394 foreach my $sort (@sort_by) {
395 if ( $sort eq "author_az" ) {
396 $sort_by .= "1=1003 <i ";
398 elsif ( $sort eq "author_za" ) {
399 $sort_by .= "1=1003 >i ";
401 elsif ( $sort eq "popularity_asc" ) {
402 $sort_by .= "1=9003 <i ";
404 elsif ( $sort eq "popularity_dsc" ) {
405 $sort_by .= "1=9003 >i ";
407 elsif ( $sort eq "call_number_asc" ) {
408 $sort_by .= "1=20 <i ";
410 elsif ( $sort eq "call_number_dsc" ) {
411 $sort_by .= "1=20 >i ";
413 elsif ( $sort eq "pubdate_asc" ) {
414 $sort_by .= "1=31 <i ";
416 elsif ( $sort eq "pubdate_dsc" ) {
417 $sort_by .= "1=31 >i ";
419 elsif ( $sort eq "acqdate_asc" ) {
420 $sort_by .= "1=32 <i ";
422 elsif ( $sort eq "acqdate_dsc" ) {
423 $sort_by .= "1=32 >i ";
425 elsif ( $sort eq "title_az" ) {
426 $sort_by .= "1=4 <i ";
428 elsif ( $sort eq "title_za" ) {
429 $sort_by .= "1=4 >i ";
433 if ( $results[$i]->sort( "yaz", $sort_by ) < 0 ) {
434 warn "WARNING sort $sort_by failed";
437 } # finished looping through servers
439 # The big moment: asynchronously retrieve results from all servers
440 while ( ( my $i = ZOOM::event( \@zconns ) ) != 0 ) {
441 my $ev = $zconns[ $i - 1 ]->last_event();
442 if ( $ev == ZOOM::Event::ZEND ) {
443 next unless $results[ $i - 1 ];
444 my $size = $results[ $i - 1 ]->size();
448 # loop through the results
449 $results_hash->{'hits'} = $size;
451 if ( $offset + $results_per_page <= $size ) {
452 $times = $offset + $results_per_page;
457 for ( my $j = $offset ; $j < $times ; $j++ ) {
462 ## Check if it's an index scan
464 my ( $term, $occ ) = $results[ $i - 1 ]->term($j);
466 # here we create a minimal MARC record and hand it off to the
467 # template just like a normal result ... perhaps not ideal, but
469 my $tmprecord = MARC::Record->new();
470 $tmprecord->encoding('UTF-8');
474 # the minimal record in author/title (depending on MARC flavour)
475 if (C4::Context->preference("marcflavour") eq "UNIMARC") {
476 $tmptitle = MARC::Field->new('200',' ',' ', a => $term, f => $occ);
477 $tmprecord->append_fields($tmptitle);
479 $tmptitle = MARC::Field->new('245',' ',' ', a => $term,);
480 $tmpauthor = MARC::Field->new('100',' ',' ', a => $occ,);
481 $tmprecord->append_fields($tmptitle);
482 $tmprecord->append_fields($tmpauthor);
484 $results_hash->{'RECORDS'}[$j] = $tmprecord->as_usmarc();
489 $record = $results[ $i - 1 ]->record($j)->raw();
491 # warn "RECORD $j:".$record;
492 $results_hash->{'RECORDS'}[$j] = $record;
494 # Fill the facets while we're looping, but only for the biblioserver
495 $facet_record = MARC::Record->new_from_usmarc($record)
496 if $servers[ $i - 1 ] =~ /biblioserver/;
498 #warn $servers[$i-1]."\n".$record; #.$facet_record->title();
500 for ( my $k = 0 ; $k <= @$facets ; $k++ ) {
502 if ( $facets->[$k] ) {
504 for my $tag ( @{ $facets->[$k]->{'tags'} } )
507 $facet_record->field($tag);
509 for my $field (@fields) {
510 my @subfields = $field->subfields();
511 for my $subfield (@subfields) {
512 my ( $code, $data ) = @$subfield;
514 $facets->[$k]->{'subfield'} )
516 $facets_counter->{ $facets->[$k]
522 $facets_info->{ $facets->[$k]
523 ->{'link_value'} }->{'label_value'} =
524 $facets->[$k]->{'label_value'};
525 $facets_info->{ $facets->[$k]
526 ->{'link_value'} }->{'expanded'} =
527 $facets->[$k]->{'expanded'};
533 $results_hashref->{ $servers[ $i - 1 ] } = $results_hash;
536 # warn "connection ", $i-1, ": $size hits";
537 # warn $results[$i-1]->record(0)->render() if $size > 0;
540 if ( $servers[ $i - 1 ] =~ /biblioserver/ ) {
542 sort { $facets_counter->{$b} <=> $facets_counter->{$a} }
543 keys %$facets_counter )
546 my $number_of_facets;
547 my @this_facets_array;
550 $facets_counter->{$link_value}
551 ->{$b} <=> $facets_counter->{$link_value}->{$a}
552 } keys %{ $facets_counter->{$link_value} }
556 if ( ( $number_of_facets < 6 )
557 || ( $expanded_facet eq $link_value )
558 || ( $facets_info->{$link_value}->{'expanded'} ) )
561 # Sanitize the link value ), ( will cause errors with CCL,
562 my $facet_link_value = $one_facet;
563 $facet_link_value =~ s/(\(|\))/ /g;
565 # fix the length that will display in the label,
566 my $facet_label_value = $one_facet;
568 substr( $one_facet, 0, 20 ) . "..."
569 unless length($facet_label_value) <= 20;
571 # if it's a branch, label by the name, not the code,
572 if ( $link_value =~ /branch/ ) {
574 $branches->{$one_facet}->{'branchname'};
577 # but we're down with the whole label being in the link's title.
578 my $facet_title_value = $one_facet;
580 push @this_facets_array,
584 $facets_counter->{$link_value}
586 facet_label_value => $facet_label_value,
587 facet_title_value => $facet_title_value,
588 facet_link_value => $facet_link_value,
589 type_link_value => $link_value,
595 # handle expanded option
596 unless ( $facets_info->{$link_value}->{'expanded'} ) {
598 if ( ( $number_of_facets > 6 )
599 && ( $expanded_facet ne $link_value ) );
604 type_link_value => $link_value,
605 type_id => $link_value . "_id",
606 "type_label_" . $facets_info->{$link_value}->{'label_value'} => 1,
607 facets => \@this_facets_array,
608 expandable => $expandable,
609 expand => $link_value,
611 ) unless ( ($facets_info->{$link_value}->{'label_value'} =~ /Libraries/) and (C4::Context->preference('singleBranchMode')) );
616 return ( undef, $results_hashref, \@facets_loop );
621 $koha_query, $simple_query, $sort_by_ref, $servers_ref,
622 $results_per_page, $offset, $expanded_facet, $branches,
626 my $paz = C4::Search::PazPar2->new(C4::Context->config('pazpar2url'));
628 $paz->search($simple_query);
632 my $results_hashref = {};
633 my $stats = XMLin($paz->stat);
634 my $results = XMLin($paz->show($offset, $results_per_page, 'work-title:1'), forcearray => 1);
636 # for a grouped search result, the number of hits
637 # is the number of groups returned; 'bib_hits' will have
638 # the total number of bibs.
639 $results_hashref->{'biblioserver'}->{'hits'} = $results->{'merged'}->[0];
640 $results_hashref->{'biblioserver'}->{'bib_hits'} = $stats->{'hits'};
642 HIT: foreach my $hit (@{ $results->{'hit'} }) {
643 my $recid = $hit->{recid}->[0];
645 my $work_title = $hit->{'md-work-title'}->[0];
647 if (exists $hit->{'md-work-author'}) {
648 $work_author = $hit->{'md-work-author'}->[0];
650 my $group_label = (defined $work_author) ? "$work_title / $work_author" : $work_title;
652 my $result_group = {};
653 $result_group->{'group_label'} = $group_label;
654 $result_group->{'group_merge_key'} = $recid;
657 if (exists $hit->{count}) {
658 $count = $hit->{count}->[0];
660 $result_group->{'group_count'} = $count;
662 for (my $i = 0; $i < $count; $i++) {
663 # FIXME -- may need to worry about diacritics here
664 my $rec = $paz->record($recid, $i);
665 push @{ $result_group->{'RECORDS'} }, $rec;
668 push @{ $results_hashref->{'biblioserver'}->{'GROUPS'} }, $result_group;
671 # pass through facets
672 my $termlist_xml = $paz->termlist('author,subject');
673 my $terms = XMLin($termlist_xml, forcearray => 1);
674 my @facets_loop = ();
675 #die Dumper($results);
676 # foreach my $list (sort keys %{ $terms->{'list'} }) {
678 # foreach my $facet (sort @{ $terms->{'list'}->{$list}->{'term'} } ) {
680 # facet_label_value => $facet->{'name'}->[0],
683 # push @facets_loop, ( {
684 # type_label => $list,
685 # facets => \@facets,
689 return ( undef, $results_hashref, \@facets_loop );
693 sub _remove_stopwords {
694 my ( $operand, $index ) = @_;
695 my @stopwords_removed;
697 # phrase and exact-qualified indexes shouldn't have stopwords removed
698 if ( $index !~ m/phr|ext/ ) {
700 # remove stopwords from operand : parse all stopwords & remove them (case insensitive)
701 # we use IsAlpha unicode definition, to deal correctly with diacritics.
702 # otherwise, a French word like "leçon" woudl be split into "le" "çon", "le"
703 # is a stopword, we'd get "çon" and wouldn't find anything...
704 foreach ( keys %{ C4::Context->stopwords } ) {
705 next if ( $_ =~ /(and|or|not)/ ); # don't remove operators
707 /(\P{IsAlpha}$_\P{IsAlpha}|^$_\P{IsAlpha}|\P{IsAlpha}$_$|^$_$)/ )
709 $operand =~ s/\P{IsAlpha}$_\P{IsAlpha}/ /gi;
710 $operand =~ s/^$_\P{IsAlpha}/ /gi;
711 $operand =~ s/\P{IsAlpha}$_$/ /gi;
712 $operand =~ s/$1//gi;
713 push @stopwords_removed, $_;
717 return ( $operand, \@stopwords_removed );
721 sub _detect_truncation {
722 my ( $operand, $index ) = @_;
723 my ( @nontruncated, @righttruncated, @lefttruncated, @rightlefttruncated,
726 my @wordlist = split( /\s/, $operand );
727 foreach my $word (@wordlist) {
728 if ( $word =~ s/^\*([^\*]+)\*$/$1/ ) {
729 push @rightlefttruncated, $word;
731 elsif ( $word =~ s/^\*([^\*]+)$/$1/ ) {
732 push @lefttruncated, $word;
734 elsif ( $word =~ s/^([^\*]+)\*$/$1/ ) {
735 push @righttruncated, $word;
737 elsif ( index( $word, "*" ) < 0 ) {
738 push @nontruncated, $word;
741 push @regexpr, $word;
745 \@nontruncated, \@righttruncated, \@lefttruncated,
746 \@rightlefttruncated, \@regexpr
751 sub _build_stemmed_operand {
755 # If operand contains a digit, it is almost certainly an identifier, and should
756 # not be stemmed. This is particularly relevant for ISBNs and ISSNs, which
757 # can contain the letter "X" - for example, _build_stemmend_operand would reduce
758 # "014100018X" to "x ", which for a MARC21 database would bring up irrelevant
759 # results (e.g., "23 x 29 cm." from the 300$c). Bug 2098.
760 return $operand if $operand =~ /\d/;
762 # FIXME: the locale should be set based on the user's language and/or search choice
763 my $stemmer = Lingua::Stem->new( -locale => 'EN-US' );
765 # FIXME: these should be stored in the db so the librarian can modify the behavior
766 $stemmer->add_exceptions(
773 my @words = split( / /, $operand );
774 my $stems = $stemmer->stem(@words);
775 for my $stem (@$stems) {
776 $stemmed_operand .= "$stem";
777 $stemmed_operand .= "?"
778 unless ( $stem =~ /(and$|or$|not$)/ ) || ( length($stem) < 3 );
779 $stemmed_operand .= " ";
781 warn "STEMMED OPERAND: $stemmed_operand" if $DEBUG;
782 return $stemmed_operand;
786 sub _build_weighted_query {
788 # FIELD WEIGHTING - This is largely experimental stuff. What I'm committing works
789 # pretty well but could work much better if we had a smarter query parser
790 my ( $operand, $stemmed_operand, $index ) = @_;
791 my $stemming = C4::Context->preference("QueryStemming") || 0;
792 my $weight_fields = C4::Context->preference("QueryWeightFields") || 0;
793 my $fuzzy_enabled = C4::Context->preference("QueryFuzzy") || 0;
795 my $weighted_query .= "(rk=("; # Specifies that we're applying rank
797 # Keyword, or, no index specified
798 if ( ( $index eq 'kw' ) || ( !$index ) ) {
800 "Title-cover,ext,r1=\"$operand\""; # exact title-cover
801 $weighted_query .= " or ti,ext,r2=\"$operand\""; # exact title
802 $weighted_query .= " or ti,phr,r3=\"$operand\""; # phrase title
803 #$weighted_query .= " or any,ext,r4=$operand"; # exact any
804 #$weighted_query .=" or kw,wrdl,r5=\"$operand\""; # word list any
805 $weighted_query .= " or wrdl,fuzzy,r8=\"$operand\""
806 if $fuzzy_enabled; # add fuzzy, word list
807 $weighted_query .= " or wrdl,right-Truncation,r9=\"$stemmed_operand\""
808 if ( $stemming and $stemmed_operand )
809 ; # add stemming, right truncation
810 $weighted_query .= " or wrdl,r9=\"$operand\"";
812 # embedded sorting: 0 a-z; 1 z-a
813 # $weighted_query .= ") or (sort1,aut=1";
816 # Barcode searches should skip this process
817 elsif ( $index eq 'bc' ) {
818 $weighted_query .= "bc=\"$operand\"";
821 # Authority-number searches should skip this process
822 elsif ( $index eq 'an' ) {
823 $weighted_query .= "an=\"$operand\"";
826 # If the index already has more than one qualifier, wrap the operand
827 # in quotes and pass it back (assumption is that the user knows what they
828 # are doing and won't appreciate us mucking up their query
829 elsif ( $index =~ ',' ) {
830 $weighted_query .= " $index=\"$operand\"";
833 #TODO: build better cases based on specific search indexes
835 $weighted_query .= " $index,ext,r1=\"$operand\""; # exact index
836 #$weighted_query .= " or (title-sort-az=0 or $index,startswithnt,st-word,r3=$operand #)";
837 $weighted_query .= " or $index,phr,r3=\"$operand\""; # phrase index
839 " or $index,rt,wrdl,r3=\"$operand\""; # word list index
842 $weighted_query .= "))"; # close rank specification
843 return $weighted_query;
849 $simple_query, $query_cgi,
851 $limit_cgi, $limit_desc,
852 $stopwords_removed, $query_type ) = getRecords ( $operators, $operands, $indexes, $limits, $sort_by, $scan);
854 Build queries and limits in CCL, CGI, Human,
855 handle truncation, stemming, field weighting, stopwords, fuzziness, etc.
857 See verbose embedded documentation.
863 my ( $operators, $operands, $indexes, $limits, $sort_by, $scan ) = @_;
865 warn "---------\nEnter buildQuery\n---------" if $DEBUG;
868 my @operators = @$operators if $operators;
869 my @indexes = @$indexes if $indexes;
870 my @operands = @$operands if $operands;
871 my @limits = @$limits if $limits;
872 my @sort_by = @$sort_by if $sort_by;
874 my $stemming = C4::Context->preference("QueryStemming") || 0;
875 my $auto_truncation = C4::Context->preference("QueryAutoTruncate") || 0;
876 my $weight_fields = C4::Context->preference("QueryWeightFields") || 0;
877 my $fuzzy_enabled = C4::Context->preference("QueryFuzzy") || 0;
878 my $remove_stopwords = C4::Context->preference("QueryRemoveStopwords") || 0;
880 # no stemming/weight/fuzzy in NoZebra
881 if ( C4::Context->preference("NoZebra") ) {
887 my $query = $operands[0];
888 my $simple_query = $operands[0];
890 # initialize the variables we're passing back
899 my $stopwords_removed; # flag to determine if stopwords have been removed
901 # for handling ccl, cql, pqf queries in diagnostic mode, skip the rest of the steps
903 if ( $query =~ /^ccl=/ ) {
904 return ( undef, $', $', $', $', '', '', '', '', 'ccl' );
906 if ( $query =~ /^cql=/ ) {
907 return ( undef, $', $', $', $', '', '', '', '', 'cql' );
909 if ( $query =~ /^pqf=/ ) {
910 return ( undef, $', $', $', $', '', '', '', '', 'pqf' );
913 # pass nested queries directly
914 # FIXME: need better handling of some of these variables in this case
915 if ( $query =~ /(\(|\))/ ) {
917 undef, $query, $simple_query, $query_cgi,
918 $query, $limit, $limit_cgi, $limit_desc,
919 $stopwords_removed, 'ccl'
923 # Form-based queries are non-nested and fixed depth, so we can easily modify the incoming
924 # query operands and indexes and add stemming, truncation, field weighting, etc.
925 # Once we do so, we'll end up with a value in $query, just like if we had an
926 # incoming $query from the user
929 ; # clear it out so we can populate properly with field-weighted, stemmed, etc. query
931 ; # a flag used to keep track if there was a previous query
932 # if there was, we can apply the current operator
934 for ( my $i = 0 ; $i <= @operands ; $i++ ) {
936 # COMBINE OPERANDS, INDEXES AND OPERATORS
937 if ( $operands[$i] ) {
939 # A flag to determine whether or not to add the index to the query
942 # If the user is sophisticated enough to specify an index, turn off field weighting, stemming, and stopword handling
943 if ( $operands[$i] =~ /(:|=)/ || $scan ) {
946 $remove_stopwords = 0;
948 my $operand = $operands[$i];
949 my $index = $indexes[$i];
951 # Add index-specific attributes
952 # Date of Publication
953 if ( $index eq 'yr' ) {
954 $index .= ",st-numeric";
956 $stemming = $auto_truncation = $weight_fields = $fuzzy_enabled = $remove_stopwords = 0;
959 # Date of Acquisition
960 elsif ( $index eq 'acqdate' ) {
961 $index .= ",st-date-normalized";
963 $stemming = $auto_truncation = $weight_fields = $fuzzy_enabled = $remove_stopwords = 0;
965 # ISBN,ISSN,Standard Number, don't need special treatment
966 elsif ( $index eq 'nb' || $index eq 'ns' ) {
969 $stemming, $auto_truncation,
970 $weight_fields, $fuzzy_enabled,
972 ) = ( 0, 0, 0, 0, 0 );
975 # Set default structure attribute (word list)
977 unless ( $indexes_set || !$index || $index =~ /(st-|phr|ext|wrdl)/ ) {
978 $struct_attr = ",wrdl";
981 # Some helpful index variants
982 my $index_plus = $index . $struct_attr . ":" if $index;
983 my $index_plus_comma = $index . $struct_attr . "," if $index;
986 if ($remove_stopwords) {
987 ( $operand, $stopwords_removed ) =
988 _remove_stopwords( $operand, $index );
989 warn "OPERAND w/out STOPWORDS: >$operand<" if $DEBUG;
990 warn "REMOVED STOPWORDS: @$stopwords_removed"
991 if ( $stopwords_removed && $DEBUG );
995 my $truncated_operand;
996 my( $nontruncated, $righttruncated, $lefttruncated,
997 $rightlefttruncated, $regexpr
998 ) = _detect_truncation( $operand, $index );
1000 "TRUNCATION: NON:>@$nontruncated< RIGHT:>@$righttruncated< LEFT:>@$lefttruncated< RIGHTLEFT:>@$rightlefttruncated< REGEX:>@$regexpr<"
1005 scalar(@$righttruncated) + scalar(@$lefttruncated) +
1006 scalar(@$rightlefttruncated) > 0 )
1009 # Don't field weight or add the index to the query, we do it here
1011 undef $weight_fields;
1012 my $previous_truncation_operand;
1013 if ( scalar(@$nontruncated) > 0 ) {
1014 $truncated_operand .= "$index_plus @$nontruncated ";
1015 $previous_truncation_operand = 1;
1017 if ( scalar(@$righttruncated) > 0 ) {
1018 $truncated_operand .= "and "
1019 if $previous_truncation_operand;
1020 $truncated_operand .=
1021 "$index_plus_comma" . "rtrn:@$righttruncated ";
1022 $previous_truncation_operand = 1;
1024 if ( scalar(@$lefttruncated) > 0 ) {
1025 $truncated_operand .= "and "
1026 if $previous_truncation_operand;
1027 $truncated_operand .=
1028 "$index_plus_comma" . "ltrn:@$lefttruncated ";
1029 $previous_truncation_operand = 1;
1031 if ( scalar(@$rightlefttruncated) > 0 ) {
1032 $truncated_operand .= "and "
1033 if $previous_truncation_operand;
1034 $truncated_operand .=
1035 "$index_plus_comma" . "rltrn:@$rightlefttruncated ";
1036 $previous_truncation_operand = 1;
1039 $operand = $truncated_operand if $truncated_operand;
1040 warn "TRUNCATED OPERAND: >$truncated_operand<" if $DEBUG;
1043 my $stemmed_operand;
1044 $stemmed_operand = _build_stemmed_operand($operand)
1046 warn "STEMMED OPERAND: >$stemmed_operand<" if $DEBUG;
1048 # Handle Field Weighting
1049 my $weighted_operand;
1051 _build_weighted_query( $operand, $stemmed_operand, $index )
1053 warn "FIELD WEIGHTED OPERAND: >$weighted_operand<" if $DEBUG;
1054 $operand = $weighted_operand if $weight_fields;
1055 $indexes_set = 1 if $weight_fields;
1057 # If there's a previous operand, we need to add an operator
1058 if ($previous_operand) {
1060 # User-specified operator
1061 if ( $operators[ $i - 1 ] ) {
1062 $query .= " $operators[$i-1] ";
1063 $query .= " $index_plus " unless $indexes_set;
1064 $query .= " $operand";
1065 $query_cgi .= "&op=$operators[$i-1]";
1066 $query_cgi .= "&idx=$index" if $index;
1067 $query_cgi .= "&q=$operands[$i]" if $operands[$i];
1069 " $operators[$i-1] $index_plus $operands[$i]";
1072 # Default operator is and
1075 $query .= "$index_plus " unless $indexes_set;
1076 $query .= "$operand";
1077 $query_cgi .= "&op=and&idx=$index" if $index;
1078 $query_cgi .= "&q=$operands[$i]" if $operands[$i];
1079 $query_desc .= " and $index_plus $operands[$i]";
1083 # There isn't a pervious operand, don't need an operator
1086 # Field-weighted queries already have indexes set
1087 $query .= " $index_plus " unless $indexes_set;
1089 $query_desc .= " $index_plus $operands[$i]";
1090 $query_cgi .= "&idx=$index" if $index;
1091 $query_cgi .= "&q=$operands[$i]" if $operands[$i];
1092 $previous_operand = 1;
1097 warn "QUERY BEFORE LIMITS: >$query<" if $DEBUG;
1100 my $group_OR_limits;
1101 my $availability_limit;
1102 foreach my $this_limit (@limits) {
1103 if ( $this_limit =~ /available/ ) {
1105 # 'available' is defined as (items.onloan is NULL) and (items.itemlost = 0)
1107 # all records not indexed in the onloan register (zebra) and all records with a value of lost equal to 0
1108 $availability_limit .=
1109 "( ( allrecords,AlwaysMatches='' not onloan,AlwaysMatches='') and (lost,st-numeric=0) )"; #or ( allrecords,AlwaysMatches='' not lost,AlwaysMatches='')) )";
1110 $limit_cgi .= "&limit=available";
1114 # group_OR_limits, prefixed by mc-
1115 # OR every member of the group
1116 elsif ( $this_limit =~ /mc/ ) {
1117 $group_OR_limits .= " or " if $group_OR_limits;
1118 $limit_desc .= " or " if $group_OR_limits;
1119 $group_OR_limits .= "$this_limit";
1120 $limit_cgi .= "&limit=$this_limit";
1121 $limit_desc .= " $this_limit";
1124 # Regular old limits
1126 $limit .= " and " if $limit || $query;
1127 $limit .= "$this_limit";
1128 $limit_cgi .= "&limit=$this_limit";
1129 if ($this_limit =~ /^branch:(.+)/) {
1130 my $branchcode = $1;
1131 my $branchname = GetBranchName($branchcode);
1132 if (defined $branchname) {
1133 $limit_desc .= " branch:$branchname";
1135 $limit_desc .= " $this_limit";
1138 $limit_desc .= " $this_limit";
1142 if ($group_OR_limits) {
1143 $limit .= " and " if ( $query || $limit );
1144 $limit .= "($group_OR_limits)";
1146 if ($availability_limit) {
1147 $limit .= " and " if ( $query || $limit );
1148 $limit .= "($availability_limit)";
1151 # Normalize the query and limit strings
1154 for ( $query, $query_desc, $limit, $limit_desc ) {
1155 $_ =~ s/ / /g; # remove extra spaces
1156 $_ =~ s/^ //g; # remove any beginning spaces
1157 $_ =~ s/ $//g; # remove any ending spaces
1158 $_ =~ s/==/=/g; # remove double == from query
1160 $query_cgi =~ s/^&//; # remove unnecessary & from beginning of the query cgi
1162 for ($query_cgi,$simple_query) {
1165 # append the limit to the query
1166 $query .= " " . $limit;
1170 warn "QUERY:" . $query;
1171 warn "QUERY CGI:" . $query_cgi;
1172 warn "QUERY DESC:" . $query_desc;
1173 warn "LIMIT:" . $limit;
1174 warn "LIMIT CGI:" . $limit_cgi;
1175 warn "LIMIT DESC:" . $limit_desc;
1176 warn "---------\nLeave buildQuery\n---------";
1179 undef, $query, $simple_query, $query_cgi,
1180 $query_desc, $limit, $limit_cgi, $limit_desc,
1181 $stopwords_removed, $query_type
1185 =head2 searchResults
1187 Format results in a form suitable for passing to the template
1191 # IMO this subroutine is pretty messy still -- it's responsible for
1192 # building the HTML output for the template
1194 my ( $searchdesc, $hits, $results_per_page, $offset, $scan, @marcresults ) = @_;
1195 my $dbh = C4::Context->dbh;
1199 # add search-term highlighting via <span>s on the search terms
1200 my $span_terms_hashref;
1201 for my $span_term ( split( / /, $searchdesc ) ) {
1202 $span_term =~ s/(.*=|\)|\(|\+|\.|\*)//g;
1203 $span_terms_hashref->{$span_term}++;
1206 #Build branchnames hash
1208 #get branch information.....
1211 $dbh->prepare("SELECT branchcode,branchname FROM branches")
1212 ; # FIXME : use C4::Koha::GetBranches
1214 while ( my $bdata = $bsth->fetchrow_hashref ) {
1215 $branches{ $bdata->{'branchcode'} } = $bdata->{'branchname'};
1217 # FIXME - We build an authorised values hash here, using the default framework
1218 # though it is possible to have different authvals for different fws.
1220 my $shelflocations =GetKohaAuthorisedValues('items.location','');
1222 # get notforloan authorised value list (see $shelflocations FIXME)
1223 my $notforloan_authorised_value = GetAuthValCode('items.notforloan','');
1225 #Build itemtype hash
1226 #find itemtype & itemtype image
1230 "SELECT itemtype,description,imageurl,summary,notforloan FROM itemtypes"
1233 while ( my $bdata = $bsth->fetchrow_hashref ) {
1234 foreach (qw(description imageurl summary notforloan)) {
1235 $itemtypes{ $bdata->{'itemtype'} }->{$_} = $bdata->{$_};
1239 #search item field code
1242 "SELECT tagfield FROM marc_subfield_structure WHERE kohafield LIKE 'items.itemnumber'"
1245 my ($itemtag) = $sth->fetchrow;
1247 ## find column names of items related to MARC
1248 my $sth2 = $dbh->prepare("SHOW COLUMNS FROM items");
1250 my %subfieldstosearch;
1251 while ( ( my $column ) = $sth2->fetchrow ) {
1252 my ( $tagfield, $tagsubfield ) =
1253 &GetMarcFromKohaField( "items." . $column, "" );
1254 $subfieldstosearch{$column} = $tagsubfield;
1257 # handle which records to actually retrieve
1259 if ( $hits && $offset + $results_per_page <= $hits ) {
1260 $times = $offset + $results_per_page;
1263 $times = $hits; # FIXME: if $hits is undefined, why do we want to equal it?
1266 my $marcflavour = C4::Context->preference("marcflavour");
1267 # loop through all of the records we've retrieved
1268 for ( my $i = $offset ; $i <= $times - 1 ; $i++ ) {
1269 my $marcrecord = MARC::File::USMARC::decode( $marcresults[$i] );
1270 my $oldbiblio = TransformMarcToKoha( $dbh, $marcrecord, '' );
1271 $oldbiblio->{subtitle} = C4::Biblio::get_koha_field_from_marc('bibliosubtitle', 'subtitle', $marcrecord, '');
1272 $oldbiblio->{result_number} = $i + 1;
1274 # add imageurl to itemtype if there is one
1275 $oldbiblio->{imageurl} = getitemtypeimagelocation( 'opac', $itemtypes{ $oldbiblio->{itemtype} }->{imageurl} );
1277 $oldbiblio->{'authorised_value_images'} = C4::Items::get_authorised_value_images( C4::Biblio::get_biblio_authorised_values( $oldbiblio->{'biblionumber'}, $marcrecord ) );
1278 $oldbiblio->{normalized_upc} = GetNormalizedUPC($marcrecord,$marcflavour);
1279 $oldbiblio->{normalized_ean} = GetNormalizedEAN($marcrecord,$marcflavour);
1280 $oldbiblio->{normalized_oclc} = GetNormalizedOCLCNumber($marcrecord,$marcflavour);
1281 $oldbiblio->{normalized_isbn} = GetNormalizedISBN(undef,$marcrecord,$marcflavour);
1282 $oldbiblio->{content_identifier_exists} = 1 if ($oldbiblio->{normalized_isbn} or $oldbiblio->{normalized_oclc} or $oldbiblio->{normalized_ean} or $oldbiblio->{normalized_upc});
1283 $oldbiblio->{description} = $itemtypes{ $oldbiblio->{itemtype} }->{description};
1284 # Build summary if there is one (the summary is defined in the itemtypes table)
1285 # FIXME: is this used anywhere, I think it can be commented out? -- JF
1286 if ( $itemtypes{ $oldbiblio->{itemtype} }->{summary} ) {
1287 my $summary = $itemtypes{ $oldbiblio->{itemtype} }->{summary};
1288 my @fields = $marcrecord->fields();
1289 foreach my $field (@fields) {
1290 my $tag = $field->tag();
1291 my $tagvalue = $field->as_string();
1293 s/\[(.?.?.?.?)$tag\*(.*?)]/$1$tagvalue$2\[$1$tag$2]/g;
1294 unless ( $tag < 10 ) {
1295 my @subf = $field->subfields;
1296 for my $i ( 0 .. $#subf ) {
1297 my $subfieldcode = $subf[$i][0];
1298 my $subfieldvalue = $subf[$i][1];
1299 my $tagsubf = $tag . $subfieldcode;
1301 s/\[(.?.?.?.?)$tagsubf(.*?)]/$1$subfieldvalue$2\[$1$tagsubf$2]/g;
1306 $summary =~ s/\[(.*?)]//g;
1307 $summary =~ s/\n/<br\/>/g;
1308 $oldbiblio->{summary} = $summary;
1311 # save an author with no <span> tag, for the <a href=search.pl?q=<!--tmpl_var name="author"-->> link
1312 $oldbiblio->{'author_nospan'} = $oldbiblio->{'author'};
1313 $oldbiblio->{'title_nospan'} = $oldbiblio->{'title'};
1314 $oldbiblio->{'subtitle_nospan'} = $oldbiblio->{'subtitle'};
1315 # Add search-term highlighting to the whole record where they match using <span>s
1316 if (C4::Context->preference("OpacHighlightedWords")){
1317 my $searchhighlightblob;
1318 for my $highlight_field ( $marcrecord->fields ) {
1320 # FIXME: need to skip title, subtitle, author, etc., as they are handled below
1321 next if $highlight_field->tag() =~ /(^00)/; # skip fixed fields
1322 for my $subfield ($highlight_field->subfields()) {
1324 next if $subfield->[0] eq '9';
1325 my $field = $subfield->[1];
1326 for my $term ( keys %$span_terms_hashref ) {
1327 if ( ( $field =~ /$term/i ) && (( length($term) > 3 ) || ($field =~ / $term /i)) ) {
1328 $field =~ s/$term/<span class=\"term\">$&<\/span>/gi;
1332 $searchhighlightblob .= $field . " ... " if $match;
1336 $searchhighlightblob = ' ... '.$searchhighlightblob if $searchhighlightblob;
1337 $oldbiblio->{'searchhighlightblob'} = $searchhighlightblob;
1340 # Add search-term highlighting to the title, subtitle, etc. fields
1341 for my $term ( keys %$span_terms_hashref ) {
1342 my $old_term = $term;
1343 if ( length($term) > 3 ) {
1344 $term =~ s/(.*=|\)|\(|\+|\.|\?|\[|\]|\\|\*)//g;
1345 foreach(qw(title subtitle author publishercode place pages notes size)) {
1346 $oldbiblio->{$_} =~ s/$term/<span class=\"term\">$&<\/span>/gi;
1351 ($i % 2) and $oldbiblio->{'toggle'} = 1;
1353 # Pull out the items fields
1354 my @fields = $marcrecord->field($itemtag);
1356 # Setting item statuses for display
1357 my @available_items_loop;
1358 my @onloan_items_loop;
1359 my @other_items_loop;
1361 my $available_items;
1365 my $ordered_count = 0;
1366 my $available_count = 0;
1367 my $onloan_count = 0;
1368 my $longoverdue_count = 0;
1369 my $other_count = 0;
1370 my $wthdrawn_count = 0;
1371 my $itemlost_count = 0;
1372 my $itembinding_count = 0;
1373 my $itemdamaged_count = 0;
1374 my $item_in_transit_count = 0;
1375 my $can_place_holds = 0;
1376 my $items_count = scalar(@fields);
1378 ( C4::Context->preference('maxItemsinSearchResults') )
1379 ? C4::Context->preference('maxItemsinSearchResults') - 1
1382 # loop through every item
1383 foreach my $field (@fields) {
1386 # populate the items hash
1387 foreach my $code ( keys %subfieldstosearch ) {
1388 $item->{$code} = $field->subfield( $subfieldstosearch{$code} );
1390 my $hbranch = C4::Context->preference('HomeOrHoldingBranch') eq 'homebranch' ? 'homebranch' : 'holdingbranch';
1391 my $otherbranch = C4::Context->preference('HomeOrHoldingBranch') eq 'homebranch' ? 'holdingbranch' : 'homebranch';
1392 # set item's branch name, use HomeOrHoldingBranch syspref first, fall back to the other one
1393 if ($item->{$hbranch}) {
1394 $item->{'branchname'} = $branches{$item->{$hbranch}};
1396 elsif ($item->{$otherbranch}) { # Last resort
1397 $item->{'branchname'} = $branches{$item->{$otherbranch}};
1400 my $prefix = $item->{$hbranch} . '--' . $item->{location} . $item->{itype} . $item->{itemcallnumber};
1401 # For each grouping of items (onloan, available, unavailable), we build a key to store relevant info about that item
1402 if ( $item->{onloan} ) {
1404 my $key = $prefix . $item->{due_date};
1405 $onloan_items->{$key}->{due_date} = format_date($item->{onloan});
1406 $onloan_items->{$key}->{count}++ if $item->{$hbranch};
1407 $onloan_items->{$key}->{branchname} = $item->{branchname};
1408 $onloan_items->{$key}->{location} = $shelflocations->{ $item->{location} };
1409 $onloan_items->{$key}->{itemcallnumber} = $item->{itemcallnumber};
1410 $onloan_items->{$key}->{imageurl} = getitemtypeimagelocation( 'opac', $itemtypes{ $item->{itype} }->{imageurl} );
1411 # if something's checked out and lost, mark it as 'long overdue'
1412 if ( $item->{itemlost} ) {
1413 $onloan_items->{$prefix}->{longoverdue}++;
1414 $longoverdue_count++;
1415 } else { # can place holds as long as item isn't lost
1416 $can_place_holds = 1;
1420 # items not on loan, but still unavailable ( lost, withdrawn, damaged )
1424 if ( $item->{notforloan} == -1 ) {
1428 # is item in transit?
1429 my $transfertwhen = '';
1430 my ($transfertfrom, $transfertto);
1432 unless ($item->{wthdrawn}
1433 || $item->{itemlost}
1435 || $item->{notforloan}
1436 || $items_count > 20) {
1438 # A couple heuristics to limit how many times
1439 # we query the database for item transfer information, sacrificing
1440 # accuracy in some cases for speed;
1442 # 1. don't query if item has one of the other statuses
1443 # 2. don't check transit status if the bib has
1444 # more than 20 items
1446 # FIXME: to avoid having the query the database like this, and to make
1447 # the in transit status count as unavailable for search limiting,
1448 # should map transit status to record indexed in Zebra.
1450 ($transfertwhen, $transfertfrom, $transfertto) = C4::Circulation::GetTransfers($item->{itemnumber});
1453 # item is withdrawn, lost or damaged
1454 if ( $item->{wthdrawn}
1455 || $item->{itemlost}
1457 || $item->{notforloan}
1458 || ($transfertwhen ne ''))
1460 $wthdrawn_count++ if $item->{wthdrawn};
1461 $itemlost_count++ if $item->{itemlost};
1462 $itemdamaged_count++ if $item->{damaged};
1463 $item_in_transit_count++ if $transfertwhen ne '';
1464 $item->{status} = $item->{wthdrawn} . "-" . $item->{itemlost} . "-" . $item->{damaged} . "-" . $item->{notforloan};
1467 my $key = $prefix . $item->{status};
1468 foreach (qw(wthdrawn itemlost damaged branchname itemcallnumber)) {
1469 $other_items->{$key}->{$_} = $item->{$_};
1471 $other_items->{$key}->{intransit} = ($transfertwhen ne '') ? 1 : 0;
1472 $other_items->{$key}->{notforloan} = GetAuthorisedValueDesc('','',$item->{notforloan},'','',$notforloan_authorised_value) if $notforloan_authorised_value;
1473 $other_items->{$key}->{count}++ if $item->{$hbranch};
1474 $other_items->{$key}->{location} = $shelflocations->{ $item->{location} };
1475 $other_items->{$key}->{imageurl} = getitemtypeimagelocation( 'opac', $itemtypes{ $item->{itype} }->{imageurl} );
1479 $can_place_holds = 1;
1481 $available_items->{$prefix}->{count}++ if $item->{$hbranch};
1482 foreach (qw(branchname itemcallnumber)) {
1483 $available_items->{$prefix}->{$_} = $item->{$_};
1485 $available_items->{$prefix}->{location} = $shelflocations->{ $item->{location} };
1486 $available_items->{$prefix}->{imageurl} = getitemtypeimagelocation( 'opac', $itemtypes{ $item->{itype} }->{imageurl} );
1489 } # notforloan, item level and biblioitem level
1490 my ( $availableitemscount, $onloanitemscount, $otheritemscount );
1492 ( C4::Context->preference('maxItemsinSearchResults') )
1493 ? C4::Context->preference('maxItemsinSearchResults') - 1
1495 for my $key ( sort keys %$onloan_items ) {
1496 (++$onloanitemscount > $maxitems) and last;
1497 push @onloan_items_loop, $onloan_items->{$key};
1499 for my $key ( sort keys %$other_items ) {
1500 (++$otheritemscount > $maxitems) and last;
1501 push @other_items_loop, $other_items->{$key};
1503 for my $key ( sort keys %$available_items ) {
1504 (++$availableitemscount > $maxitems) and last;
1505 push @available_items_loop, $available_items->{$key}
1508 # XSLT processing of some stuff
1509 if (C4::Context->preference("XSLTResultsDisplay") && !$scan) {
1510 my $newxmlrecord = XSLTParse4Display($oldbiblio->{biblionumber}, $marcrecord, C4::Context->config('opachtdocs')."/prog/en/xslt/MARC21slim2OPACResults.xsl");
1511 $oldbiblio->{XSLTResultsRecord} = $newxmlrecord;
1514 # last check for norequest : if itemtype is notforloan, it can't be reserved either, whatever the items
1515 $can_place_holds = 0
1516 if $itemtypes{ $oldbiblio->{itemtype} }->{notforloan};
1517 $oldbiblio->{norequests} = 1 unless $can_place_holds;
1518 $oldbiblio->{itemsplural} = 1 if $items_count > 1;
1519 $oldbiblio->{items_count} = $items_count;
1520 $oldbiblio->{available_items_loop} = \@available_items_loop;
1521 $oldbiblio->{onloan_items_loop} = \@onloan_items_loop;
1522 $oldbiblio->{other_items_loop} = \@other_items_loop;
1523 $oldbiblio->{availablecount} = $available_count;
1524 $oldbiblio->{availableplural} = 1 if $available_count > 1;
1525 $oldbiblio->{onloancount} = $onloan_count;
1526 $oldbiblio->{onloanplural} = 1 if $onloan_count > 1;
1527 $oldbiblio->{othercount} = $other_count;
1528 $oldbiblio->{otherplural} = 1 if $other_count > 1;
1529 $oldbiblio->{wthdrawncount} = $wthdrawn_count;
1530 $oldbiblio->{itemlostcount} = $itemlost_count;
1531 $oldbiblio->{damagedcount} = $itemdamaged_count;
1532 $oldbiblio->{intransitcount} = $item_in_transit_count;
1533 $oldbiblio->{orderedcount} = $ordered_count;
1534 push( @newresults, $oldbiblio );
1539 #----------------------------------------------------------------------
1541 # Non-Zebra GetRecords#
1542 #----------------------------------------------------------------------
1546 NZgetRecords has the same API as zera getRecords, even if some parameters are not managed
1552 $query, $simple_query, $sort_by_ref, $servers_ref,
1553 $results_per_page, $offset, $expanded_facet, $branches,
1556 warn "query =$query" if $DEBUG;
1557 my $result = NZanalyse($query);
1558 warn "results =$result" if $DEBUG;
1560 NZorder( $result, @$sort_by_ref[0], $results_per_page, $offset ),
1566 NZanalyse : get a CQL string as parameter, and returns a list of biblionumber;title,biblionumber;title,...
1567 the list is built from an inverted index in the nozebra SQL table
1568 note that title is here only for convenience : the sorting will be very fast when requested on title
1569 if the sorting is requested on something else, we will have to reread all results, and that may be longer.
1574 my ( $string, $server ) = @_;
1575 # warn "---------" if $DEBUG;
1576 warn " NZanalyse" if $DEBUG;
1577 # warn "---------" if $DEBUG;
1579 # $server contains biblioserver or authorities, depending on what we search on.
1580 #warn "querying : $string on $server";
1581 $server = 'biblioserver' unless $server;
1583 # if we have a ", replace the content to discard temporarily any and/or/not inside
1585 if ( $string =~ /"/ ) {
1586 $string =~ s/"(.*?)"/__X__/;
1588 warn "commacontent : $commacontent" if $DEBUG;
1591 # split the query string in 3 parts : X AND Y means : $left="X", $operand="AND" and $right="Y"
1592 # then, call again NZanalyse with $left and $right
1593 # (recursive until we find a leaf (=> something without and/or/not)
1594 # delete repeated operator... Would then go in infinite loop
1595 while ( $string =~ s/( and| or| not| AND| OR| NOT)\1/$1/g ) {
1598 #process parenthesis before.
1599 if ( $string =~ /^\s*\((.*)\)(( and | or | not | AND | OR | NOT )(.*))?/ ) {
1602 my $operator = lc($3); # FIXME: and/or/not are operators, not operands
1604 "dealing w/parenthesis before recursive sub call. left :$left operator:$operator right:$right"
1606 my $leftresult = NZanalyse( $left, $server );
1608 my $rightresult = NZanalyse( $right, $server );
1610 # OK, we have the results for right and left part of the query
1611 # depending of operand, intersect, union or exclude both lists
1612 # to get a result list
1613 if ( $operator eq ' and ' ) {
1614 return NZoperatorAND($leftresult,$rightresult);
1616 elsif ( $operator eq ' or ' ) {
1618 # just merge the 2 strings
1619 return $leftresult . $rightresult;
1621 elsif ( $operator eq ' not ' ) {
1622 return NZoperatorNOT($leftresult,$rightresult);
1626 # this error is impossible, because of the regexp that isolate the operand, but just in case...
1630 warn "string :" . $string if $DEBUG;
1634 if ($string =~ /(.*?)( and | or | not | AND | OR | NOT )(.*)/) {
1637 $operator = lc($2); # FIXME: and/or/not are operators, not operands
1639 warn "no parenthesis. left : $left operator: $operator right: $right"
1642 # it's not a leaf, we have a and/or/not
1645 # reintroduce comma content if needed
1646 $right =~ s/__X__/"$commacontent"/ if $commacontent;
1647 $left =~ s/__X__/"$commacontent"/ if $commacontent;
1648 warn "node : $left / $operator / $right\n" if $DEBUG;
1649 my $leftresult = NZanalyse( $left, $server );
1650 my $rightresult = NZanalyse( $right, $server );
1651 warn " leftresult : $leftresult" if $DEBUG;
1652 warn " rightresult : $rightresult" if $DEBUG;
1653 # OK, we have the results for right and left part of the query
1654 # depending of operand, intersect, union or exclude both lists
1655 # to get a result list
1656 if ( $operator eq ' and ' ) {
1658 return NZoperatorAND($leftresult,$rightresult);
1660 elsif ( $operator eq ' or ' ) {
1662 # just merge the 2 strings
1663 return $leftresult . $rightresult;
1665 elsif ( $operator eq ' not ' ) {
1666 return NZoperatorNOT($leftresult,$rightresult);
1670 # this error is impossible, because of the regexp that isolate the operand, but just in case...
1671 die "error : operand unknown : $operator for $string";
1674 # it's a leaf, do the real SQL query and return the result
1677 $string =~ s/__X__/"$commacontent"/ if $commacontent;
1678 $string =~ s/-|\.|\?|,|;|!|'|\(|\)|\[|\]|{|}|"|&|\+|\*|\// /g;
1679 #remove trailing blank at the beginning
1681 warn "leaf:$string" if $DEBUG;
1683 # parse the string in in operator/operand/value again
1687 if ($string =~ /(.*)(>=|<=)(.*)/) {
1694 # warn "handling leaf... left:$left operator:$operator right:$right"
1696 unless ($operator) {
1697 if ($string =~ /(.*)(>|<|=)(.*)/) {
1702 "handling unless (operator)... left:$left operator:$operator right:$right"
1710 # strip adv, zebra keywords, currently not handled in nozebra: wrdl, ext, phr...
1713 # automatic replace for short operators
1714 $left = 'title' if $left =~ '^ti$';
1715 $left = 'author' if $left =~ '^au$';
1716 $left = 'publisher' if $left =~ '^pb$';
1717 $left = 'subject' if $left =~ '^su$';
1718 $left = 'koha-Auth-Number' if $left =~ '^an$';
1719 $left = 'keyword' if $left =~ '^kw$';
1720 warn "handling leaf... left:$left operator:$operator right:$right" if $DEBUG;
1721 if ( $operator && $left ne 'keyword' ) {
1723 #do a specific search
1724 my $dbh = C4::Context->dbh;
1725 $operator = 'LIKE' if $operator eq '=' and $right =~ /%/;
1728 "SELECT biblionumbers,value FROM nozebra WHERE server=? AND indexname=? AND value $operator ?"
1730 warn "$left / $operator / $right\n" if $DEBUG;
1732 # split each word, query the DB and build the biblionumbers result
1733 #sanitizing leftpart
1734 $left =~ s/^\s+|\s+$//;
1735 foreach ( split / /, $right ) {
1737 $_ =~ s/^\s+|\s+$//;
1739 warn "EXECUTE : $server, $left, $_" if $DEBUG;
1740 $sth->execute( $server, $left, $_ )
1741 or warn "execute failed: $!";
1742 while ( my ( $line, $value ) = $sth->fetchrow ) {
1744 # if we are dealing with a numeric value, use only numeric results (in case of >=, <=, > or <)
1745 # otherwise, fill the result
1746 $biblionumbers .= $line
1747 unless ( $right =~ /^\d+$/ && $value =~ /\D/ );
1748 warn "result : $value "
1749 . ( $right =~ /\d/ ) . "=="
1750 . ( $value =~ /\D/?$line:"" ) if $DEBUG; #= $line";
1753 # do a AND with existing list if there is one, otherwise, use the biblionumbers list as 1st result list
1755 warn "NZAND" if $DEBUG;
1756 $results = NZoperatorAND($biblionumbers,$results);
1759 $results = $biblionumbers;
1765 #do a complete search (all indexes), if index='kw' do complete search too.
1766 my $dbh = C4::Context->dbh;
1769 "SELECT biblionumbers FROM nozebra WHERE server=? AND value LIKE ?"
1772 # split each word, query the DB and build the biblionumbers result
1773 foreach ( split / /, $string ) {
1774 next if C4::Context->stopwords->{ uc($_) }; # skip if stopword
1775 warn "search on all indexes on $_" if $DEBUG;
1778 $sth->execute( $server, $_ );
1779 while ( my $line = $sth->fetchrow ) {
1780 $biblionumbers .= $line;
1783 # do a AND with existing list if there is one, otherwise, use the biblionumbers list as 1st result list
1785 $results = NZoperatorAND($biblionumbers,$results);
1788 warn "NEW RES for $_ = $biblionumbers" if $DEBUG;
1789 $results = $biblionumbers;
1793 warn "return : $results for LEAF : $string" if $DEBUG;
1796 warn "---------\nLeave NZanalyse\n---------" if $DEBUG;
1800 my ($rightresult, $leftresult)=@_;
1802 my @leftresult = split /;/, $leftresult;
1803 warn " @leftresult / $rightresult \n" if $DEBUG;
1805 # my @rightresult = split /;/,$leftresult;
1808 # parse the left results, and if the biblionumber exist in the right result, save it in finalresult
1809 # the result is stored twice, to have the same weight for AND than OR.
1810 # example : TWO : 61,61,64,121 (two is twice in the biblio #61) / TOWER : 61,64,130
1811 # result : 61,61,61,61,64,64 for two AND tower : 61 has more weight than 64
1812 foreach (@leftresult) {
1815 ( $value, $countvalue ) = ( $1, $2 ) if ($value=~/(.*)-(\d+)$/);
1816 if ( $rightresult =~ /\Q$value\E-(\d+);/ ) {
1817 $countvalue = ( $1 > $countvalue ? $countvalue : $1 );
1819 "$value-$countvalue;$value-$countvalue;";
1822 warn "NZAND DONE : $finalresult \n" if $DEBUG;
1823 return $finalresult;
1827 my ($rightresult, $leftresult)=@_;
1828 return $rightresult.$leftresult;
1832 my ($leftresult, $rightresult)=@_;
1834 my @leftresult = split /;/, $leftresult;
1836 # my @rightresult = split /;/,$leftresult;
1838 foreach (@leftresult) {
1840 $value=$1 if $value=~m/(.*)-\d+$/;
1841 unless ($rightresult =~ "$value-") {
1842 $finalresult .= "$_;";
1845 return $finalresult;
1850 $finalresult = NZorder($biblionumbers, $ordering,$results_per_page,$offset);
1857 my ( $biblionumbers, $ordering, $results_per_page, $offset ) = @_;
1858 warn "biblionumbers = $biblionumbers and ordering = $ordering\n" if $DEBUG;
1860 # order title asc by default
1861 # $ordering = '1=36 <i' unless $ordering;
1862 $results_per_page = 20 unless $results_per_page;
1863 $offset = 0 unless $offset;
1864 my $dbh = C4::Context->dbh;
1867 # order by POPULARITY
1869 if ( $ordering =~ /popularity/ ) {
1873 # popularity is not in MARC record, it's builded from a specific query
1875 $dbh->prepare("select sum(issues) from items where biblionumber=?");
1876 foreach ( split /;/, $biblionumbers ) {
1877 my ( $biblionumber, $title ) = split /,/, $_;
1878 $result{$biblionumber} = GetMarcBiblio($biblionumber);
1879 $sth->execute($biblionumber);
1880 my $popularity = $sth->fetchrow || 0;
1882 # hint : the key is popularity.title because we can have
1883 # many results with the same popularity. In this cas, sub-ordering is done by title
1884 # we also have biblionumber to avoid bug for 2 biblios with the same title & popularity
1885 # (un-frequent, I agree, but we won't forget anything that way ;-)
1886 $popularity{ sprintf( "%10d", $popularity ) . $title
1887 . $biblionumber } = $biblionumber;
1890 # sort the hash and return the same structure as GetRecords (Zebra querying)
1893 if ( $ordering eq 'popularity_dsc' ) { # sort popularity DESC
1894 foreach my $key ( sort { $b cmp $a } ( keys %popularity ) ) {
1895 $result_hash->{'RECORDS'}[ $numbers++ ] =
1896 $result{ $popularity{$key} }->as_usmarc();
1899 else { # sort popularity ASC
1900 foreach my $key ( sort ( keys %popularity ) ) {
1901 $result_hash->{'RECORDS'}[ $numbers++ ] =
1902 $result{ $popularity{$key} }->as_usmarc();
1905 my $finalresult = ();
1906 $result_hash->{'hits'} = $numbers;
1907 $finalresult->{'biblioserver'} = $result_hash;
1908 return $finalresult;
1914 elsif ( $ordering =~ /author/ ) {
1916 foreach ( split /;/, $biblionumbers ) {
1917 my ( $biblionumber, $title ) = split /,/, $_;
1918 my $record = GetMarcBiblio($biblionumber);
1920 if ( C4::Context->preference('marcflavour') eq 'UNIMARC' ) {
1921 $author = $record->subfield( '200', 'f' );
1922 $author = $record->subfield( '700', 'a' ) unless $author;
1925 $author = $record->subfield( '100', 'a' );
1928 # hint : the result is sorted by title.biblionumber because we can have X biblios with the same title
1929 # and we don't want to get only 1 result for each of them !!!
1930 $result{ $author . $biblionumber } = $record;
1933 # sort the hash and return the same structure as GetRecords (Zebra querying)
1936 if ( $ordering eq 'author_za' ) { # sort by author desc
1937 foreach my $key ( sort { $b cmp $a } ( keys %result ) ) {
1938 $result_hash->{'RECORDS'}[ $numbers++ ] =
1939 $result{$key}->as_usmarc();
1942 else { # sort by author ASC
1943 foreach my $key ( sort ( keys %result ) ) {
1944 $result_hash->{'RECORDS'}[ $numbers++ ] =
1945 $result{$key}->as_usmarc();
1948 my $finalresult = ();
1949 $result_hash->{'hits'} = $numbers;
1950 $finalresult->{'biblioserver'} = $result_hash;
1951 return $finalresult;
1954 # ORDER BY callnumber
1957 elsif ( $ordering =~ /callnumber/ ) {
1959 foreach ( split /;/, $biblionumbers ) {
1960 my ( $biblionumber, $title ) = split /,/, $_;
1961 my $record = GetMarcBiblio($biblionumber);
1963 my $frameworkcode = GetFrameworkCode($biblionumber);
1964 my ( $callnumber_tag, $callnumber_subfield ) = GetMarcFromKohaField( 'items.itemcallnumber', $frameworkcode);
1965 ( $callnumber_tag, $callnumber_subfield ) = GetMarcFromKohaField('biblioitems.callnumber', $frameworkcode)
1966 unless $callnumber_tag;
1967 if ( C4::Context->preference('marcflavour') eq 'UNIMARC' ) {
1968 $callnumber = $record->subfield( '200', 'f' );
1970 $callnumber = $record->subfield( '100', 'a' );
1973 # hint : the result is sorted by title.biblionumber because we can have X biblios with the same title
1974 # and we don't want to get only 1 result for each of them !!!
1975 $result{ $callnumber . $biblionumber } = $record;
1978 # sort the hash and return the same structure as GetRecords (Zebra querying)
1981 if ( $ordering eq 'call_number_dsc' ) { # sort by title desc
1982 foreach my $key ( sort { $b cmp $a } ( keys %result ) ) {
1983 $result_hash->{'RECORDS'}[ $numbers++ ] =
1984 $result{$key}->as_usmarc();
1987 else { # sort by title ASC
1988 foreach my $key ( sort { $a cmp $b } ( keys %result ) ) {
1989 $result_hash->{'RECORDS'}[ $numbers++ ] =
1990 $result{$key}->as_usmarc();
1993 my $finalresult = ();
1994 $result_hash->{'hits'} = $numbers;
1995 $finalresult->{'biblioserver'} = $result_hash;
1996 return $finalresult;
1998 elsif ( $ordering =~ /pubdate/ ) { #pub year
2000 foreach ( split /;/, $biblionumbers ) {
2001 my ( $biblionumber, $title ) = split /,/, $_;
2002 my $record = GetMarcBiblio($biblionumber);
2003 my ( $publicationyear_tag, $publicationyear_subfield ) =
2004 GetMarcFromKohaField( 'biblioitems.publicationyear', '' );
2005 my $publicationyear =
2006 $record->subfield( $publicationyear_tag,
2007 $publicationyear_subfield );
2009 # hint : the result is sorted by title.biblionumber because we can have X biblios with the same title
2010 # and we don't want to get only 1 result for each of them !!!
2011 $result{ $publicationyear . $biblionumber } = $record;
2014 # sort the hash and return the same structure as GetRecords (Zebra querying)
2017 if ( $ordering eq 'pubdate_dsc' ) { # sort by pubyear desc
2018 foreach my $key ( sort { $b cmp $a } ( keys %result ) ) {
2019 $result_hash->{'RECORDS'}[ $numbers++ ] =
2020 $result{$key}->as_usmarc();
2023 else { # sort by pub year ASC
2024 foreach my $key ( sort ( keys %result ) ) {
2025 $result_hash->{'RECORDS'}[ $numbers++ ] =
2026 $result{$key}->as_usmarc();
2029 my $finalresult = ();
2030 $result_hash->{'hits'} = $numbers;
2031 $finalresult->{'biblioserver'} = $result_hash;
2032 return $finalresult;
2038 elsif ( $ordering =~ /title/ ) {
2040 # the title is in the biblionumbers string, so we just need to build a hash, sort it and return
2042 foreach ( split /;/, $biblionumbers ) {
2043 my ( $biblionumber, $title ) = split /,/, $_;
2045 # hint : the result is sorted by title.biblionumber because we can have X biblios with the same title
2046 # and we don't want to get only 1 result for each of them !!!
2047 # hint & speed improvement : we can order without reading the record
2048 # so order, and read records only for the requested page !
2049 $result{ $title . $biblionumber } = $biblionumber;
2052 # sort the hash and return the same structure as GetRecords (Zebra querying)
2055 if ( $ordering eq 'title_az' ) { # sort by title desc
2056 foreach my $key ( sort ( keys %result ) ) {
2057 $result_hash->{'RECORDS'}[ $numbers++ ] = $result{$key};
2060 else { # sort by title ASC
2061 foreach my $key ( sort { $b cmp $a } ( keys %result ) ) {
2062 $result_hash->{'RECORDS'}[ $numbers++ ] = $result{$key};
2066 # limit the $results_per_page to result size if it's more
2067 $results_per_page = $numbers - 1 if $numbers < $results_per_page;
2069 # for the requested page, replace biblionumber by the complete record
2070 # speed improvement : avoid reading too much things
2072 my $counter = $offset ;
2073 $counter <= $offset + $results_per_page ;
2077 $result_hash->{'RECORDS'}[$counter] =
2078 GetMarcBiblio( $result_hash->{'RECORDS'}[$counter] )->as_usmarc;
2080 my $finalresult = ();
2081 $result_hash->{'hits'} = $numbers;
2082 $finalresult->{'biblioserver'} = $result_hash;
2083 return $finalresult;
2090 # we need 2 hashes to order by ranking : the 1st one to count the ranking, the 2nd to order by ranking
2093 foreach ( split /;/, $biblionumbers ) {
2094 my ( $biblionumber, $title ) = split /,/, $_;
2095 $title =~ /(.*)-(\d)/;
2100 # note that we + the ranking because ranking is calculated on weight of EACH term requested.
2101 # if we ask for "two towers", and "two" has weight 2 in biblio N, and "towers" has weight 4 in biblio N
2102 # biblio N has ranking = 6
2103 $count_ranking{$biblionumber} += $ranking;
2106 # build the result by "inverting" the count_ranking hash
2107 # hing : as usual, we don't order by ranking only, to avoid having only 1 result for each rank. We build an hash on concat(ranking,biblionumber) instead
2109 foreach ( keys %count_ranking ) {
2110 $result{ sprintf( "%10d", $count_ranking{$_} ) . '-' . $_ } = $_;
2113 # sort the hash and return the same structure as GetRecords (Zebra querying)
2116 foreach my $key ( sort { $b cmp $a } ( keys %result ) ) {
2117 $result_hash->{'RECORDS'}[ $numbers++ ] = $result{$key};
2120 # limit the $results_per_page to result size if it's more
2121 $results_per_page = $numbers - 1 if $numbers < $results_per_page;
2123 # for the requested page, replace biblionumber by the complete record
2124 # speed improvement : avoid reading too much things
2126 my $counter = $offset ;
2127 $counter <= $offset + $results_per_page ;
2131 $result_hash->{'RECORDS'}[$counter] =
2132 GetMarcBiblio( $result_hash->{'RECORDS'}[$counter] )->as_usmarc
2133 if $result_hash->{'RECORDS'}[$counter];
2135 my $finalresult = ();
2136 $result_hash->{'hits'} = $numbers;
2137 $finalresult->{'biblioserver'} = $result_hash;
2138 return $finalresult;
2144 ($countchanged,$listunchanged) = ModBiblios($listbiblios, $tagsubfield,$initvalue,$targetvalue,$test);
2146 this function changes all the values $initvalue in subfield $tag$subfield in any record in $listbiblios
2147 test parameter if set donot perform change to records in database.
2153 * $listbiblios is an array ref to marcrecords to be changed
2154 * $tagsubfield is the reference of the subfield to change.
2155 * $initvalue is the value to search the record for
2156 * $targetvalue is the value to set the subfield to
2157 * $test is to be set only not to perform changes in database.
2159 =item C<Output arg:>
2160 * $countchanged counts all the changes performed.
2161 * $listunchanged contains the list of all the biblionumbers of records unchanged.
2163 =item C<usage in the script:>
2167 my ($countchanged, $listunchanged) = EditBiblios($results->{RECORD}, $tagsubfield,$initvalue,$targetvalue);;
2168 #If one wants to display unchanged records, you should get biblios foreach @$listunchanged
2169 $template->param(countchanged => $countchanged, loopunchanged=>$listunchanged);
2174 my ( $listbiblios, $tagsubfield, $initvalue, $targetvalue, $test ) = @_;
2177 my ( $tag, $subfield ) = ( $1, $2 )
2178 if ( $tagsubfield =~ /^(\d{1,3})([a-z0-9A-Z@])?$/ );
2179 if ( ( length($tag) < 3 ) && $subfield =~ /0-9/ ) {
2180 $tag = $tag . $subfield;
2183 my ( $bntag, $bnsubf ) = GetMarcFromKohaField('biblio.biblionumber', '');
2184 my ( $itemtag, $itemsubf ) = GetMarcFromKohaField('items.itemnumber', '');
2185 if ($tag eq $itemtag) {
2186 # do not allow the embedded item tag to be
2188 warn "Attempting to edit item tag via C4::Search::ModBiblios -- not allowed";
2191 foreach my $usmarc (@$listbiblios) {
2193 $record = eval { MARC::Record->new_from_usmarc($usmarc) };
2197 # usmarc is not a valid usmarc May be a biblionumber
2198 # FIXME - sorry, please let's figure out whether
2199 # this function is to be passed a list of
2200 # record numbers or a list of MARC::Record
2201 # objects. The former is probably better
2202 # because the MARC records supplied by Zebra
2203 # may be not current.
2204 $record = GetMarcBiblio($usmarc);
2205 $biblionumber = $usmarc;
2208 if ( $bntag >= 010 ) {
2209 $biblionumber = $record->subfield( $bntag, $bnsubf );
2212 $biblionumber = $record->field($bntag)->data;
2216 #GetBiblionumber is to be written.
2217 #Could be replaced by TransformMarcToKoha (But Would be longer)
2218 if ( $record->field($tag) ) {
2220 foreach my $field ( $record->field($tag) ) {
2223 $field->delete_subfield(
2224 'code' => $subfield,
2225 'match' => qr($initvalue)
2231 $field->update( $subfield, $targetvalue )
2236 if ( $tag >= 010 ) {
2237 if ( $field->delete_field($field) ) {
2243 $field->data = $targetvalue
2244 if ( $field->data =~ qr($initvalue) );
2249 # warn $record->as_formatted;
2251 ModBiblio( $record, $biblionumber,
2252 GetFrameworkCode($biblionumber) )
2256 push @unmatched, $biblionumber;
2260 push @unmatched, $biblionumber;
2263 return ( $countmatched, \@unmatched );
2266 END { } # module clean-up code here (global destructor)
2273 Koha Developement team <info@koha.org>