Field weighting applied to ranked searches. A new facets table in mysql db
[koha.git] / C4 / AuthoritiesMarc.pm
1 package C4::AuthoritiesMarc;
2 # Copyright 2000-2002 Katipo Communications
3 #
4 # This file is part of Koha.
5 #
6 # Koha is free software; you can redistribute it and/or modify it under the
7 # terms of the GNU General Public License as published by the Free Software
8 # Foundation; either version 2 of the License, or (at your option) any later
9 # version.
10 #
11 # Koha is distributed in the hope that it will be useful, but WITHOUT ANY
12 # WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR
13 # A PARTICULAR PURPOSE.  See the GNU General Public License for more details.
14 #
15 # You should have received a copy of the GNU General Public License along with
16 # Koha; if not, write to the Free Software Foundation, Inc., 59 Temple Place,
17 # Suite 330, Boston, MA  02111-1307 USA
18
19 use strict;
20 require Exporter;
21 use C4::Context;
22 use C4::Koha;
23 use Encode;
24 use C4::Biblio;
25
26 use vars qw($VERSION @ISA @EXPORT);
27
28 # set the version for version checking
29 $VERSION = 0.01;
30
31 @ISA = qw(Exporter);
32 @EXPORT = qw(
33         &AUTHgettagslib
34         &AUTHfindsubfield
35         &AUTHfind_authtypecode
36         &AUTHaddauthority
37         &AUTHmodauthority
38         &AUTHdelauthority
39         &AUTHaddsubfield
40
41         &AUTHfind_marc_from_kohafield
42         &AUTHgetauth_type
43         &AUTHcount_usage
44         &getsummary
45         &authoritysearch
46         &XMLgetauthority
47         &XMLgetauthorityhash
48         &XML_readline_withtags
49         &merge
50         &FindDuplicateauth
51         &ZEBRAdelauthority
52  );
53
54 sub AUTHfind_marc_from_kohafield {
55     my ( $dbh, $kohafield,$authtypecode ) = @_;
56     return 0, 0 unless $kohafield;
57 $authtypecode="" unless $authtypecode;
58 my $marcfromkohafield;
59         my $sth = $dbh->prepare("select tagfield,tagsubfield from auth_subfield_structure where kohafield= ? and authtypecode=? ");
60         $sth->execute($kohafield,$authtypecode);
61         my ($tagfield,$tagsubfield) = $sth->fetchrow;   
62         return  ($tagfield,$tagsubfield);
63 }
64 sub authoritysearch {
65 ## This routine requires rewrite--TG
66         my ($dbh, $tags, $operator, $value, $offset,$length,$authtypecode,$dictionary) = @_;
67 ###Dictionary flag used to set what to show in summary;
68         my $query;
69         my $attr;
70         my $server;
71         my $mainentrytag;
72         ##first set the authtype search and may be multiple authorities( linked authorities)
73         my $n=0;
74         my @authtypecode;
75                                 my @auths=split / /,$authtypecode ;
76                                 my ($attrfield)=MARCfind_attr_from_kohafield("authtypecode");
77                                 foreach my  $auth (@auths){
78                                 $query .=$attrfield." ".$auth." "; ##No truncation on authtype
79                                 push @authtypecode ,$auth;
80                                 $n++;
81                                 }
82                         if ($n>1){
83                          $query= "\@or ".$query;
84                         }
85         
86         my $dosearch;
87         my $and;
88         my $q2;
89         for(my $i = 0 ; $i <= $#{$value} ; $i++)
90         {
91
92         if (@$value[$i]){
93         ##If mainentry search $a tag
94                 if (@$tags[$i] eq "mainentry") {
95                  ($attr)=MARCfind_attr_from_kohafield("mainentry")." ";         
96                 }else{
97                 ($attr) =MARCfind_attr_from_kohafield("allentry")." ";
98                 }
99                 if (@$operator[$i] eq 'phrase') {
100                          $attr.="  \@attr 4=1  \@attr 5=100  \@attr 6=3 ";##Phrase, No truncation,all of subfield field must match
101                 
102                 } else {
103                 
104                          $attr .=" \@attr 4=6  \@attr 5=1  ";## Word list, right truncated, anywhere
105                 }                
106         
107                 
108                 $and .=" \@and " ;
109                 $attr =$attr."\"".@$value[$i]."\"";
110                 $q2 .=$attr;
111         $dosearch=1;            
112         }#if value              
113                 
114         }## value loop
115 ##Add how many queries generated
116 $query= $and.$query.$q2;
117 #warn $query;
118
119 $offset=0 unless $offset;
120 my $counter = $offset;
121 $length=10 unless $length;
122 my @oAuth;
123 my $i;
124  $oAuth[0]=C4::Context->Zconnauth("authorityserver");
125 my ($mainentry)=MARCfind_attr_from_kohafield("mainentry");
126 my ($allentry)=MARCfind_attr_from_kohafield("allentry");
127
128 $query="\@attr 2=102 \@or \@or ".$query." \@attr 7=1 ".$mainentry." 0 \@attr 7=1 ".$allentry." 1"; ## sort on mainfield and subfields
129
130
131 my $oAResult;
132  $oAResult= $oAuth[0]->search_pqf($query) ; 
133 while (($i = ZOOM::event(\@oAuth)) != 0) {
134     my $ev = $oAuth[$i-1]->last_event();
135 #   warn("Authority ", $i-1, ": event $ev (", ZOOM::event_str($ev), ")\n");
136     last if $ev == ZOOM::Event::ZEND;
137 }
138  my($error, $errmsg, $addinfo, $diagset) = $oAuth[0]->error_x();
139     if ($error) {
140         warn  "oAuth error: $errmsg ($error) $addinfo $diagset\n";
141         goto NOLUCK;
142     }
143
144
145 my $nbresults;
146  $nbresults=$oAResult->size();
147 my $nremains=$nbresults;        
148         my @result = ();
149         my @finalresult = ();
150
151 if ($nbresults>0){
152
153 ##Find authid and linkid fields
154
155
156 while (($counter < $nbresults) && ($counter < ($offset + $length))) {
157 ##Here we have to extract MARC record and $authid from ZEBRA AUTHORITIES
158 my $rec=$oAResult->record($counter);
159 my $marcdata=$rec->raw();
160 my $authrecord=Encode::decode("utf8",$marcdata);
161 $authrecord=XML_xml2hash_onerecord($authrecord);                
162 my @linkids;    
163 my $separator=C4::Context->preference('authoritysep');
164 my $linksummary=" ".$separator; 
165 my $authid=XML_readline_onerecord($authrecord,"authid","authorities");  
166 my @linkid=XML_readline_asarray($authrecord,"linkid","authorities");##May have many linked records      
167         
168         foreach my $linkid (@linkid){
169                 my $linktype=AUTHfind_authtypecode($dbh,$linkid);
170                 my $linkrecord=XMLgetauthorityhash($dbh,$linkid);
171                 $linksummary.="<br>&nbsp;&nbsp;&nbsp;&nbsp;<a href='detail.pl?authid=$linkid'>".getsummary($dbh,$linkrecord,$linkid,$linktype).".</a>".$separator;
172                 
173         }
174 my  $summary;
175 unless ($dictionary){
176  $summary=getsummary($dbh,$authrecord,$authid,$authtypecode);
177 $summary="<a href='detail.pl?authid=$authid'>".$summary.".</a>";
178         if ( $linksummary ne " ".$separator){
179         $summary="<b>".$summary."</b>".$linksummary;
180         }
181 }else{
182  $summary=getdictsummary($dbh,$authrecord,$authid,$authtypecode);
183 }
184 my $toggle;
185         if ($counter % 2) {
186                 $toggle="#ffffcc";
187         } else {
188                 $toggle="white";
189         }
190 my %newline;
191         $newline{'toggle'}=$toggle;     
192         $newline{summary} = $summary;
193         $newline{authid} = $authid;
194         $newline{linkid} = $linkid[0];
195         $newline{even} = $counter % 2;
196         $counter++;
197         push @finalresult, \%newline;
198         }## while counter
199
200
201 for (my $z=0; $z<$length; $z++){
202                 $finalresult[$z]{used}=AUTHcount_usage($finalresult[$z]{authid});
203         
204  }# all $z's
205
206
207 }## if nbresult
208 NOLUCK:
209 $oAResult->destroy();
210 $oAuth[0]->destroy();
211
212         return (\@finalresult, $nbresults);
213 }
214
215
216
217 sub AUTHcount_usage {
218         my ($authid) = @_;
219 ### try ZOOM search here
220 my @oConnection;
221 $oConnection[0]=C4::Context->Zconn("biblioserver");
222 my $query;
223 my ($attrfield)=MARCfind_attr_from_kohafield("authid");
224 $query= $attrfield." ".$authid;
225
226 my $oResult = $oConnection[0]->search_pqf($query);
227 my $event;
228 my $i;
229    while (($i = ZOOM::event(\@oConnection)) != 0) {
230         $event = $oConnection[$i-1]->last_event();
231         last if $event == ZOOM::Event::ZEND;
232    }# while
233 my $result=$oResult->size() ;
234         return ($result);
235 }
236
237
238
239 sub AUTHfind_authtypecode {
240         my ($dbh,$authid) = @_;
241         my $sth = $dbh->prepare("select authtypecode from auth_header where authid=?");
242         $sth->execute($authid);
243         my ($authtypecode) = $sth->fetchrow;
244         return $authtypecode;
245 }
246  
247
248 sub AUTHgettagslib {
249         my ($dbh,$forlibrarian,$authtypecode)= @_;
250         $authtypecode="" unless $authtypecode;
251         my $sth;
252         my $libfield = ($forlibrarian eq 1)? 'liblibrarian' : 'libopac';
253
254
255         # check that authority exists
256         $sth=$dbh->prepare("select count(*) from auth_tag_structure where authtypecode=?");
257         $sth->execute($authtypecode);
258         my ($total) = $sth->fetchrow;
259         $authtypecode="" unless ($total >0);
260         $sth= $dbh->prepare(
261 "select tagfield,liblibrarian,libopac,mandatory,repeatable from auth_tag_structure where authtypecode=? order by tagfield"
262     );
263
264 $sth->execute($authtypecode);
265          my ( $liblibrarian, $libopac, $tag, $res, $tab, $mandatory, $repeatable );
266
267     while ( ( $tag, $liblibrarian, $libopac, $mandatory, $repeatable ) = $sth->fetchrow ) {
268         $res->{$tag}->{lib}        = ($forlibrarian or !$libopac)?$liblibrarian:$libopac;
269         $res->{$tab}->{tab}        = "";            # XXX
270         $res->{$tag}->{mandatory}  = $mandatory;
271         $res->{$tag}->{repeatable} = $repeatable;
272     }
273         $sth=      $dbh->prepare("select tagfield,tagsubfield,liblibrarian,libopac,tab, mandatory, repeatable,authorised_value,authtypecode,value_builder,seealso,hidden,isurl,link from auth_subfield_structure where authtypecode=? order by tagfield,tagsubfield"
274     );
275         $sth->execute($authtypecode);
276
277          my $subfield;
278     my $authorised_value;
279     my $authtypecode;
280     my $value_builder;
281     my $kohafield;
282     my $seealso;
283     my $hidden;
284     my $isurl;
285         my $link;
286
287     while (
288         ( $tag,         $subfield,   $liblibrarian,   , $libopac,      $tab,
289         $mandatory,     $repeatable, $authorised_value, $authtypecode,
290         $value_builder,   $seealso,          $hidden,
291         $isurl,                 $link )
292         = $sth->fetchrow
293       )
294     {
295         $res->{$tag}->{$subfield}->{lib}              = ($forlibrarian or !$libopac)?$liblibrarian:$libopac;
296         $res->{$tag}->{$subfield}->{tab}              = $tab;
297         $res->{$tag}->{$subfield}->{mandatory}        = $mandatory;
298         $res->{$tag}->{$subfield}->{repeatable}       = $repeatable;
299         $res->{$tag}->{$subfield}->{authorised_value} = $authorised_value;
300         $res->{$tag}->{$subfield}->{authtypecode}     = $authtypecode;
301         $res->{$tag}->{$subfield}->{value_builder}    = $value_builder;
302         $res->{$tag}->{$subfield}->{seealso}          = $seealso;
303         $res->{$tag}->{$subfield}->{hidden}           = $hidden;
304         $res->{$tag}->{$subfield}->{isurl}            = $isurl;
305         $res->{$tag}->{$subfield}->{link}            = $link;
306     }
307     return $res;
308 }
309
310 sub AUTHaddauthority {
311 # pass the XML hash to this function, and it will create the records in the authority table
312         my ($dbh,$record,$authid,$authtypecode) = @_;
313 # if authid empty => true add, find a new authid number
314         if (!$authid) {
315         my      $sth=$dbh->prepare("select max(authid) from auth_header");
316                 $sth->execute;
317                 ($authid)=$sth->fetchrow;
318                 $authid=$authid+1;
319         }       
320
321 ##Modified record may also come here use REPLACE -- bulk import comes here
322 XML_writeline($record,"authid",$authid,"authorities");
323 XML_writeline($record,"authtypecode",$authtypecode,"authorities");
324 my $xml=XML_hash2xml($record);
325         my $sth=$dbh->prepare("REPLACE auth_header set marcxml=?,  authid=?,authtypecode=?,datecreated=now()");
326         $sth->execute($xml,$authid,$authtypecode);
327         $sth->finish;   
328         ZEBRAop($dbh,$authid,'specialUpdate',"authorityserver");
329 ## If the record is linked to another update the linked authorities with new authid
330 my @linkids=XML_readline_asarray($record,"linkid","authorities");
331         foreach my $linkid (@linkids){
332         ##Modify the record of linked 
333         AUTHaddlink($dbh,$linkid,$authid);
334         }
335 return ($authid);
336 }
337
338 sub AUTHaddlink{
339 my ($dbh,$linkid,$authid)=@_;
340 my $record=XMLgetauthorityhash($dbh,$linkid);
341 my $authtypecode=AUTHfind_authtypecode($dbh,$linkid);
342 #warn "adding l:$linkid,a:$authid,auth:$authtypecode";
343 XML_writeline($record,"linkid",$authid,"authorities");
344 my $xml=XML_hash2xml($record);
345 $dbh->do("lock tables header WRITE");
346         my $sth=$dbh->prepare("update auth_header set marcxml=? where authid=?");
347         $sth->execute($xml,$linkid);
348         $sth->finish;   
349         $dbh->do("unlock tables");
350         ZEBRAop($dbh,$linkid,'specialUpdate',"authorityserver");
351 }
352
353
354
355 sub XMLgetauthority {
356     # Returns MARC::XML of the authority passed in parameter.
357     my ( $dbh, $authid ) = @_;
358     my $sth =  $dbh->prepare("select marcxml from auth_header where authid=? "  );
359     $sth->execute($authid);
360  my ($marcxml)=$sth->fetchrow;
361         $marcxml=Encode::decode('utf8',$marcxml);
362  return ($marcxml);
363 }
364
365 sub XMLgetauthorityhash {
366 ## Utility to return  hashed MARCXML
367 my ($dbh,$authid)=@_;
368 my $xml=XMLgetauthority($dbh,$authid);
369 my $xmlhash=XML_xml2hash_onerecord($xml);
370 return $xmlhash;
371 }
372
373
374
375
376 sub AUTHgetauth_type {
377         my ($authtypecode) = @_;
378         my $dbh=C4::Context->dbh;
379         my $sth=$dbh->prepare("select * from auth_types where authtypecode=?");
380         $sth->execute($authtypecode);
381         return $sth->fetchrow_hashref;
382 }
383
384
385 sub AUTHmodauthority {
386 ## $record is expected to be an xmlhash
387         my ($dbh,$authid,$record,$authtypecode)=@_;
388         my ($oldrecord)=&XMLgetauthorityhash($dbh,$authid);
389 ### This equality is very dodgy ,It porobaby wont work
390         if ($oldrecord eq $record) {
391                 return $authid;
392         }
393 ##
394 my $sth=$dbh->prepare("update auth_header set marcxml=? where authid=?");
395 # find if linked records exist and delete the link in them
396 my @linkids=XML_readline_asarray($oldrecord,"linkid","authorities");
397
398         foreach my $linkid (@linkids){
399                 ##Modify the record of linked 
400                 my $linkrecord=XMLgetauthorityhash($dbh,$linkid);
401                 my $linktypecode=AUTHfind_authtypecode($dbh,$linkid);
402                 my @linkfields=XML_readline_asarray($linkrecord,"linkid","authorities");
403                 my $updated;
404                        foreach my $linkfield (@linkfields){
405                         if ($linkfield eq $authid){
406                                 XML_writeline_id($linkrecord,"linkid",$linkfield,"","authorities");
407                                 $updated=1;
408                         }
409                        }#foreach linkfield
410                         my $linkedxml=XML_hash2xml($linkrecord);
411                         if ($updated==1){
412                         $sth->execute($linkedxml,$linkid);
413                         ZEBRAop($dbh,$linkid,'specialUpdate',"authorityserver");
414                         }
415         
416         }#foreach linkid
417
418 #Now rewrite the $record to table with an add
419 $authid=AUTHaddauthority($dbh,$record,$authid,$authtypecode);
420
421
422 ### If a library thinks that updating all biblios is a long process and wishes to leave that to a cron job to use merge_authotities.pl
423 ### they should have a system preference "dontmerge=1" otherwise by default biblios will be updated
424
425 if (C4::Context->preference('dontmerge') ){
426 # save the file in localfile/modified_authorities
427         my $cgidir = C4::Context->intranetdir ."/cgi-bin";
428         unless (opendir(DIR, "$cgidir")) {
429                         $cgidir = C4::Context->intranetdir."/";
430         } 
431
432         my $filename = $cgidir."/localfile/modified_authorities/$authid.authid";
433         open AUTH, "> $filename";
434         print AUTH $authid;
435         close AUTH;
436 }else{
437         &merge($dbh,$authid,$record,$authid,$record);
438 }
439 return $authid;
440 }
441
442 sub AUTHdelauthority {
443         my ($dbh,$authid,$keep_biblio) = @_;
444
445 # if the keep_biblio is set to 1, then authority entries in biblio are preserved.
446 # FIXME : delete or not in biblio tables (depending on $keep_biblio flag) is not implemented
447 ZEBRAop($dbh,$authid,"recordDelete","authorityserver");
448 }
449
450 sub ZEBRAdelauthority {
451 my ($dbh,$authid)=@_;
452         $dbh->do("delete from auth_header where authid=$authid") ;
453 }
454
455 sub AUTHfind_authtypecode {
456         my ($dbh,$authid) = @_;
457         my $sth = $dbh->prepare("select authtypecode from auth_header where authid=?");
458         $sth->execute($authid);
459         my ($authtypecode) = $sth->fetchrow;
460         return $authtypecode;
461 }
462
463
464 sub FindDuplicateauth {
465 ### Should receive an xmlhash
466         my ($record,$authtypecode)=@_;
467         my $dbh = C4::Context->dbh;
468         my $sth = $dbh->prepare("select auth_tag_to_report from auth_types where authtypecode=?");
469         $sth->execute($authtypecode);
470         my ($auth_tag_to_report) = $sth->fetchrow;
471         $sth->finish;
472         # build a request for authoritysearch
473         my (@tags, @and_or, @excluding, @operator, @value, $offset, $length);
474         
475 #       if ($record->field($auth_tag_to_report)) {
476                                 push @tags, $auth_tag_to_report;
477                                 push @operator, "all";
478                                  @value, XML_readline_asarray($record,"","",$auth_tag_to_report);
479 #                       }
480  
481         my ($finalresult,$nbresult) = authoritysearch($dbh,\@tags,\@and_or,\@excluding,\@operator,\@value,0,10,$authtypecode);
482         # there is at least 1 result => return the 1st one
483         if ($nbresult>0) {
484                 return @$finalresult[0]->{authid},@$finalresult[0]->{summary};
485         }
486         # no result, returns nothing
487         return;
488 }
489
490 sub getsummary{
491 ## give this an XMLhash record to return summary
492 my ($dbh,$record,$authid,$authtypecode)=@_;
493  my $authref = getauthtype($authtypecode);
494                 my $summary = $authref->{summary};
495                 # if the library has a summary defined, use it. Otherwise, build a standard one
496         if ($summary) {
497                         my $fields = $record->{'datafield'};
498                         foreach my $field (@$fields) {
499                                 my $tag = $field->{'tag'};                              
500                                 if ($tag<10) {
501                                 my $tagvalue = XML_readline_onerecord($record,"","",$field->{tag});
502                                 $summary =~ s/\[(.?.?.?.?)$tag\*(.*?)]/$1$tagvalue$2\[$1$tag$2]/g;
503                                 } else {
504                                         my @subf = XML_readline_withtags($record,"","",$tag);
505                                         for my $i (0..$#subf) {
506                                                 my $subfieldcode = $subf[$i][0];
507                                                 my $subfieldvalue = $subf[$i][1];
508                                                 my $tagsubf = $tag.$subfieldcode;
509                                                 $summary =~ s/\[(.?.?.?.?)$tagsubf(.*?)]/$1$subfieldvalue$2\[$1$tagsubf$2]/g;
510                                         }## each subf
511                                 }#tag >10
512                         }##each field
513                         $summary =~ s/\[(.*?)]//g;
514                         $summary =~ s/\n/<br>/g;
515         } else {
516 ## $summary did not exist create a standard summary
517                         my $heading; # = $authref->{summary};
518                         my $altheading;
519                         my $seeheading;
520                         my $see;
521                         my $fields = $record->{datafield};
522                         if (C4::Context->preference('marcflavour') eq 'UNIMARC') {
523                         # construct UNIMARC summary, that is quite different from MARC21 one
524                         foreach my $field (@$fields) {
525                                 # accepted form
526                                 if ($field->{tag} = ~/'2..'/) {
527                                         foreach my $subfield ("a".."z"){
528                                         ## Fixme-- if UNICODE uses numeric subfields as well add them
529                                         $heading.=XML_readline_onerecord($record,"","",$field->{tag},$subfield); 
530                                         }
531                                 }##tag 2..
532                                 # rejected form(s)
533                                 if ($field->{tag} = ~/'4..'/) {
534                                         my $value;
535                                         foreach my $subfield ("a".."z"){
536                                         ## Fixme-- if UNICODE uses numeric subfields as well add them
537                                         $value.=XML_readline_onerecord($record,"","",$field->{tag},$subfield);
538                                         }
539                                         $summary.= "&nbsp;&nbsp;&nbsp;<i>".$value."</i><br/>";
540                                         $summary.= "&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;<i>see:</i> ".$heading."<br/>";
541                                 }##tag 4..
542                                 # see :
543                                 if ($field->{tag} = ~/'5..'/) {
544                                         my $value;
545                                         foreach my $subfield ("a".."z"){
546                                         ## Fixme-- if UNICODE uses numeric subfields as well add them
547                                         $value.=XML_readline_onerecord($record,"","",$field->{tag},$subfield);
548                                         }
549                                         $summary.= "&nbsp;&nbsp;&nbsp;<i>".$value."</i><br/>";
550                                         $summary.= "&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;<i>see:</i> ".$heading."<br/>";
551                                 }# tag 5..
552                                 # // form
553                                 if ($field->{tag} = ~/'7..'/) {
554                                         my $value;
555                                         foreach my $subfield ("a".."z"){
556                                         ## Fixme-- if UNICODE uses numeric subfields as well add them
557                                         $value.=XML_readline_onerecord($record,"","",$field->{tag},$subfield);
558                                         }
559                                         $seeheading.= "&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;<i>see also:</i> ".$value."<br />";  
560                                         $altheading.= "&nbsp;&nbsp;&nbsp;".$value."<br />";
561                                         $altheading.= "&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;<i>see also:</i> ".$heading."<br />";
562                                 }# tag 7..
563                         }## Foreach fields
564                                 $summary = "<b>".$heading."</b><br />".$seeheading.$altheading.$summary;        
565                      } else {
566                         # construct MARC21 summary
567                         foreach my $field (@$fields) {
568                                 my $tag="1..";
569                                   if($field->{tag}  =~ /^$tag/) {
570                                               if ($field->{tag} eq '150') {
571                                                 my $value;
572                                                 foreach my $subfield ("a".."z"){
573                                                  $value=XML_readline_onerecord($record,"","","150",$subfield); 
574                                                 $heading.="\$".$subfield.$value if $value;
575                                                         }
576                                               }else{                            
577                                                 foreach my $subfield ("a".."z"){
578                                                 $heading.=XML_readline_onerecord($record,"","",$field->{tag},$subfield); 
579                                                         }
580                                              }### tag 150 or else
581                                    }##tag 1..
582                                 my $tag="4..";
583                                  if($field->{tag}  =~ /^$tag/) {
584                                         foreach my $subfield ("a".."z"){
585                                                 $seeheading.=XML_readline_onerecord($record,"","",$field->{tag},$subfield); 
586                                                 }
587                                         $seeheading.= "&nbsp;&nbsp;&nbsp;".$seeheading."<br />";
588                                         $seeheading.= "&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;<i>see:</i> ".$seeheading."<br />";  
589                                 } #tag 4..
590                                 my $tag="5..";
591                                  if($field->{tag}  =~ /^$tag/) {
592                                         my $value;
593                                         foreach my $subfield ("a".."z"){
594                                                 $value.=XML_readline_onerecord($record,"","",$field->{tag},$subfield); 
595                                                 }
596                                         $seeheading.= "&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;<i>see also:</i> ".$value."<br />";  
597                                         $altheading.= "&nbsp;&nbsp;&nbsp;".$value."<br />";
598                                         $altheading.= "&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;<i>see also:</i> ".$altheading."<br />";
599                                 }#tag 5..
600                                         
601                         }##for each field
602                     $summary.=$heading.$seeheading.$altheading;         
603                 }##USMARC vs UNIMARC
604         }###Summary exists or not
605 return $summary;
606 }
607 sub getdictsummary{
608 ## give this a XML record to return a brief summary
609 my ($dbh,$record,$authid,$authtypecode)=@_;
610  my $authref = getauthtype($authtypecode);
611                 my $summary = $authref->{summary};
612                 my $fields = $record->{'datafield'};
613                 # if the library has a summary defined, use it. Otherwise, build a standard one
614         if ($summary) {
615                         foreach my $field (@$fields) {
616                                 my $tag = $field->{'tag'};                              
617                                 if ($tag<10) {
618                                 my $tagvalue = XML_readline_onerecord($record,"","",$field->{tag});
619                                 $summary =~ s/\[(.?.?.?.?)$tag\*(.*?)]/$1$tagvalue$2\[$1$tag$2]/g;
620                                 } else {
621                                         my @subf = XML_readline_withtags($record,"","",$tag);
622                                         for my $i (0..$#subf) {
623                                                 my $subfieldcode = $subf[$i][0];
624                                                 my $subfieldvalue = $subf[$i][1];
625                                                 my $tagsubf = $tag.$subfieldcode;
626                                                 $summary =~ s/\[(.?.?.?.?)$tagsubf(.*?)]/$1$subfieldvalue$2\[$1$tagsubf$2]/g;
627                                         }## each subf
628                                 }#tag >10
629                         }##each field
630                         $summary =~ s/\[(.*?)]//g;
631                         $summary =~ s/\n/<br>/g;
632                 } else {
633                         my $heading; # = $authref->{summary};
634                         my $altheading;
635                         my $seeheading;
636                         my $see;
637                         my @fields = $record->{datafields};
638                         if (C4::Context->preference('marcflavour') eq 'UNIMARC') {
639                         # construct UNIMARC summary, that is quite different from MARC21 one
640                         foreach my $field (@$fields) {
641                                 # accepted form
642                                 if ($field->{tag} = ~/'2..'/) {
643                                         foreach my $subfield ("a".."z"){
644                                         ## Fixme-- if UNICODE uses numeric subfields as well add them
645                                         $heading.=XML_readline_onerecord($record,"","",$field->{tag},$subfield); 
646                                         }
647                                 }##tag 2..
648                         }
649                                 $summary = $heading;    
650                         } else {
651                         # construct MARC21 summary
652                                 foreach my $field (@fields) {   
653                                         if ($field->{tag}=~/'1..'/){                    
654                                                 $heading.= XML_readline_onerecord($record,"","",$field->{tag},"a");
655                                         }
656                                 } #each fieldd
657                                 
658                                 $summary=$heading;
659                         }# USMARC vs UNIMARC
660                 }### Summary exists
661 return $summary;
662 }
663
664
665 sub merge {
666 ##mergefrom is authid MARCfrom is marcxml hash of authority
667 ### mergeto ditto
668         my ($dbh,$mergefrom,$MARCfrom,$mergeto,$MARCto) = @_;
669         return unless (defined $MARCfrom);
670         return unless (defined $MARCto);
671         my $authtypecodefrom = AUTHfind_authtypecode($dbh,$mergefrom);
672         my $authtypecodeto = AUTHfind_authtypecode($dbh,$mergeto);
673         # return if authority does not exist
674         
675         # search the tag to report
676         my $sth = $dbh->prepare("select auth_tag_to_report from auth_types where authtypecode=?");
677         $sth->execute($authtypecodefrom);
678         my ($auth_tag_to_report) = $sth->fetchrow;
679         my @record_to;
680         # search all biblio tags using this authority.
681         $sth = $dbh->prepare("select distinct tagfield from biblios_subfield_structure where authtypecode=? ");
682         $sth->execute($authtypecodefrom);
683 my @tags_using_authtype;
684         while (my ($tagfield) = $sth->fetchrow) {
685                 push @tags_using_authtype,$tagfield ;
686         }
687 ## The subfield for linking authorities is stored in koha_attr named auth_biblio_link_subf
688 ## This way we may use whichever subfield we want without harcoding 9 in
689 my ($dummyfield,$tagsubfield)=MARCfind_marc_from_kohafield("auth_biblio_link_subf","biblios");
690         # now, find every biblio using this authority
691 ### try ZOOM search here
692 my @oConnection;
693  $oConnection[0]=C4::Context->Zconn("biblioserver");
694 ##$oConnection[0]->option(elementSetName=>"biblios"); ##  Needs a fix
695 my $query;
696 my ($attr2)=MARCfind_attr_from_kohafield("authid");
697 my $attrfield.=$attr2;
698 $query= $attrfield." ".$mergefrom;
699 my ($event,$i);
700 my $oResult = $oConnection[0]->search_pqf($query);
701   while (($i = ZOOM::event(\@oConnection)) != 0) {
702         $event = $oConnection[$i-1]->last_event();
703         last if $event == ZOOM::Event::ZEND;
704    }# while event
705 my $count=$oResult->size();
706 my @reccache;
707 my $z=0;
708 while ( $z<$count ) {
709 my $rec;
710         $rec=$oResult->record($z);
711         my $marcdata = $rec->raw();
712 my $koharecord=Encode::decode("utf8",$marcdata);
713 $koharecord=XML_xml2hash($koharecord);
714  my ( $xmlrecord, @itemsrecord) = XML_separate($koharecord);
715
716 push @reccache, $xmlrecord;
717 $z++;
718 }
719 $oResult->destroy();
720 $oConnection[0]->destroy();
721       foreach my $xmlhash (@reccache){
722         my $update;
723         foreach my $tagfield (@tags_using_authtype){
724
725         ###Change the authid in biblio
726         $xmlhash=XML_writeline_id($xmlhash,$mergefrom,$mergeto,$tagfield,$tagsubfield);
727         ### delete all subfields of bibliorecord
728         $xmlhash=XML_delete_withid($xmlhash,$mergeto,$tagfield,$tagsubfield);
729         ####Read all the data in from authrecord
730         my @record_to=XML_readline_withtags($MARCto,"","",$auth_tag_to_report);
731         ##Write the data to biblio
732                 foreach my $subfield (@record_to) {
733                 ## Replace the data in MARCXML with the new matching authid
734                 XML_writeline_withid($xmlhash,$tagsubfield,$mergeto,$subfield->[1],$tagfield,$subfield->[0]);
735                 $update=1;
736                 }#foreach  $subfield            
737         }#foreach tagfield
738                 if ($update==1){
739                 my $biblionumber=XML_readline_onerecord($xmlhash,"biblionumber","biblios");
740                 my $frameworkcode=MARCfind_frameworkcode($dbh,$biblionumber);
741                 NEWmodbiblio($dbh,$biblionumber,$xmlhash,$frameworkcode) ;
742                 }
743                 
744      }#foreach $xmlhash
745 }#sub
746
747 sub XML_writeline_withid{
748 ## Only used in authorities to update biblios with matching authids
749 my ($xml,$idsubf,$id,$newvalue,$tag,$subf)=@_;
750 my $biblio=$xml->{'datafield'};
751 my $updated=0;
752     if ($tag>9){
753         foreach my $data (@$biblio){
754                         if ($data->{'tag'} eq $tag){
755                         my @subfields=$data->{'subfield'};
756                         foreach my $subfield ( @subfields){
757                               foreach my $code ( @$subfield){
758                                 if ($code->{'code'} eq $idsubf && $code->{'content'} eq $id){
759                                 ###This is the correct tag -- Now reiterate and update
760                                         my @newsubs;
761                                           foreach my $code ( @$subfield){               
762                                                 if ($code->{'code'} eq $subf ){
763                                                 $code->{'content'}=$newvalue;
764                                                 $updated=1;
765                                                 }
766                                            push @newsubs, $code;
767                                         }## each code updated
768                                         if (!$updated){
769                                         ##Create the subfield if it did not exist       
770                                         push @newsubs,{code=>$subf,content=>$newvalue};
771                                         $data->{subfield}= \@newsubs;
772                                         $updated=1;
773                                          }### created   
774                                 }### correct tag with id
775                               }#each code
776                         }##each subfield        
777                 }# tag match
778          }## each datafield
779     }### tag >9
780 return $xml;
781 }
782 sub XML_delete_withid{
783 ## Currently  only usedin authorities
784 ### deletes all the subfields of a matching authid
785 my ($xml,$id,$tag,$idsubf)=@_;
786 my $biblio=$xml->{'datafield'};
787     if ($tag>9){
788         foreach my $data (@$biblio){
789                         if ($data->{'tag'} eq $tag){
790                         my @subfields=$data->{'subfield'};
791                         foreach my $subfield ( @subfields){
792                               foreach my $code ( @$subfield){
793                                 if ($code->{'code'} eq $idsubf && $code->{'content'} eq $id){
794                                 ###This is the correct tag -- Now reiterate and delete all but id subfield
795                                           foreach my $code ( @$subfield){               
796                                                 if ($code->{'code'} ne $idsubf ){
797                                                 $code->{'content'}="";                                  
798                                                 }                                          
799                                           }## each code deleted 
800                                 }### correct tag with id
801                               }#each code
802                         }## each subfield       
803                 }## tag matches
804          }## each datafield
805     }# tag >9
806 return $xml;
807 }
808
809 sub XML_readline_withtags {
810 my ($xml,$kohafield,$recordtype,$tag,$subf)=@_;
811 #$xml represents one record of MARCXML as perlhashed 
812 ## returns an array of read fields--useful for reading repeated fields
813 ### $recordtype is needed for mapping the correct field if supplied
814 ### If only $tag is given reads the whole tag
815 ###Returns subfieldcodes as well
816 my @value;
817  ($tag,$subf)=MARCfind_marc_from_kohafield($kohafield,$recordtype) if $kohafield;
818 if ($tag){
819 ### Only datafields are read
820 my $biblio=$xml->{'datafield'};
821  if ($tag>9){
822         foreach my $data (@$biblio){
823             if ($data->{'tag'} eq $tag){
824                 foreach my $subfield ( $data->{'subfield'}){
825                     foreach my $code ( @$subfield){
826                         if ($code->{'code'} eq $subf || !$subf){
827                         push @value,[$code->{'code'},$code->{'content'}];
828                         }
829                    }# each code
830                 }# each subfield
831            }### tag found
832         }## each tag
833    }##tag >9
834 }## if tag 
835 return @value;
836 }
837
838 END { }       # module clean-up code here (global destructor)
839
840 =back
841
842 =head1 AUTHOR
843
844 Koha Developement team <info@koha.org>
845
846 Paul POULAIN paul.poulain@free.fr
847
848 =cut
849
850 # $Id$
851
852 # Revision 1.30  2006/09/06 16:21:03  tgarip1957
853 # Clean up before final commits
854 #
855 # Revision 1.9.2.6  2005/06/07 10:02:00  tipaul
856 # porting dictionnary search from head to 2.2. there is now a ... facing titles, author & subject, to search in biblio & authorities existing values.
857 #
858 # Revision 1.9.2.5  2005/05/31 14:50:46  tipaul
859 # fix for authority merging. There was a bug on official installs
860 #
861 # Revision 1.9.2.4  2005/05/30 11:24:15  tipaul
862 # fixing a bug : when a field was repeated, the last field was also repeated. (Was due to the "empty" field in html between fields : to separate fields, in html, an empty field is automatically added. in AUTHhtml2marc, this empty field was not discarded correctly)
863 #
864 # Revision 1.9.2.3  2005/04/28 08:45:33  tipaul
865 # porting FindDuplicate feature for authorities from HEAD to rel_2_2, works correctly now.
866 #
867 # Revision 1.9.2.2  2005/02/28 14:03:13  tipaul
868 # * adding search on "main entry" (ie $a subfield) on a given authority (the "search everywhere" field is still here).
869 # * adding a select box to requet "contain" or "begin with" search.
870 # * fixing some bug in authority search (related to "main entry" search)
871 #
872 # Revision 1.9.2.1  2005/02/24 13:12:13  tipaul
873 # saving authority modif in a text file. This will be used soon with another script (in crontab). The script in crontab will retrieve every authorityid in the directory localfile/authorities and modify every biblio using this authority. Those modifs may be long. So they can't be done through http, because we may encounter a webserver timeout, and kill the process before end of the job.
874 # So, it will be done through a cron job.
875 # (/me agree we need some doc for command line scripts)
876 #
877 # Revision 1.9  2004/12/23 09:48:11  tipaul
878 # Minor changes in summary "exploding" (the 3 digits AFTER the subfield were not on the right place).
879 #
880 # Revision 1.8  2004/11/05 10:11:39  tipaul
881 # export auth_count_usage (bugfix)
882 #
883 # Revision 1.7  2004/09/23 16:13:00  tipaul
884 # Bugfix in modification
885 #
886 # Revision 1.6  2004/08/18 16:00:24  tipaul
887 # fixes for authorities management
888 #
889 # Revision 1.5  2004/07/05 13:37:22  doxulting
890 # First step for working authorities
891 #
892 # Revision 1.4  2004/06/22 11:35:37  tipaul
893 # removing % at the beginning of a string to avoid loooonnnngggg searchs
894 #
895 # Revision 1.3  2004/06/17 08:02:13  tipaul
896 # merging tag & subfield in auth_word for better perfs
897 #
898 # Revision 1.2  2004/06/10 08:29:01  tipaul
899 # MARC authority management (continued)
900 #
901 # Revision 1.1  2004/06/07 07:35:01  tipaul
902 # MARC authority management package
903 #
904