Koha/C4/AuthoritiesMarc.pm

834 lines
27 KiB
Perl
Raw Blame History

package C4::AuthoritiesMarc;
# Copyright 2000-2002 Katipo Communications
#
# This file is part of Koha.
#
# Koha is free software; you can redistribute it and/or modify it under the
# terms of the GNU General Public License as published by the Free Software
# Foundation; either version 2 of the License, or (at your option) any later
# version.
#
# Koha is distributed in the hope that it will be useful, but WITHOUT ANY
# WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR
# A PARTICULAR PURPOSE. See the GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License along with
# Koha; if not, write to the Free Software Foundation, Inc., 59 Temple Place,
# Suite 330, Boston, MA 02111-1307 USA
use strict;
require Exporter;
use C4::Context;
use C4::Database;
use C4::Koha;
use MARC::Record;
use C4::Biblio;
use vars qw($VERSION @ISA @EXPORT);
# set the version for version checking
$VERSION = 0.01;
@ISA = qw(Exporter);
@EXPORT = qw(
&AUTHgettagslib
&AUTHfindsubfield
&AUTHfind_authtypecode
&AUTHaddauthority
&AUTHmodauthority
&AUTHdelauthority
&AUTHaddsubfield
&AUTHgetauthority
&authoritysearch
&MARCmodsubfield
&AUTHhtml2marc
&AUTHaddword
&MARCaddword &MARCdelword
&char_decode
);
sub authoritysearch {
my ($dbh, $tags, $and_or, $excluding, $operator, $value, $offset,$length,$authtypecode) = @_;
# build the sql request. She will look like :
# select m1.bibid
# from auth_subfield_table as m1, auth_subfield_table as m2
# where m1.authid=m2.authid and
# (m1.subfieldvalue like "Des%" and m2.subfieldvalue like "27%")
# "Normal" statements
my @normal_tags = ();
my @normal_and_or = ();
my @normal_operator = ();
my @normal_value = ();
# Extracts the NOT statements from the list of statements
for(my $i = 0 ; $i <= $#{$value} ; $i++)
{
if(@$operator[$i] eq "contains") # if operator is contains, splits the words in separate requests
{
foreach my $word (split(/ /, @$value[$i]))
{
unless (C4::Context->stopwords->{uc($word)}) { #it's NOT a stopword => use it. Otherwise, ignore
my $tag = substr(@$tags[$i],0,3);
my $subf = substr(@$tags[$i],3,1);
push @normal_tags, @$tags[$i];
push @normal_and_or, "and"; # assumes "foo" and "bar" if "foo bar" is entered
push @normal_operator, @$operator[$i];
push @normal_value, $word;
}
}
}
else
{
push @normal_tags, @$tags[$i];
push @normal_and_or, @$and_or[$i];
push @normal_operator, @$operator[$i];
push @normal_value, @$value[$i];
}
}
# Finds the basic results without the NOT requests
my ($sql_tables, $sql_where1, $sql_where2) = create_request($dbh,\@normal_tags, \@normal_and_or, \@normal_operator, \@normal_value);
my $sth;
if ($sql_where2) {
$sth = $dbh->prepare("select distinct m1.authid from auth_header,$sql_tables where m1.authid=auth_header.authid and auth_header.authtypecode=? and $sql_where2 and ($sql_where1)");
warn "Q2 : select distinct m1.authid from auth_header,$sql_tables where m1.authid=auth_header.authid and auth_header.authtypecode=? and $sql_where2 and ($sql_where1)";
} else {
$sth = $dbh->prepare("select distinct m1.authid from auth_header,$sql_tables where m1.authid=auth_header.authid and auth_header.authtypecode=? and $sql_where1");
warn "Q : select distinct m1.authid from auth_header,$sql_tables where m1.authid=auth_header.authid and auth_header.authtypecode=? and $sql_where1";
}
$sth->execute($authtypecode);
my @result = ();
while (my ($authid) = $sth->fetchrow) {
warn "AUTH: $authid";
push @result,$authid;
}
# we have authid list. Now, loads summary from [offset] to [offset]+[length]
my $counter = $offset;
my @finalresult = ();
my $oldline;
while (($counter <= $#result) && ($counter <= ($offset + $length))) {
# warn " HERE : $counter, $#result, $offset, $length";
# get MARC::Record of the authority
my $record = AUTHgetauthority($dbh,$result[$counter]);
# then build the summary
my $authtypecode = AUTHfind_authtypecode($dbh,$result[$counter]);
my $authref = getauthtype($authtypecode);
my $summary = $authref->{summary};
my @fields = $record->fields();
foreach my $field (@fields) {
my $tag = $field->tag();
if ($tag<10) {
} else {
my @subf = $field->subfields;
for my $i (0..$#subf) {
my $subfieldcode = $subf[$i][0];
my $subfieldvalue = $subf[$i][1];
my $tagsubf = $tag.$subfieldcode;
$summary =~ s/\[(.?.?.?)$tagsubf(.*?)]/$1$subfieldvalue\[$1$tagsubf$2]$2$3/g;
}
}
}
$summary =~ s/\[(.*?)]//g;
$summary =~ s/\n/<br>/g;
# find biblio MARC field using this authtypecode (to jump to biblio)
my $authtypecode = AUTHfind_authtypecode($dbh,$result[$counter]);
my $sth = $dbh->prepare("select distinct tagfield from marc_subfield_structure where authtypecode=?");
$sth->execute($authtypecode);
my $tags_using_authtype;
while (my ($tagfield) = $sth->fetchrow) {
# warn "TAG : $tagfield";
$tags_using_authtype.= $tagfield."9,";
}
chop $tags_using_authtype;
# then add a line for the template loop
my %newline;
$newline{summary} = $summary;
$newline{authid} = $result[$counter];
$newline{used} = &AUTHcount_usage($result[$counter]);
$newline{biblio_fields} = $tags_using_authtype;
$counter++;
push @finalresult, \%newline;
}
my $nbresults = $#result + 1;
return (\@finalresult, $nbresults);
}
# Creates the SQL Request
sub create_request {
my ($dbh,$tags, $and_or, $operator, $value) = @_;
my $sql_tables; # will contain marc_subfield_table as m1,...
my $sql_where1; # will contain the "true" where
my $sql_where2 = "("; # will contain m1.authid=m2.authid
my $nb_active=0; # will contain the number of "active" entries. and entry is active is a value is provided.
my $nb_table=1; # will contain the number of table. ++ on each entry EXCEPT when an OR is provided.
for(my $i=0; $i<=@$value;$i++) {
if (@$value[$i]) {
$nb_active++;
if ($nb_active==1) {
if (@$operator[$i] eq "start") {
$sql_tables .= "auth_subfield_table as m$nb_table,";
$sql_where1 .= "(m1.subfieldvalue like ".$dbh->quote("@$value[$i]%");
if (@$tags[$i]) {
$sql_where1 .=" and m1.tag+m1.subfieldcode in (@$tags[$i])";
}
$sql_where1.=")";
} elsif (@$operator[$i] eq "contains") {
$sql_tables .= "auth_word as m$nb_table,";
$sql_where1 .= "(m1.word like ".$dbh->quote("@$value[$i]%");
if (@$tags[$i]) {
$sql_where1 .=" and m1.tagsubfield in (@$tags[$i])";
}
$sql_where1.=")";
} else {
$sql_tables .= "auth_subfield_table as m$nb_table,";
$sql_where1 .= "(m1.subfieldvalue @$operator[$i] ".$dbh->quote("@$value[$i]");
if (@$tags[$i]) {
$sql_where1 .=" and m1.tag+m1.subfieldcode in (@$tags[$i])";
}
$sql_where1.=")";
}
} else {
if (@$operator[$i] eq "start") {
$nb_table++;
$sql_tables .= "auth_subfield_table as m$nb_table,";
$sql_where1 .= "@$and_or[$i] (m$nb_table.subfieldvalue like ".$dbh->quote("@$value[$i]%");
if (@$tags[$i]) {
$sql_where1 .=" and m$nb_table.tag+m$nb_table.subfieldcode in (@$tags[$i])";
}
$sql_where1.=")";
$sql_where2 .= "m1.authid=m$nb_table.authid and ";
} elsif (@$operator[$i] eq "contains") {
if (@$and_or[$i] eq 'and') {
$nb_table++;
$sql_tables .= "auth_word as m$nb_table,";
$sql_where1 .= "@$and_or[$i] (m$nb_table.word like ".$dbh->quote("@$value[$i]%");
if (@$tags[$i]) {
$sql_where1 .=" and m$nb_table.tagsubfield in(@$tags[$i])";
}
$sql_where1.=")";
$sql_where2 .= "m1.authid=m$nb_table.authid and ";
} else {
$sql_where1 .= "@$and_or[$i] (m$nb_table.word like ".$dbh->quote("@$value[$i]%");
if (@$tags[$i]) {
$sql_where1 .=" and m$nb_table.tag+m$nb_table.subfieldid in (@$tags[$i])";
}
$sql_where1.=")";
$sql_where2 .= "m1.authid=m$nb_table.authid and ";
}
} else {
$nb_table++;
$sql_tables .= "auth_subfield_table as m$nb_table,";
$sql_where1 .= "@$and_or[$i] (m$nb_table.subfieldvalue @$operator[$i] ".$dbh->quote(@$value[$i]);
if (@$tags[$i]) {
$sql_where1 .=" and m$nb_table.tag+m$nb_table.subfieldcode in (@$tags[$i])";
}
$sql_where2 .= "m1.authid=m$nb_table.authid and ";
$sql_where1.=")";
}
}
}
}
if($sql_where2 ne "(") # some datas added to sql_where2, processing
{
$sql_where2 = substr($sql_where2, 0, (length($sql_where2)-5)); # deletes the trailing ' and '
$sql_where2 .= ")";
}
else # no sql_where2 statement, deleting '('
{
$sql_where2 = "";
}
chop $sql_tables; # deletes the trailing ','
return ($sql_tables, $sql_where1, $sql_where2);
}
sub AUTHcount_usage {
my ($authid) = @_;
my $dbh = C4::Context->dbh;
# find MARC fields using this authtype
my $authtypecode = AUTHfind_authtypecode($dbh,$authid);
my $sth = $dbh->prepare("select distinct tagfield from marc_subfield_structure where authtypecode=?");
$sth->execute($authtypecode);
my $tags_using_authtype;
while (my ($tagfield) = $sth->fetchrow) {
# warn "TAG : $tagfield";
$tags_using_authtype.= "'".$tagfield."9',";
}
chop $tags_using_authtype;
$sth = $dbh->prepare("select count(*) from marc_subfield_table where concat(tag,subfieldcode) in ($tags_using_authtype) and subfieldvalue=?");
# warn "Q : select count(*) from marc_subfield_table where concat(tag,subfieldcode) in ($tags_using_authtype) and subfieldvalue=$authid";
$sth->execute($authid);
my ($result) = $sth->fetchrow;
# warn "Authority $authid TOTAL USED : $result";
return $result;
}
# merging 2 authority entries. After a merge, the "from" can be deleted.
# sub AUTHmerge {
# my ($auth_merge_from,$auth_merge_to) = @_;
# my $dbh = C4::Context->dbh;
# # find MARC fields using this authtype
# my $authtypecode = AUTHfind_authtypecode($dbh,$authid);
# # retrieve records
# my $record_from = AUTHgetauthority($dbh,$auth_merge_from);
# my $record_to = AUTHgetauthority($dbh,$auth_merge_to);
# my $sth = $dbh->prepare("select distinct tagfield from marc_subfield_structure where authtypecode=?");
# $sth->execute($authtypecode);
# my $tags_using_authtype;
# while (my ($tagfield) = $sth->fetchrow) {
# warn "TAG : $tagfield";
# $tags_using_authtype.= "'".$tagfield."9',";
# }
# chop $tags_using_authtype;
# # now, find every biblio using this authority
# $sth = $dbh->prepare("select bibid,tag,tag_indicator,tagorder from marc_subfield_table where tag+subfieldid in ($tags_using_authtype) and subfieldvalue=?");
# $sth->execute($authid);
# # and delete entries before recreating them
# while (my ($bibid,$tag,$tag_indicator,$tagorder) = $sth->fetchrow) {
# &MARCdelsubfield($dbh,$bibid,$tag);
#
# }
#
# }
sub AUTHfind_authtypecode {
my ($dbh,$authid) = @_;
my $sth = $dbh->prepare("select authtypecode from auth_header where authid=?");
$sth->execute($authid);
my ($authtypecode) = $sth->fetchrow;
return $authtypecode;
}
sub AUTHgettagslib {
my ($dbh,$forlibrarian,$authtypecode)= @_;
# warn "AUTH : $authtypecode";
$authtypecode="" unless $authtypecode;
# warn "AUTH : $authtypecode";
my $sth;
my $libfield = ($forlibrarian eq 1)? 'liblibrarian' : 'libopac';
# check that framework exists
$sth=$dbh->prepare("select count(*) from auth_tag_structure where authtypecode=?");
$sth->execute($authtypecode);
my ($total) = $sth->fetchrow;
$authtypecode="" unless ($total >0);
$sth=$dbh->prepare("select tagfield,$libfield as lib,mandatory,repeatable from auth_tag_structure where authtypecode=? order by tagfield");
$sth->execute($authtypecode);
my ($lib,$tag,$res,$tab,$mandatory,$repeatable);
while ( ($tag,$lib,$mandatory,$repeatable) = $sth->fetchrow) {
$res->{$tag}->{lib}=$lib;
$res->{$tab}->{tab}=""; # XXX
$res->{$tag}->{mandatory}=$mandatory;
$res->{$tag}->{repeatable}=$repeatable;
}
$sth=$dbh->prepare("select tagfield,tagsubfield,$libfield as lib,tab, mandatory, repeatable,authorised_value,value_builder,seealso from auth_subfield_structure where authtypecode=? order by tagfield,tagsubfield");
$sth->execute($authtypecode);
my $subfield;
my $authorised_value;
my $thesaurus_category;
my $value_builder;
my $kohafield;
my $seealso;
my $hidden;
my $isurl;
while ( ($tag, $subfield, $lib, $tab, $mandatory, $repeatable,$authorised_value,$value_builder,$seealso) = $sth->fetchrow) {
$res->{$tag}->{$subfield}->{lib}=$lib;
$res->{$tag}->{$subfield}->{tab}=$tab;
$res->{$tag}->{$subfield}->{mandatory}=$mandatory;
$res->{$tag}->{$subfield}->{repeatable}=$repeatable;
$res->{$tag}->{$subfield}->{authorised_value}=$authorised_value;
$res->{$tag}->{$subfield}->{thesaurus_category}=$thesaurus_category;
$res->{$tag}->{$subfield}->{value_builder}=$value_builder;
$res->{$tag}->{$subfield}->{seealso}=$seealso;
$res->{$tag}->{$subfield}->{hidden}=$hidden;
$res->{$tag}->{$subfield}->{isurl}=$isurl;
}
return $res;
}
sub AUTHaddauthority {
# pass the MARC::Record to this function, and it will create the records in the marc tables
my ($dbh,$record,$authid,$authtypecode) = @_;
my @fields=$record->fields();
# warn "IN AUTHaddauthority $authid => ".$record->as_formatted;
# adding main table, and retrieving authid
# if authid is sent, then it's not a true add, it's only a re-add, after a delete (ie, a mod)
# if authid empty => true add, find a new authid number
unless ($authid) {
$dbh->do("lock tables auth_header WRITE,auth_subfield_table WRITE, auth_word WRITE, stopwords READ");
my $sth=$dbh->prepare("insert into auth_header (datecreated,authtypecode) values (now(),?)");
$sth->execute($authtypecode);
$sth=$dbh->prepare("select max(authid) from auth_header");
$sth->execute;
($authid)=$sth->fetchrow;
$sth->finish;
}
my $fieldcount=0;
# now, add subfields...
foreach my $field (@fields) {
$fieldcount++;
if ($field->tag() <10) {
&AUTHaddsubfield($dbh,$authid,
$field->tag(),
'',
$fieldcount,
'',
1,
$field->data()
);
} else {
my @subfields=$field->subfields();
foreach my $subfieldcount (0..$#subfields) {
&AUTHaddsubfield($dbh,$authid,
$field->tag(),
$field->indicator(1).$field->indicator(2),
$fieldcount,
$subfields[$subfieldcount][0],
$subfieldcount+1,
$subfields[$subfieldcount][1]
);
}
}
}
$dbh->do("unlock tables");
return $authid;
}
sub AUTHaddsubfield {
# Add a new subfield to a tag into the DB.
my ($dbh,$authid,$tagid,$tag_indicator,$tagorder,$subfieldcode,$subfieldorder,$subfieldvalues) = @_;
# if not value, end of job, we do nothing
if (length($subfieldvalues) ==0) {
return;
}
if (not($subfieldcode)) {
$subfieldcode=' ';
}
my @subfieldvalues = split /\|/,$subfieldvalues;
foreach my $subfieldvalue (@subfieldvalues) {
my $sth=$dbh->prepare("insert into auth_subfield_table (authid,tag,tagorder,tag_indicator,subfieldcode,subfieldorder,subfieldvalue) values (?,?,?,?,?,?,?)");
$sth->execute($authid,(sprintf "%03s",$tagid),$tagorder,$tag_indicator,$subfieldcode,$subfieldorder,$subfieldvalue);
if ($sth->errstr) {
warn "ERROR ==> insert into auth_subfield_table (authid,tag,tagorder,tag_indicator,subfieldcode,subfieldorder,subfieldvalue) values ($authid,$tagid,$tagorder,$tag_indicator,$subfieldcode,$subfieldorder,$subfieldvalue)\n";
}
&AUTHaddword($dbh,$authid,$tagid,$tagorder,$subfieldcode,$subfieldorder,$subfieldvalue);
}
}
sub AUTHgetauthority {
# Returns MARC::Record of the biblio passed in parameter.
my ($dbh,$authid)=@_;
my $record = MARC::Record->new();
#---- TODO : the leader is missing
$record->leader(' ');
my $sth=$dbh->prepare("select authid,subfieldid,tag,tagorder,tag_indicator,subfieldcode,subfieldorder,subfieldvalue
from auth_subfield_table
where authid=? order by tag,tagorder,subfieldcode
");
$sth->execute($authid);
my $prevtagorder=1;
my $prevtag='XXX';
my $previndicator;
my $field; # for >=10 tags
my $prevvalue; # for <10 tags
while (my $row=$sth->fetchrow_hashref) {
if ($row->{tagorder} ne $prevtagorder || $row->{tag} ne $prevtag) {
$previndicator.=" ";
if ($prevtag <10) {
$record->add_fields((sprintf "%03s",$prevtag),$prevvalue) unless $prevtag eq "XXX"; # ignore the 1st loop
} else {
$record->add_fields($field) unless $prevtag eq "XXX";
}
undef $field;
$prevtagorder=$row->{tagorder};
$prevtag = $row->{tag};
$previndicator=$row->{tag_indicator};
if ($row->{tag}<10) {
$prevvalue = $row->{subfieldvalue};
} else {
$field = MARC::Field->new((sprintf "%03s",$prevtag), substr($row->{tag_indicator}.' ',0,1), substr($row->{tag_indicator}.' ',1,1), $row->{'subfieldcode'}, $row->{'subfieldvalue'} );
}
} else {
if ($row->{tag} <10) {
$record->add_fields((sprintf "%03s",$row->{tag}), $row->{'subfieldvalue'});
} else {
$field->add_subfields($row->{'subfieldcode'}, $row->{'subfieldvalue'} );
}
$prevtag= $row->{tag};
$previndicator=$row->{tag_indicator};
}
}
# the last has not been included inside the loop... do it now !
if ($prevtag ne "XXX") { # check that we have found something. Otherwise, prevtag is still XXX and we
# must return an empty record, not make MARC::Record fail because we try to
# create a record with XXX as field :-(
if ($prevtag <10) {
$record->add_fields($prevtag,$prevvalue);
} else {
# my $field = MARC::Field->new( $prevtag, "", "", %subfieldlist);
$record->add_fields($field);
}
}
return $record;
}
sub AUTHmodauthority {
my ($dbh,$authid,$record,$delete)=@_;
my $oldrecord=&AUTHgetauthority($dbh,$authid);
if ($oldrecord eq $record) {
return;
}
# 1st delete the authority,
# 2nd recreate it
&AUTHdelauthority($dbh,$authid,1);
&AUTHaddauthority($dbh,$record,$authid);
# FIXME : modify the authority in biblio too.
}
sub AUTHdelauthority {
my ($dbh,$authid,$keep_biblio) = @_;
# if the keep_biblio is set to 1, then authority entries in biblio are preserved.
# This flag is set when the delauthority is called by modauthority
# due to a too complex structure of MARC (repeatable fields and subfields),
# the best solution for a modif is to delete / recreate the record.
my $record = AUTHgetauthority($dbh,$authid);
$dbh->do("delete from auth_header where authid=$authid");
$dbh->do("delete from auth_subfield_table where authid=$authid");
$dbh->do("delete from auth_word where authid=$authid");
# FIXME : delete or not in biblio tables (depending on $keep_biblio flag)
}
sub AUTHmodsubfield {
# Subroutine changes a subfield value given a subfieldid.
my ($dbh, $subfieldid, $subfieldvalue )=@_;
$dbh->do("lock tables auth_subfield_table WRITE");
my $sth=$dbh->prepare("update auth_subfield_table set subfieldvalue=? where subfieldid=?");
$sth->execute($subfieldvalue, $subfieldid);
$dbh->do("unlock tables");
$sth->finish;
$sth=$dbh->prepare("select authid,tag,tagorder,subfieldcode,subfieldid,subfieldorder from auth_subfield_table where subfieldid=?");
$sth->execute($subfieldid);
my ($authid,$tagid,$tagorder,$subfieldcode,$x,$subfieldorder) = $sth->fetchrow;
$subfieldid=$x;
&AUTHdelword($dbh,$authid,$tagid,$tagorder,$subfieldcode,$subfieldorder);
&AUTHaddword($dbh,$authid,$tagid,$tagorder,$subfieldcode,$subfieldorder,$subfieldvalue);
return($subfieldid, $subfieldvalue);
}
sub AUTHfindsubfield {
my ($dbh,$authid,$tag,$subfieldcode,$subfieldorder,$subfieldvalue) = @_;
my $resultcounter=0;
my $subfieldid;
my $lastsubfieldid;
my $query="select subfieldid from auth_subfield_table where authid=? and tag=? and subfieldcode=?";
my @bind_values = ($authid,$tag, $subfieldcode);
if ($subfieldvalue) {
$query .= " and subfieldvalue=?";
push(@bind_values,$subfieldvalue);
} else {
if ($subfieldorder<1) {
$subfieldorder=1;
}
$query .= " and subfieldorder=?";
push(@bind_values,$subfieldorder);
}
my $sti=$dbh->prepare($query);
$sti->execute(@bind_values);
while (($subfieldid) = $sti->fetchrow) {
$resultcounter++;
$lastsubfieldid=$subfieldid;
}
if ($resultcounter>1) {
# Error condition. Values given did not resolve into a unique record. Don't know what to edit
# should rarely occur (only if we use subfieldvalue with a value that exists twice, which is strange)
return -1;
} else {
return $lastsubfieldid;
}
}
sub AUTHfindsubfieldid {
my ($dbh,$authid,$tag,$tagorder,$subfield,$subfieldorder) = @_;
my $sth=$dbh->prepare("select subfieldid from auth_subfield_table
where authid=? and tag=? and tagorder=?
and subfieldcode=? and subfieldorder=?");
$sth->execute($authid,$tag,$tagorder,$subfield,$subfieldorder);
my ($res) = $sth->fetchrow;
unless ($res) {
$sth=$dbh->prepare("select subfieldid from auth_subfield_table
where authid=? and tag=? and tagorder=?
and subfieldcode=?");
$sth->execute($authid,$tag,$tagorder,$subfield);
($res) = $sth->fetchrow;
}
return $res;
}
sub AUTHfind_authtypecode {
my ($dbh,$authid) = @_;
my $sth = $dbh->prepare("select authtypecode from auth_header where authid=?");
$sth->execute($authid);
my ($authtypecode) = $sth->fetchrow;
return $authtypecode;
}
sub AUTHdelsubfield {
# delete a subfield for $authid / tag / tagorder / subfield / subfieldorder
my ($dbh,$authid,$tag,$tagorder,$subfield,$subfieldorder) = @_;
$dbh->do("delete from auth_subfield_table where authid='$authid' and
tag='$tag' and tagorder='$tagorder'
and subfieldcode='$subfield' and subfieldorder='$subfieldorder'
");
}
sub AUTHhtml2marc {
my ($dbh,$rtags,$rsubfields,$rvalues,%indicators) = @_;
my $prevtag = -1;
my $record = MARC::Record->new();
# my %subfieldlist=();
my $prevvalue; # if tag <10
my $field; # if tag >=10
for (my $i=0; $i< @$rtags; $i++) {
# rebuild MARC::Record
if (@$rtags[$i] ne $prevtag) {
if ($prevtag < 10) {
if ($prevvalue) {
$record->add_fields((sprintf "%03s",$prevtag),$prevvalue);
}
} else {
if ($field) {
$record->add_fields($field);
}
}
$indicators{@$rtags[$i]}.=' ';
if (@$rtags[$i] <10) {
$prevvalue= @$rvalues[$i];
} else {
$field = MARC::Field->new( (sprintf "%03s",@$rtags[$i]), substr($indicators{@$rtags[$i]},0,1),substr($indicators{@$rtags[$i]},1,1), @$rsubfields[$i] => @$rvalues[$i]);
}
$prevtag = @$rtags[$i];
} else {
if (@$rtags[$i] <10) {
$prevvalue=@$rvalues[$i];
} else {
if (@$rvalues[$i]) {
$field->add_subfields(@$rsubfields[$i] => @$rvalues[$i]);
}
}
$prevtag= @$rtags[$i];
}
}
# the last has not been included inside the loop... do it now !
$record->add_fields($field);
# warn $record->as_formatted;
return $record;
}
sub AUTHaddword {
# split a subfield string and adds it into the word table.
# removes stopwords
my ($dbh,$authid,$tag,$tagorder,$subfieldid,$subfieldorder,$sentence) =@_;
$sentence =~ s/(\.|\?|\:|\!|\'|,|\-|\"|\(|\)|\[|\]|\{|\})/ /g;
my @words = split / /,$sentence;
my $stopwords= C4::Context->stopwords;
my $sth=$dbh->prepare("insert into auth_word (authid, tagsubfield, tagorder, subfieldorder, word, sndx_word)
values (?,concat(?,?),?,?,?,soundex(?))");
foreach my $word (@words) {
# we record only words longer than 2 car and not in stopwords hash
if (length($word)>2 and !($stopwords->{uc($word)})) {
$sth->execute($authid,$tag,$subfieldid,$tagorder,$subfieldorder,$word,$word);
if ($sth->err()) {
warn "ERROR ==> insert into auth_word (authid, tagsubfield, tagorder, subfieldorder, word, sndx_word) values ($authid,concat($tag,$subfieldid),$tagorder,$subfieldorder,$word,soundex($word))\n";
}
}
}
}
sub AUTHdelword {
# delete words. this sub deletes all the words from a sentence. a subfield modif is done by a delete then a add
my ($dbh,$authid,$tag,$tagorder,$subfield,$subfieldorder) = @_;
my $sth=$dbh->prepare("delete from auth_word where authid=? and tagsubfield=concat(?,?) and tagorder=? and subfieldorder=?");
$sth->execute($authid,$tag,$subfield,$tagorder,$subfieldorder);
}
sub char_decode {
# converts ISO 5426 coded string to ISO 8859-1
# sloppy code : should be improved in next issue
my ($string,$encoding) = @_ ;
$_ = $string ;
# $encoding = C4::Context->preference("marcflavour") unless $encoding;
if ($encoding eq "UNIMARC") {
s/\xe1/<2F>/gm ;
s/\xe2/<2F>/gm ;
s/\xe9/<2F>/gm ;
s/\xec/<2F>/gm ;
s/\xf1/<2F>/gm ;
s/\xf3/<2F>/gm ;
s/\xf9/<2F>/gm ;
s/\xfb/<2F>/gm ;
s/\xc1\x61/<2F>/gm ;
s/\xc1\x65/<2F>/gm ;
s/\xc1\x69/<2F>/gm ;
s/\xc1\x6f/<2F>/gm ;
s/\xc1\x75/<2F>/gm ;
s/\xc1\x41/<2F>/gm ;
s/\xc1\x45/<2F>/gm ;
s/\xc1\x49/<2F>/gm ;
s/\xc1\x4f/<2F>/gm ;
s/\xc1\x55/<2F>/gm ;
s/\xc2\x41/<2F>/gm ;
s/\xc2\x45/<2F>/gm ;
s/\xc2\x49/<2F>/gm ;
s/\xc2\x4f/<2F>/gm ;
s/\xc2\x55/<2F>/gm ;
s/\xc2\x59/<2F>/gm ;
s/\xc2\x61/<2F>/gm ;
s/\xc2\x65/<2F>/gm ;
s/\xc2\x69/<2F>/gm ;
s/\xc2\x6f/<2F>/gm ;
s/\xc2\x75/<2F>/gm ;
s/\xc2\x79/<2F>/gm ;
s/\xc3\x41/<2F>/gm ;
s/\xc3\x45/<2F>/gm ;
s/\xc3\x49/<2F>/gm ;
s/\xc3\x4f/<2F>/gm ;
s/\xc3\x55/<2F>/gm ;
s/\xc3\x61/<2F>/gm ;
s/\xc3\x65/<2F>/gm ;
s/\xc3\x69/<2F>/gm ;
s/\xc3\x6f/<2F>/gm ;
s/\xc3\x75/<2F>/gm ;
s/\xc4\x41/<2F>/gm ;
s/\xc4\x4e/<2F>/gm ;
s/\xc4\x4f/<2F>/gm ;
s/\xc4\x61/<2F>/gm ;
s/\xc4\x6e/<2F>/gm ;
s/\xc4\x6f/<2F>/gm ;
s/\xc8\x45/<2F>/gm ;
s/\xc8\x49/<2F>/gm ;
s/\xc8\x65/<2F>/gm ;
s/\xc8\x69/<2F>/gm ;
s/\xc8\x76/<2F>/gm ;
s/\xc9\x41/<2F>/gm ;
s/\xc9\x4f/<2F>/gm ;
s/\xc9\x55/<2F>/gm ;
s/\xc9\x61/<2F>/gm ;
s/\xc9\x6f/<2F>/gm ;
s/\xc9\x75/<2F>/gm ;
s/\xca\x41/<2F>/gm ;
s/\xca\x61/<2F>/gm ;
s/\xd0\x43/<2F>/gm ;
s/\xd0\x63/<2F>/gm ;
# this handles non-sorting blocks (if implementation requires this)
$string = nsb_clean($_) ;
} elsif ($encoding eq "USMARC" || $encoding eq "MARC21") {
if(/[\xc1-\xff]/) {
s/\xe1\x61/<2F>/gm ;
s/\xe1\x65/<2F>/gm ;
s/\xe1\x69/<2F>/gm ;
s/\xe1\x6f/<2F>/gm ;
s/\xe1\x75/<2F>/gm ;
s/\xe1\x41/<2F>/gm ;
s/\xe1\x45/<2F>/gm ;
s/\xe1\x49/<2F>/gm ;
s/\xe1\x4f/<2F>/gm ;
s/\xe1\x55/<2F>/gm ;
s/\xe2\x41/<2F>/gm ;
s/\xe2\x45/<2F>/gm ;
s/\xe2\x49/<2F>/gm ;
s/\xe2\x4f/<2F>/gm ;
s/\xe2\x55/<2F>/gm ;
s/\xe2\x59/<2F>/gm ;
s/\xe2\x61/<2F>/gm ;
s/\xe2\x65/<2F>/gm ;
s/\xe2\x69/<2F>/gm ;
s/\xe2\x6f/<2F>/gm ;
s/\xe2\x75/<2F>/gm ;
s/\xe2\x79/<2F>/gm ;
s/\xe3\x41/<2F>/gm ;
s/\xe3\x45/<2F>/gm ;
s/\xe3\x49/<2F>/gm ;
s/\xe3\x4f/<2F>/gm ;
s/\xe3\x55/<2F>/gm ;
s/\xe3\x61/<2F>/gm ;
s/\xe3\x65/<2F>/gm ;
s/\xe3\x69/<2F>/gm ;
s/\xe3\x6f/<2F>/gm ;
s/\xe3\x75/<2F>/gm ;
s/\xe4\x41/<2F>/gm ;
s/\xe4\x4e/<2F>/gm ;
s/\xe4\x4f/<2F>/gm ;
s/\xe4\x61/<2F>/gm ;
s/\xe4\x6e/<2F>/gm ;
s/\xe4\x6f/<2F>/gm ;
s/\xe8\x45/<2F>/gm ;
s/\xe8\x49/<2F>/gm ;
s/\xe8\x65/<2F>/gm ;
s/\xe8\x69/<2F>/gm ;
s/\xe8\x76/<2F>/gm ;
s/\xe9\x41/<2F>/gm ;
s/\xe9\x4f/<2F>/gm ;
s/\xe9\x55/<2F>/gm ;
s/\xe9\x61/<2F>/gm ;
s/\xe9\x6f/<2F>/gm ;
s/\xe9\x75/<2F>/gm ;
s/\xea\x41/<2F>/gm ;
s/\xea\x61/<2F>/gm ;
# this handles non-sorting blocks (if implementation requires this)
$string = nsb_clean($_) ;
}
}
return($string) ;
}
sub nsb_clean {
my $NSB = '\x88' ; # NSB : begin Non Sorting Block
my $NSE = '\x89' ; # NSE : Non Sorting Block end
# handles non sorting blocks
my ($string) = @_ ;
$_ = $string ;
s/$NSB/(/gm ;
s/[ ]{0,1}$NSE/) /gm ;
$string = $_ ;
return($string) ;
}
END { } # module clean-up code here (global destructor)
=back
=head1 AUTHOR
Koha Developement team <info@koha.org>
Paul POULAIN paul.poulain@free.fr
=cut
# $Id$
# $Log$
# Revision 1.3 2004/06/17 08:02:13 tipaul
# merging tag & subfield in auth_word for better perfs
#
# Revision 1.2 2004/06/10 08:29:01 tipaul
# MARC authority management (continued)
#
# Revision 1.1 2004/06/07 07:35:01 tipaul
# MARC authority management package
#