# 2005-08-04 13:27:37 +00:00

# 984 lines
# 33 KiB
# Raw Blame History

package C4::AuthoritiesMarc;
# Copyright 2000-2002 Katipo Communications
# This file is part of Koha.
# Koha is free software; you can redistribute it and/or modify it under the
# terms of the GNU General Public License as published by the Free Software
# Foundation; either version 2 of the License, or (at your option) any later
# version.
# Koha is distributed in the hope that it will be useful, but WITHOUT ANY
# WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR
# A PARTICULAR PURPOSE. See the GNU General Public License for more details.
# You should have received a copy of the GNU General Public License along with
# Koha; if not, write to the Free Software Foundation, Inc., 59 Temple Place,
# Suite 330, Boston, MA 02111-1307 USA
use strict;
require Exporter;
use C4::Context;
use C4::Database;
use C4::Koha;
use MARC::Record;
use C4::Biblio;
use vars qw($VERSION @ISA @EXPORT);

# set the version for version checking
$VERSION = 0.01;

@ISA = qw(Exporter);

# Symbols exported by default.
# The list is now explicitly closed so that it cannot swallow the code that
# follows it.
# NOTE(review): only these two names are visible in the list, and neither is
# defined in this file (the word helpers defined here are AUTHaddword and
# AUTHdelword) -- confirm the intended export list.
@EXPORT = qw(
    &MARCaddword &MARCdelword
);
# authoritysearch($dbh, $tags, $and_or, $excluding, $operator, $value, $offset, $length, $authtypecode)
# Searches the authority tables and returns (\@finalresult, $nbresults):
#   - \@finalresult : one hash per authority in the requested window, with the
#                     keys summary, authid, used, biblio_fields, even, mainentry
#   - $nbresults    : total number of authids found by the query
# $tags, $and_or, $operator and $value are array references read in parallel.
# The elements of $tags and $value are rewritten in place, so the caller's
# arrays are modified.
# NOTE(review): $excluding is unpacked but not referenced in the visible body.
# NOTE(review): several closing braces and execute() calls are not visible in
# this copy of the sub -- confirm against the repository version.
sub authoritysearch {
my ($dbh, $tags, $and_or, $excluding, $operator, $value, $offset,$length,$authtypecode) = @_;
# build the sql request. She will look like :
# select m1.bibid
# from auth_subfield_table as m1, auth_subfield_table as m2
# where m1.authid=m2.authid and
# (m1.subfieldvalue like "Des%" and m2.subfieldvalue like "27%")
# the marclist may contain "mainentry". In this case, search the tag_to_report, that depends on
# the authtypecode. Then, search on $a of this tag_to_report
# also store main entry MARC tag, to extract it at end of search
my $mainentrytag;
# NOTE(review): no execute() is visible between this prepare and the fetchrow
# that follows -- confirm.
my $sth = $dbh->prepare("select auth_tag_to_report from auth_types where authtypecode=?");
my ($tag_to_report) = $sth->fetchrow;
$mainentrytag = $tag_to_report;
# NOTE(review): this loop stops at "<" $#{$tags} while the quoting loop below
# uses "<=", so the last tag is never tested for "mainentry" -- confirm.
for (my $i=0;$i<$#{$tags};$i++) {
if (@$tags[$i] eq "mainentry") {
@$tags[$i] = $tag_to_report."a";
# "Normal" statements
# quote marc fields/subfields
for (my $i=0;$i<=$#{$tags};$i++) {
if (@$tags[$i]) {
@$tags[$i] = $dbh->quote(@$tags[$i]);
# Parallel lists handed to create_request once the "contains" values have been
# split into single words.
my @normal_tags = ();
my @normal_and_or = ();
my @normal_operator = ();
my @normal_value = ();
# Extracts the NOT statements from the list of statements
for(my $i = 0 ; $i <= $#{$value} ; $i++)
# replace * by %
@$value[$i] =~ s/\*/%/g;
# remove % at the beginning
@$value[$i] =~ s/^%//g;
# for "contains" searches, punctuation is turned into spaces before splitting
@$value[$i] =~ s/(\.|\?|\:|\!|\'|,|\-|\"|\(|\)|\[|\]|\{|\}|\/)/ /g if @$operator[$i] eq "contains";
if(@$operator[$i] eq "contains") # if operator is contains, splits the words in separate requests
foreach my $word (split(/ /, @$value[$i]))
unless (C4::Context->stopwords->{uc($word)}) { #it's NOT a stopword => use it. Otherwise, ignore
# NOTE(review): $tag and $subf are computed but not used in the visible lines.
my $tag = substr(@$tags[$i],0,3);
my $subf = substr(@$tags[$i],3,1);
push @normal_tags, @$tags[$i];
push @normal_and_or, "and"; # assumes "foo" and "bar" if "foo bar" is entered
push @normal_operator, @$operator[$i];
push @normal_value, $word;
# NOTE(review): the four pushes below presumably belong to an "else" branch
# (operator other than "contains") that is not visible here -- confirm.
push @normal_tags, @$tags[$i];
push @normal_and_or, @$and_or[$i];
push @normal_operator, @$operator[$i];
push @normal_value, @$value[$i];
# Finds the basic results without the NOT requests
my ($sql_tables, $sql_where1, $sql_where2) = create_request($dbh,\@normal_tags, \@normal_and_or, \@normal_operator, \@normal_value);
my $sth;
# $sql_where2 holds the authid joins between table aliases; it is empty when
# create_request added none.
if ($sql_where2) {
$sth = $dbh->prepare("select distinct m1.authid from auth_header,$sql_tables where m1.authid=auth_header.authid and auth_header.authtypecode=? and $sql_where2 and ($sql_where1)");
warn "Q2 : select distinct m1.authid from auth_header,$sql_tables where m1.authid=auth_header.authid and auth_header.authtypecode=? and $sql_where2 and ($sql_where1)";
} else {
$sth = $dbh->prepare("select distinct m1.authid from auth_header,$sql_tables where m1.authid=auth_header.authid and auth_header.authtypecode=? and $sql_where1");
warn "Q : select distinct m1.authid from auth_header,$sql_tables where m1.authid=auth_header.authid and auth_header.authtypecode=? and $sql_where1";
# NOTE(review): the query has one "?" placeholder (authtypecode) but no
# execute() is visible before the fetch loop -- confirm.
my @result = ();
while (my ($authid) = $sth->fetchrow) {
push @result,$authid;
# we have authid list. Now, loads summary from [offset] to [offset]+[length]
my $counter = $offset;
my @finalresult = ();
my $oldline;
# NOTE(review): "<=" against $offset + $length admits up to $length + 1 rows,
# and no increment of $counter is visible -- confirm.
while (($counter <= $#result) && ($counter <= ($offset + $length))) {
# warn " HERE : $counter, $#result, $offset, $length";
# get MARC::Record of the authority
my $record = AUTHgetauthority($dbh,$result[$counter]);
# then build the summary
# NOTE(review): this "my" reuses the name of the $authtypecode parameter.
my $authtypecode = AUTHfind_authtypecode($dbh,$result[$counter]);
my $authref = getauthtype($authtypecode);
my $summary = $authref->{summary};
my @fields = $record->fields();
foreach my $field (@fields) {
my $tag = $field->tag();
# tags below 10 get no treatment in the visible code (empty branch)
if ($tag<10) {
} else {
my @subf = $field->subfields;
for my $i (0..$#subf) {
my $subfieldcode = $subf[$i][0];
my $subfieldvalue = $subf[$i][1];
my $tagsubf = $tag.$subfieldcode;
# Insert the value in front of the matching [prefix TAGSUBFIELD suffix]
# placeholder; the placeholder itself is written back so that another
# occurrence of the same subfield can match it again.
$summary =~ s/\[(.?.?.?.?)$tagsubf(.*?)]/$1$subfieldvalue\[$1$tagsubf$2]$2/g;
# drop every bracketed placeholder that is still in the summary
$summary =~ s/\[(.*?)]//g;
$summary =~ s/\n/<br>/g;
# find biblio MARC field using this authtypecode (to jump to biblio)
my $authtypecode = AUTHfind_authtypecode($dbh,$result[$counter]);
# NOTE(review): no execute() is visible for this statement either -- confirm.
my $sth = $dbh->prepare("select distinct tagfield from marc_subfield_structure where authtypecode=?");
my $tags_using_authtype;
while (my ($tagfield) = $sth->fetchrow) {
# warn "TAG : $tagfield";
$tags_using_authtype.= $tagfield."9,";
# remove the trailing ","
chop $tags_using_authtype;
# then add a line for the template loop
my %newline;
$newline{summary} = $summary;
$newline{authid} = $result[$counter];
$newline{used} = &AUTHcount_usage($result[$counter]);
$newline{biblio_fields} = $tags_using_authtype;
$newline{even} = $counter % 2;
# main entry = subfields a and b of the main entry tag, when the record has it
$newline{mainentry} = $record->field($mainentrytag)->subfield('a')." ".$record->field($mainentrytag)->subfield('b') if $record->field($mainentrytag);
push @finalresult, \%newline;
my $nbresults = $#result + 1;
return (\@finalresult, $nbresults);
# Creates the SQL Request
# create_request($dbh, $tags, $and_or, $operator, $value)
# Builds the pieces of the authority search SQL from four parallel array
# references and returns ($sql_tables, $sql_where1, $sql_where2):
#   - $sql_tables : comma separated table list with aliases m1, m2, ...
#   - $sql_where1 : the conditions on values and tags
#   - $sql_where2 : the "m1.authid=mN.authid" joins in parentheses, or "" when
#                   none was added
# Values go through $dbh->quote. Tags are interpolated as they are received
# (authoritysearch quotes them before calling).
# NOTE(review): in the default branches @$operator[$i] is interpolated into the
# SQL without quoting or validation -- confirm that callers only pass trusted
# operators.
# NOTE(review): closing braces/parentheses and the increments of $nb_active and
# $nb_table are not visible in this copy -- confirm against the repository version.
sub create_request {
my ($dbh,$tags, $and_or, $operator, $value) = @_;
my $sql_tables; # will contain marc_subfield_table as m1,...
my $sql_where1; # will contain the "true" where
my $sql_where2 = "("; # will contain m1.authid=m2.authid
my $nb_active=0; # will contain the number of "active" entries. and entry is active is a value is provided.
my $nb_table=1; # will contain the number of table. ++ on each entry EXCEPT when an OR is provided.
# NOTE(review): "<=" against the element count visits one index past the end;
# the truth test on the value below skips that undefined slot.
for(my $i=0; $i<=@$value;$i++) {
if (@$value[$i]) {
# warn " @$tags[$i]";
# first active entry: always uses alias m1 and takes no and/or prefix
if ($nb_active==1) {
if (@$operator[$i] eq "start") {
$sql_tables .= "auth_subfield_table as m$nb_table,";
$sql_where1 .= "(m1.subfieldvalue like ".$dbh->quote("@$value[$i]%");
if (@$tags[$i]) {
# NOTE(review): "tag+subfieldcode" is written with "+" here, whereas
# AUTHcount_usage uses concat(tag,subfieldcode) -- confirm which is intended.
$sql_where1 .=" and m1.tag+m1.subfieldcode in (@$tags[$i])";
} elsif (@$operator[$i] eq "contains") {
# word searches go against auth_word instead of auth_subfield_table
$sql_tables .= "auth_word as m$nb_table,";
$sql_where1 .= "(m1.word like ".$dbh->quote("@$value[$i]%");
if (@$tags[$i]) {
$sql_where1 .=" and m1.tagsubfield in (@$tags[$i])";
} else {
$sql_tables .= "auth_subfield_table as m$nb_table,";
$sql_where1 .= "(m1.subfieldvalue @$operator[$i] ".$dbh->quote("@$value[$i]");
if (@$tags[$i]) {
$sql_where1 .=" and m1.tag+m1.subfieldcode in (@$tags[$i])";
# following entries: prefixed with their and/or keyword and joined to m1 on authid
} else {
if (@$operator[$i] eq "start") {
$sql_tables .= "auth_subfield_table as m$nb_table,";
$sql_where1 .= "@$and_or[$i] (m$nb_table.subfieldvalue like ".$dbh->quote("@$value[$i]%");
if (@$tags[$i]) {
$sql_where1 .=" and m$nb_table.tag+m$nb_table.subfieldcode in (@$tags[$i])";
$sql_where2 .= "m1.authid=m$nb_table.authid and ";
} elsif (@$operator[$i] eq "contains") {
if (@$and_or[$i] eq 'and') {
$sql_tables .= "auth_word as m$nb_table,";
$sql_where1 .= "@$and_or[$i] (m$nb_table.word like ".$dbh->quote("@$value[$i]%");
if (@$tags[$i]) {
$sql_where1 .=" and m$nb_table.tagsubfield in(@$tags[$i])";
$sql_where2 .= "m1.authid=m$nb_table.authid and ";
# and_or other than 'and': no table is appended to $sql_tables in this branch
} else {
$sql_where1 .= "@$and_or[$i] (m$nb_table.word like ".$dbh->quote("@$value[$i]%");
if (@$tags[$i]) {
# NOTE(review): this branch filters on tag+subfieldid, while the other
# auth_word branches filter on tagsubfield -- confirm.
$sql_where1 .=" and m$nb_table.tag+m$nb_table.subfieldid in (@$tags[$i])";
$sql_where2 .= "m1.authid=m$nb_table.authid and ";
} else {
$sql_tables .= "auth_subfield_table as m$nb_table,";
$sql_where1 .= "@$and_or[$i] (m$nb_table.subfieldvalue @$operator[$i] ".$dbh->quote(@$value[$i]);
if (@$tags[$i]) {
$sql_where1 .=" and m$nb_table.tag+m$nb_table.subfieldcode in (@$tags[$i])";
$sql_where2 .= "m1.authid=m$nb_table.authid and ";
if($sql_where2 ne "(") # some datas added to sql_where2, processing
$sql_where2 = substr($sql_where2, 0, (length($sql_where2)-5)); # deletes the trailing ' and '
$sql_where2 .= ")";
else # no sql_where2 statement, deleting '('
$sql_where2 = "";
chop $sql_tables; # deletes the trailing ','
return ($sql_tables, $sql_where1, $sql_where2);
# AUTHcount_usage($authid)
# Returns the number of rows of marc_subfield_table whose subfieldvalue is
# $authid. When the authority type of $authid is linked to MARC tags in
# marc_subfield_structure, only the subfield "9" of those tags is counted;
# otherwise every subfield is considered.
# Both statements are now executed before being fetched, and the tag list is
# passed through placeholders instead of being concatenated into the SQL.
sub AUTHcount_usage {
    my ($authid) = @_;
    my $dbh = C4::Context->dbh;

    # find MARC fields using this authtype
    my $authtypecode = AUTHfind_authtypecode($dbh, $authid);
    my $sth = $dbh->prepare("select distinct tagfield from marc_subfield_structure where authtypecode=?");
    $sth->execute($authtypecode);
    my @tagsubfields;
    while (my ($tagfield) = $sth->fetchrow) {
        # the link to an authority is stored in subfield 9 of the tag
        push @tagsubfields, $tagfield . "9";
    }

    my $query = "select count(*) from marc_subfield_table where ";
    if (@tagsubfields) {
        my $placeholders = join ',', ('?') x @tagsubfields;
        $query .= "concat(tag,subfieldcode) in ($placeholders) and ";
    }
    $query .= "subfieldvalue=?";

    $sth = $dbh->prepare($query);
    $sth->execute(@tagsubfields, $authid);
    my ($result) = $sth->fetchrow;
    return $result;
}
# merging 2 authority entries. After a merge, the "from" can be deleted.
# sub AUTHmerge {
# my ($auth_merge_from,$auth_merge_to) = @_;
# my $dbh = C4::Context->dbh;
# # find MARC fields using this authtype
# my $authtypecode = AUTHfind_authtypecode($dbh,$authid);
# # retrieve records
# my $record_from = AUTHgetauthority($dbh,$auth_merge_from);
# my $record_to = AUTHgetauthority($dbh,$auth_merge_to);
# my $sth = $dbh->prepare("select distinct tagfield from marc_subfield_structure where authtypecode=?");
# $sth->execute($authtypecode);
# my $tags_using_authtype;
# while (my ($tagfield) = $sth->fetchrow) {
# warn "TAG : $tagfield";
# $tags_using_authtype.= "'".$tagfield."9',";
# }
# chop $tags_using_authtype;
# # now, find every biblio using this authority
# $sth = $dbh->prepare("select bibid,tag,tag_indicator,tagorder from marc_subfield_table where tag+subfieldid in ($tags_using_authtype) and subfieldvalue=?");
# $sth->execute($authid);
# # and delete entries before recreating them
# while (my ($bibid,$tag,$tag_indicator,$tagorder) = $sth->fetchrow) {
# &MARCdelsubfield($dbh,$bibid,$tag);
# }
# }
# AUTHfind_authtypecode($dbh, $authid)
# Returns the authtypecode stored in auth_header for authority $authid, or
# undef when no row matches.
sub AUTHfind_authtypecode {
    my ($dbh, $authid) = @_;
    my $sth = $dbh->prepare("select authtypecode from auth_header where authid=?");
    # the statement has to be executed with its bind value before it is fetched
    $sth->execute($authid);
    my ($authtypecode) = $sth->fetchrow;
    return $authtypecode;
}
# AUTHgettagslib($dbh, $forlibrarian, $authtypecode)
# Reads the tag and subfield structure of an authority type from
# auth_tag_structure and auth_subfield_structure and returns the hash
# reference $res.
#   $forlibrarian : when equal to 1 the "liblibrarian" column is used as label,
#                   otherwise "libopac"
#   $authtypecode : authority type; replaced by "" when it is false or when
#                   auth_tag_structure holds no row for it
# NOTE(review): the bodies of both fetch loops and every execute() call are not
# visible in this copy, so the exact layout of $res cannot be described from
# here -- confirm against the repository version.
sub AUTHgettagslib {
my ($dbh,$forlibrarian,$authtypecode)= @_;
$authtypecode="" unless $authtypecode;
my $sth;
# $libfield is interpolated into the SQL below; it can only be one of these two literals
my $libfield = ($forlibrarian eq 1)? 'liblibrarian' : 'libopac';
# check that framework exists
$sth=$dbh->prepare("select count(*) from auth_tag_structure where authtypecode=?");
my ($total) = $sth->fetchrow;
# fall back to the "" authtypecode when the requested one has no tag structure
$authtypecode="" unless ($total >0);
$sth=$dbh->prepare("select tagfield,$libfield as lib,mandatory,repeatable from auth_tag_structure where authtypecode=? order by tagfield");
my ($lib,$tag,$res,$tab,$mandatory,$repeatable);
while ( ($tag,$lib,$mandatory,$repeatable) = $sth->fetchrow) {
# NOTE(review): $tab has not been assigned at this point in the visible code,
# so the key used here is the empty string -- confirm.
$res->{$tab}->{tab}=""; # XXX
$sth=$dbh->prepare("select tagfield,tagsubfield,$libfield as lib,tab, mandatory, repeatable,authorised_value,value_builder,seealso from auth_subfield_structure where authtypecode=? order by tagfield,tagsubfield");
my $subfield;
my $authorised_value;
# NOTE(review): $thesaurus_category, $kohafield, $hidden and $isurl are
# declared but not used in the visible lines.
my $thesaurus_category;
my $value_builder;
my $kohafield;
my $seealso;
my $hidden;
my $isurl;
while ( ($tag, $subfield, $lib, $tab, $mandatory, $repeatable,$authorised_value,$value_builder,$seealso) = $sth->fetchrow) {
return $res;
# AUTHaddauthority($dbh, $record, $authid, $authtypecode)
# Stores the MARC::Record $record in the authority tables and returns $authid.
# When $authid is false a new auth_header row is prepared for $authtypecode;
# when it is given, the record is re-added under that id (used after a delete,
# i.e. for a modification).
# NOTE(review): the execute() calls, the assignment of the new authid and the
# statements inside the field/subfield loops are not visible in this copy --
# confirm against the repository version.
sub AUTHaddauthority {
# pass the MARC::Record to this function, and it will create the records in the marc tables
my ($dbh,$record,$authid,$authtypecode) = @_;
my @fields=$record->fields();
# warn "IN AUTHaddauthority $authid => ".$record->as_formatted;
# adding main table, and retrieving authid
# if authid is sent, then it's not a true add, it's only a re-add, after a delete (ie, a mod)
# if authid empty => true add, find a new authid number
unless ($authid) {
# the tables are locked while the new id is allocated; they are released by
# the "unlock tables" statement further down
$dbh->do("lock tables auth_header WRITE,auth_subfield_table WRITE, auth_word WRITE, stopwords READ");
my $sth=$dbh->prepare("insert into auth_header (datecreated,authtypecode) values (now(),?)");
# NOTE(review): the handle is reassigned here without a visible execute() of
# the insert, and the max(authid) is never fetched into $authid in the visible
# lines -- confirm.
$sth=$dbh->prepare("select max(authid) from auth_header");
# NOTE(review): $fieldcount is initialised but never incremented in the visible lines.
my $fieldcount=0;
# now, add subfields...
foreach my $field (@fields) {
# tags below 10 and tags from 10 upwards are handled by separate branches
if ($field->tag() <10) {
} else {
my @subfields=$field->subfields();
foreach my $subfieldcount (0..$#subfields) {
$dbh->do("unlock tables");
return $authid;
# AUTHaddsubfield($dbh, $authid, $tagid, $tag_indicator, $tagorder, $subfieldcode, $subfieldorder, $subfieldvalues)
# Adds a subfield to a tag in auth_subfield_table.
# $subfieldvalues may hold several values separated by "|"; one row is inserted
# per value. Nothing is done when $subfieldvalues is undefined or empty.
# A missing subfield code is stored as a single space. The code "0" is a valid
# value and is kept as it is (a plain truth test would have replaced it with a
# space).
# Insert errors are reported with warn and do not stop the loop.
sub AUTHaddsubfield {
    my ($dbh,$authid,$tagid,$tag_indicator,$tagorder,$subfieldcode,$subfieldorder,$subfieldvalues) = @_;

    # if not value, end of job, we do nothing
    return unless defined $subfieldvalues && length $subfieldvalues;

    $subfieldcode = ' ' unless defined $subfieldcode && length $subfieldcode;

    # tags are stored on 3 characters, left padded with zeros
    my $tag = sprintf "%03s", $tagid;

    # prepared once, executed for each value
    my $sth = $dbh->prepare("insert into auth_subfield_table (authid,tag,tagorder,tag_indicator,subfieldcode,subfieldorder,subfieldvalue) values (?,?,?,?,?,?,?)");
    foreach my $subfieldvalue (split /\|/, $subfieldvalues) {
        $sth->execute($authid,$tag,$tagorder,$tag_indicator,$subfieldcode,$subfieldorder,$subfieldvalue);
        if ($sth->errstr) {
            warn "ERROR ==> insert into auth_subfield_table (authid,tag,tagorder,tag_indicator,subfieldcode,subfieldorder,subfieldvalue) values ($authid,$tagid,$tagorder,$tag_indicator,$subfieldcode,$subfieldorder,$subfieldvalue)\n";
        }
    }
    return;
}
# AUTHgetauthority($dbh, $authid)
# Returns the MARC::Record of the authority $authid, rebuilt from the rows of
# auth_subfield_table. An empty record is returned when no row is found.
#
# Rows are read ordered by tag, tagorder and subfieldcode. A new field starts
# each time the tag or the tagorder changes:
#   - tags below 10 are added as (tag, value) pairs
#   - other tags are built as MARC::Field objects, their subfields being added
#     while the tag/tagorder stays the same
# The field being built is added to the record when the next one starts, and
# once more after the loop for the last one.
sub AUTHgetauthority {
    my ($dbh, $authid) = @_;
    my $record = MARC::Record->new();
    #---- TODO : the leader is missing
    # a MARC leader is 24 characters long: use a blank one
    $record->leader(' ' x 24);

    my $sth = $dbh->prepare("select authid,subfieldid,tag,tagorder,tag_indicator,subfieldcode,subfieldorder,subfieldvalue
        from auth_subfield_table
        where authid=? order by tag,tagorder,subfieldcode");
    $sth->execute($authid);

    my $prevtag;        # tag of the field being built, undef before the 1st row
    my $prevtagorder;   # tagorder of the field being built
    my $field;          # pending MARC::Field, for >=10 tags
    my $prevvalue;      # pending value, for <10 tags

    # adds the pending field (if any) to the record
    my $flush = sub {
        return unless defined $prevtag;
        if ($prevtag < 10) {
            $record->add_fields((sprintf "%03s", $prevtag), $prevvalue);
        }
        elsif ($field) {
            $record->add_fields($field);
        }
        undef $field;
        undef $prevvalue;
    };

    while (my $row = $sth->fetchrow_hashref) {
        my $tag = $row->{tag};
        if (!defined $prevtag || $row->{tagorder} ne $prevtagorder || $tag ne $prevtag) {
            # a new field begins: store the previous one, then start this one
            $flush->();
            $prevtag      = $tag;
            $prevtagorder = $row->{tagorder};
            if ($tag < 10) {
                $prevvalue = $row->{subfieldvalue};
            }
            else {
                # pad so that both indicators are always one character long
                my $indicators = (defined $row->{tag_indicator} ? $row->{tag_indicator} : '') . '  ';
                $field = MARC::Field->new(
                    (sprintf "%03s", $tag),
                    substr($indicators, 0, 1),
                    substr($indicators, 1, 1),
                    $row->{subfieldcode}, $row->{subfieldvalue}
                );
            }
        }
        else {
            if ($tag < 10) {
                $record->add_fields((sprintf "%03s", $tag), $row->{subfieldvalue});
            }
            else {
                $field->add_subfields($row->{subfieldcode}, $row->{subfieldvalue});
            }
        }
    }

    # the last has not been included inside the loop... do it now !
    # (nothing is added when no row was found, so an empty record is returned)
    $flush->();
    return $record;
}
# AUTHgetauth_type($authtypecode)
# Returns the auth_types row of $authtypecode as a hash reference (column name
# => value), or undef when the authority type does not exist.
sub AUTHgetauth_type {
    my ($authtypecode) = @_;
    my $dbh = C4::Context->dbh;
    my $sth = $dbh->prepare("select * from auth_types where authtypecode=?");
    # the statement has to be executed with its bind value before it is fetched
    $sth->execute($authtypecode);
    return $sth->fetchrow_hashref;
}
# AUTHmodauthority($dbh, $authid, $record, $delete)
# Replaces the stored authority $authid by the MARC::Record $record.
# The modification is done by deleting the subfields and words of the authority
# (its auth_header row is kept) and adding the new record under the same id.
# The authid is then written to localfile/modified_authorities/$authid.authid.
# A failure to write that file is reported with warn and does not abort the
# modification.
# NOTE(review): $delete is accepted but not used.
sub AUTHmodauthority {
    my ($dbh,$authid,$record,$delete)=@_;
    my $oldrecord = AUTHgetauthority($dbh,$authid);
    # NOTE(review): "eq" compares the two references, so this only detects the
    # very same object being passed back, not two records with equal content.
    # Returning here is presumably the intended "nothing to do" case -- confirm.
    return if $oldrecord eq $record;

    # the type has to be read before the authority is rewritten
    my $authtypecode = AUTHfind_authtypecode($dbh,$authid);
    # 1st delete the authority,
    AUTHdelauthority($dbh,$authid,1);
    # 2nd recreate it
    AUTHaddauthority($dbh,$record,$authid,$authtypecode);

    # save the file in localfile/modified_authorities
    my $cgidir = C4::Context->intranetdir ."/cgi-bin";
    if (opendir(my $dirhandle, $cgidir)) {
        # the directory was only opened to check that it exists
        closedir $dirhandle;
    }
    else {
        $cgidir = C4::Context->intranetdir."/";
    }
    my $filename = $cgidir."/localfile/modified_authorities/$authid.authid";
    if (open(my $authfile, '>', $filename)) {
        print {$authfile} $authid;
        close $authfile or warn "AUTHmodauthority: cannot close $filename: $!";
    }
    else {
        warn "AUTHmodauthority: cannot write $filename: $!";
    }
    return;
}
# AUTHdelauthority($dbh, $authid, $keep_biblio)
# Deletes the authority $authid from auth_subfield_table and auth_word, and
# from auth_header as well unless $keep_biblio is true.
# Returns the result of the last delete.
#
# if the keep_biblio is set to 1, then authority entries in biblio are preserved.
# This flag is set when the delauthority is called by modauthority
# due to a too complex structure of MARC (repeatable fields and subfields),
# the best solution for a modif is to delete / recreate the record.
sub AUTHdelauthority {
    my ($dbh,$authid,$keep_biblio) = @_;
    # $authid is passed as a bind value: it is never interpolated into the SQL
    $dbh->do("delete from auth_header where authid=?", undef, $authid) unless $keep_biblio;
    $dbh->do("delete from auth_subfield_table where authid=?", undef, $authid);
    # FIXME : delete or not in biblio tables (depending on $keep_biblio flag)
    return $dbh->do("delete from auth_word where authid=?", undef, $authid);
}
# AUTHmodsubfield($dbh, $subfieldid, $subfieldvalue)
# Subroutine changes a subfield value given a subfieldid, then rebuilds the
# auth_word entries of that subfield (delete, then add).
# Returns ($subfieldid, $subfieldvalue).
# NOTE(review): the word refresh is reconstructed from the row that is selected
# after the update and from the "delete then add" convention described on
# AUTHdelword -- confirm that this is the intended behaviour.
sub AUTHmodsubfield {
    my ($dbh, $subfieldid, $subfieldvalue )=@_;
    $dbh->do("lock tables auth_subfield_table WRITE");
    my $sth=$dbh->prepare("update auth_subfield_table set subfieldvalue=? where subfieldid=?");
    $sth->execute($subfieldvalue, $subfieldid);
    $dbh->do("unlock tables");

    # locate the subfield that has just been modified
    $sth=$dbh->prepare("select authid,tag,tagorder,subfieldcode,subfieldid,subfieldorder from auth_subfield_table where subfieldid=?");
    $sth->execute($subfieldid);
    my ($authid,$tagid,$tagorder,$subfieldcode,$x,$subfieldorder) = $sth->fetchrow;

    # nothing to index when the subfieldid does not exist
    if (defined $authid) {
        AUTHdelword($dbh,$authid,$tagid,$tagorder,$subfieldcode,$subfieldorder);
        AUTHaddword($dbh,$authid,$tagid,$tagorder,$subfieldcode,$subfieldorder,$subfieldvalue);
    }
    return($subfieldid, $subfieldvalue);
}
# AUTHfindsubfield($dbh, $authid, $tag, $subfieldcode, $subfieldorder, $subfieldvalue)
# Looks for the subfieldid of a subfield of authority $authid.
# The subfield is identified by its tag and code, plus:
#   - its value, when $subfieldvalue is true
#   - otherwise its order
# Returns the subfieldid, undef when nothing matches, or -1 when several rows
# match (the values given did not resolve into a unique record).
sub AUTHfindsubfield {
    my ($dbh,$authid,$tag,$subfieldcode,$subfieldorder,$subfieldvalue) = @_;
    my $query = "select subfieldid from auth_subfield_table where authid=? and tag=? and subfieldcode=?";
    my @bind_values = ($authid, $tag, $subfieldcode);
    if ($subfieldvalue) {
        $query .= " and subfieldvalue=?";
        push @bind_values, $subfieldvalue;
    }
    else {
        # NOTE(review): an order below 1 (or none) is taken to mean the first
        # subfield -- confirm.
        $subfieldorder = 1 if !defined $subfieldorder || $subfieldorder < 1;
        $query .= " and subfieldorder=?";
        push @bind_values, $subfieldorder;
    }

    my $sti = $dbh->prepare($query);
    $sti->execute(@bind_values);
    my $resultcounter = 0;
    my $lastsubfieldid;
    while (my ($subfieldid) = $sti->fetchrow) {
        $resultcounter++;
        $lastsubfieldid = $subfieldid;
    }

    # Error condition. Values given did not resolve into a unique record. Don't know what to edit
    # should rarely occur (only if we use subfieldvalue with a value that exists twice, which is strange)
    return -1 if $resultcounter > 1;
    return $lastsubfieldid;
}
# AUTHfindsubfieldid($dbh, $authid, $tag, $tagorder, $subfield, $subfieldorder)
# Returns the subfieldid of the subfield identified by authid / tag / tagorder /
# subfield code / subfieldorder.
# When that exact search gives nothing, a second search ignoring subfieldorder
# is done and its first row is returned. undef is returned when both fail.
sub AUTHfindsubfieldid {
    my ($dbh,$authid,$tag,$tagorder,$subfield,$subfieldorder) = @_;
    my $sth = $dbh->prepare("select subfieldid from auth_subfield_table
        where authid=? and tag=? and tagorder=?
        and subfieldcode=? and subfieldorder=?");
    $sth->execute($authid,$tag,$tagorder,$subfield,$subfieldorder);
    my ($res) = $sth->fetchrow;
    unless ($res) {
        # nothing found with the order: retry without it
        $sth = $dbh->prepare("select subfieldid from auth_subfield_table
            where authid=? and tag=? and tagorder=?
            and subfieldcode=?");
        $sth->execute($authid,$tag,$tagorder,$subfield);
        ($res) = $sth->fetchrow;
    }
    return $res;
}
# AUTHfind_authtypecode($dbh, $authid)
# Returns the authtypecode stored in auth_header for authority $authid, or
# undef when no row matches.
# NOTE(review): a sub with this name is already defined earlier in this file;
# this later definition is the one Perl keeps. One of the two should be removed.
sub AUTHfind_authtypecode {
    my ($dbh, $authid) = @_;
    my $sth = $dbh->prepare("select authtypecode from auth_header where authid=?");
    # the statement has to be executed with its bind value before it is fetched
    $sth->execute($authid);
    my ($authtypecode) = $sth->fetchrow;
    return $authtypecode;
}
# AUTHdelsubfield($dbh, $authid, $tag, $tagorder, $subfield, $subfieldorder)
# delete a subfield for $authid / tag / tagorder / subfield / subfieldorder
# The five criteria are passed as bind values: they are never interpolated into
# the SQL. Returns the result of the delete.
sub AUTHdelsubfield {
    my ($dbh,$authid,$tag,$tagorder,$subfield,$subfieldorder) = @_;
    return $dbh->do(
        "delete from auth_subfield_table where authid=? and
        tag=? and tagorder=?
        and subfieldcode=? and subfieldorder=?",
        undef,
        $authid, $tag, $tagorder, $subfield, $subfieldorder
    );
}
# AUTHhtml2marc($dbh, $rtags, $rsubfields, $rvalues, %indicators)
# Builds and returns a MARC::Record from the parallel lists sent by the html
# form:
#   $rtags      : array ref of tags
#   $rsubfields : array ref of subfield codes
#   $rvalues    : array ref of values
#   %indicators : tag => string holding the 2 indicators of the tag
# Consecutive entries with the same tag belong to the same field:
#   - tags below 10 are added as (tag, value) when the value is true
#   - other tags are built as MARC::Field objects; a subfield is added to the
#     current field only when its value is not empty
# The field being built is added to the record when the tag changes and once
# more after the loop, for tags below 10 as well as for the others.
# NOTE(review): $dbh is accepted but not used.
sub AUTHhtml2marc {
    my ($dbh,$rtags,$rsubfields,$rvalues,%indicators) = @_;
    my $prevtag = -1;
    my $record = MARC::Record->new();
    my $prevvalue; # if tag <10
    my $field; # if tag >=10

    for my $i (0 .. $#{$rtags}) {
        my $tag   = $rtags->[$i];
        my $value = $rvalues->[$i];
        # rebuild MARC::Record
        if ($tag ne $prevtag) {
            # the tag changes: store what was pending for the previous tag
            if ($prevtag < 10) {
                $record->add_fields((sprintf "%03s",$prevtag),$prevvalue) if $prevvalue;
            }
            elsif ($field) {
                $record->add_fields($field);
            }

            if ($tag < 10) {
                $prevvalue = $value;
                undef $field;
            }
            else {
                undef $prevvalue;
                # pad so that both indicators are always one character long
                my $tag_indicators = (defined $indicators{$tag} ? $indicators{$tag} : '') . '  ';
                $field = MARC::Field->new(
                    (sprintf "%03s",$tag),
                    substr($tag_indicators,0,1),
                    substr($tag_indicators,1,1),
                    $rsubfields->[$i] => $value
                );
            }
            $prevtag = $tag;
        }
        elsif ($tag >= 10) {
            # same tag: one more subfield for the current field
            # NOTE(review): nothing is done for a repeated tag below 10 -- confirm.
            if (defined $value && length($value) > 0) {
                $field->add_subfields($rsubfields->[$i] => $value);
            }
        }
    }

    # the last has not been included inside the loop... do it now !
    if ($field) {
        $record->add_fields($field);
    }
    elsif ($prevvalue) {
        # the list ended on a tag below 10
        $record->add_fields((sprintf "%03s",$prevtag),$prevvalue);
    }
    return $record;
}
# AUTHaddword($dbh, $authid, $tag, $tagorder, $subfieldid, $subfieldorder, $sentence)
# split a subfield string and adds it into the word table.
# removes stopwords
# Punctuation is replaced by spaces, then one auth_word row is inserted for
# each word longer than 2 characters that is not a key of
# C4::Context->stopwords (compared in upper case). The column tagsubfield
# receives $tag and $subfieldid concatenated.
# Nothing is done when $sentence is undefined. Insert errors are reported with
# warn and do not stop the loop.
sub AUTHaddword {
    my ($dbh,$authid,$tag,$tagorder,$subfieldid,$subfieldorder,$sentence) =@_;
    return unless defined $sentence;

    $sentence =~ s/[.?:!',\-"()\[\]{}]/ /g;
    my $stopwords = C4::Context->stopwords;
    my $sth = $dbh->prepare("insert into auth_word (authid, tagsubfield, tagorder, subfieldorder, word, sndx_word)
        values (?,concat(?,?),?,?,?,soundex(?))");
    foreach my $word (split / /, $sentence) {
        # we record only words longer than 2 car and not in stopwords hash
        next unless length($word) > 2 and !($stopwords->{uc($word)});
        # $word is bound twice: once as the word, once for its soundex
        $sth->execute($authid,$tag,$subfieldid,$tagorder,$subfieldorder,$word,$word);
        if ($sth->err()) {
            warn "ERROR ==> insert into auth_word (authid, tagsubfield, tagorder, subfieldorder, word, sndx_word) values ($authid,concat($tag,$subfieldid),$tagorder,$subfieldorder,$word,soundex($word))\n";
        }
    }
    return;
}
# AUTHdelword($dbh, $authid, $tag, $tagorder, $subfield, $subfieldorder)
# delete words. this sub deletes all the words from a sentence. a subfield modif is done by a delete then a add
# The rows removed from auth_word are those of authority $authid whose
# tagsubfield is $tag and $subfield concatenated, with the given tagorder and
# subfieldorder. Returns the result of the delete.
sub AUTHdelword {
    my ($dbh,$authid,$tag,$tagorder,$subfield,$subfieldorder) = @_;
    my $sth = $dbh->prepare("delete from auth_word where authid=? and tagsubfield=concat(?,?) and tagorder=? and subfieldorder=?");
    # bind values follow the order of the placeholders, not the order of @_
    return $sth->execute($authid,$tag,$subfield,$tagorder,$subfieldorder);
}
# char_decode($string, $encoding)
# converts ISO 5426 coded string to ISO 8859-1
# $encoding selects the source table: "UNIMARC", or "USMARC" / "MARC21".
# With any other (or no) encoding, $string is returned unchanged.
#
# A diacritic byte followed by a base letter is replaced by the single
# ISO 8859-1 accented letter, and (UNIMARC only) 8 special letters are mapped
# to their ISO 8859-1 byte. Non-sorting blocks are then handled by nsb_clean.
# For USMARC / MARC21 nothing at all is done (nsb_clean included) unless the
# string holds a byte in the range \xc1-\xff.
#
# All the replacements are made in a single pass, so that a byte produced by
# one replacement can never be taken for the diacritic of another one.
# The caller's $_ is left untouched.
#
# NOTE(review): the replacement characters were unreadable in the previous
# version of this sub; the tables below are rebuilt from the source bytes that
# were still readable and from the ISO 5426 / ISO 8859-1 code charts -- confirm
# them, in particular:
#   - \xe2 and \xf3 (UNIMARC), mapped to Eth / eth
#   - the diaeresis row, whose 5th source letter is \x76 ("v"), mapped to \xff
#   - the \xe9 row of USMARC / MARC21, mapped like the \xc9 row of UNIMARC
sub char_decode {
    my ($string,$encoding) = @_ ;
    return $string unless defined $string && defined $encoding;

    # ISO 8859-1 byte of each (diacritic, base letter) pair handled
    my %latin1_for = (
        grave      => { A => "\xc0", E => "\xc8", I => "\xcc", O => "\xd2", U => "\xd9",
                        a => "\xe0", e => "\xe8", i => "\xec", o => "\xf2", u => "\xf9" },
        acute      => { A => "\xc1", E => "\xc9", I => "\xcd", O => "\xd3", U => "\xda", Y => "\xdd",
                        a => "\xe1", e => "\xe9", i => "\xed", o => "\xf3", u => "\xfa", y => "\xfd" },
        circumflex => { A => "\xc2", E => "\xca", I => "\xce", O => "\xd4", U => "\xdb",
                        a => "\xe2", e => "\xea", i => "\xee", o => "\xf4", u => "\xfb" },
        tilde      => { A => "\xc3", N => "\xd1", O => "\xd5",
                        a => "\xe3", n => "\xf1", o => "\xf5" },
        diaeresis  => { E => "\xcb", I => "\xcf", e => "\xeb", i => "\xef", v => "\xff" },
        umlaut     => { A => "\xc4", O => "\xd6", U => "\xdc",
                        a => "\xe4", o => "\xf6", u => "\xfc" },
        ring       => { A => "\xc5", a => "\xe5" },
        cedilla    => { C => "\xc7", c => "\xe7" },
    );

    my %diacritic_byte;   # diacritic name => byte announcing it in the source
    my %replacement_for;  # source byte(s)  => ISO 8859-1 byte
    if ($encoding eq "UNIMARC") {
        %diacritic_byte = (
            grave     => "\xc1", acute  => "\xc2", circumflex => "\xc3", tilde   => "\xc4",
            diaeresis => "\xc8", umlaut => "\xc9", ring       => "\xca", cedilla => "\xd0",
        );
        # special letters coded on a single byte
        %replacement_for = (
            "\xe1" => "\xc6", "\xe2" => "\xd0", "\xe9" => "\xd8", "\xec" => "\xde",
            "\xf1" => "\xe6", "\xf3" => "\xf0", "\xf9" => "\xf8", "\xfb" => "\xdf",
        );
    }
    elsif ($encoding eq "USMARC" || $encoding eq "MARC21") {
        return $string unless $string =~ /[\xc1-\xff]/;
        %diacritic_byte = (
            grave     => "\xe1", acute  => "\xe2", circumflex => "\xe3", tilde => "\xe4",
            diaeresis => "\xe8", umlaut => "\xe9", ring       => "\xea",
        );
    }
    else {
        return $string;
    }

    for my $diacritic (keys %diacritic_byte) {
        my $letters = $latin1_for{$diacritic};
        for my $base (keys %$letters) {
            $replacement_for{ $diacritic_byte{$diacritic} . $base } = $letters->{$base};
        }
    }

    # longest sequences first, so that a 2 byte sequence wins over a single byte
    my $sequences = join '|',
        map  { quotemeta }
        sort { length($b) <=> length($a) || $a cmp $b }
        keys %replacement_for;
    (my $decoded = $string) =~ s/($sequences)/$replacement_for{$1}/g;

    # this handles non-sorting blocks (if implementation requires this)
    return nsb_clean($decoded);
}
# nsb_clean($string)
# handles non sorting blocks
# Returns a copy of $string in which:
#   - each NSB byte (\x88, begin Non Sorting Block) is replaced by "("
#   - each NSE byte (\x89, Non Sorting Block end), together with the space that
#     may precede it, is replaced by ") "
# The work is done on a lexical copy, so the caller's $_ is left untouched.
sub nsb_clean {
    my ($string) = @_ ;
    return $string unless defined $string;
    $string =~ s/\x88/(/g ;       # NSB : begin Non Sorting Block
    $string =~ s/[ ]?\x89/) /g ;  # NSE : Non Sorting Block end
    return($string) ;
}
# FindDuplicate($record, $authtypecode)
# Looks for an existing authority of type $authtypecode similar to the
# MARC::Record $record.
# The subfields of the "tag to report" of the authority type (read from
# auth_types and auth_subfield_structure) that have a value in $record are used
# as "and" / "=" criteria for authoritysearch.
# Returns (authid, summary) of the first authority found, or nothing when the
# search gives no result.
# NOTE(review): when $record holds none of those subfields, authoritysearch is
# still called, with empty criteria -- confirm that this is intended.
sub FindDuplicate {
    my ($record,$authtypecode)=@_;
    warn "IN for ".$record->as_formatted;
    my $dbh = C4::Context->dbh;
    # warn "".$record->as_formatted;
    my $sth = $dbh->prepare("select auth_tag_to_report,summary from auth_types where authtypecode=?");
    $sth->execute($authtypecode);
    my ($auth_tag_to_report,$taglist) = $sth->fetchrow;

    # build a request for authoritysearch
    my (@tags, @and_or, @excluding, @operator, @value);
    # warn " tag a reporter : $auth_tag_to_report";
    # warn "taglist ".$taglist;
    my @subfield = split /\[/, (defined $taglist ? $taglist : '');
    for my $i (1 .. $#subfield) {
        warn " ".$subfield[$i];
    }

    # field() gives the 1st field carrying the tag, or undef when the record
    # has none: the subfields are only read when it exists
    my $field = defined $auth_tag_to_report ? $record->field($auth_tag_to_report) : undef;
    if ($field) {
        my $sth = $dbh->prepare("select tagfield,tagsubfield from auth_subfield_structure where tagfield=? and authtypecode=? ");
        $sth->execute($auth_tag_to_report,$authtypecode);
        # warn " field $auth_tag_to_report exists";
        while (my ($tag,$subfield) = $sth->fetchrow){
            my $subfieldvalue = $field->subfield($subfield);
            next unless $subfieldvalue;
            warn "tag :".$tag." subfield: $subfield value : ".$subfieldvalue;
            push @tags, $tag.$subfield;
            push @and_or, "and";
            push @excluding, "";
            push @operator, "=";
            push @value, $subfieldvalue;
        }
    }

    my ($finalresult,$nbresult) = authoritysearch($dbh,\@tags,\@and_or,\@excluding,\@operator,\@value,0,10,$authtypecode);
    # there is at least 1 result => return the 1st one
    if ($nbresult) {
        warn "XXXXX $nbresult => ".$finalresult->[0]{authid},$finalresult->[0]{summary};
        return $finalresult->[0]{authid},$finalresult->[0]{summary};
    }
    # no result, returns nothing
    return;
}
END { } # module clean-up code here (global destructor)

# A module has to return a true value to the "require" / "use" that loads it.
1;

=head1 AUTHOR

Koha Development team <info@koha.org>

Paul POULAIN paul.poulain@free.fr

=cut

# $Id$
# $Log$
# Revision 1.20 2005/08/04 13:27:47 tipaul
# synch'ing 2.2 and head
# Revision 2005/08/01 15:14:50 tipaul
# minor change in summary handling (accepting 4 digits before the field)
# Revision 2005/06/07 10:02:00 tipaul
# porting dictionnary search from head to 2.2. there is now a ... facing titles, author & subject, to search in biblio & authorities existing values.
# Revision 2005/05/31 14:50:46 tipaul
# fix for authority merging. There was a bug on official installs
# Revision 2005/05/30 11:24:15 tipaul
# fixing a bug : when a field was repeated, the last field was also repeated. (Was due to the "empty" field in html between fields : to separate fields, in html, an empty field is automatically added. in AUTHhtml2marc, this empty field was not discarded correctly)
# Revision 2005/04/28 08:45:33 tipaul
# porting FindDuplicate feature for authorities from HEAD to rel_2_2, works correctly now.
# Revision 2005/02/28 14:03:13 tipaul
# * adding search on "main entry" (ie $a subfield) on a given authority (the "search everywhere" field is still here).
# * adding a select box to requet "contain" or "begin with" search.
# * fixing some bug in authority search (related to "main entry" search)
# Revision 2005/02/24 13:12:13 tipaul
# saving authority modif in a text file. This will be used soon with another script (in crontab). The script in crontab will retrieve every authorityid in the directory localfile/authorities and modify every biblio using this authority. Those modifs may be long. So they can't be done through http, because we may encounter a webserver timeout, and kill the process before end of the job.
# So, it will be done through a cron job.
# (/me agree we need some doc for command line scripts)
# Revision 1.9 2004/12/23 09:48:11 tipaul
# Minor changes in summary "exploding" (the 3 digits AFTER the subfield were not on the right place).
# Revision 1.8 2004/11/05 10:11:39 tipaul
# export auth_count_usage (bugfix)
# Revision 1.7 2004/09/23 16:13:00 tipaul
# Bugfix in modification
# Revision 1.6 2004/08/18 16:00:24 tipaul
# fixes for authorities management
# Revision 1.5 2004/07/05 13:37:22 doxulting
# First step for working authorities
# Revision 1.4 2004/06/22 11:35:37 tipaul
# removing % at the beginning of a string to avoid loooonnnngggg searchs
# Revision 1.3 2004/06/17 08:02:13 tipaul
# merging tag & subfield in auth_word for better perfs
# Revision 1.2 2004/06/10 08:29:01 tipaul
# MARC authority management (continued)
# Revision 1.1 2004/06/07 07:35:01 tipaul
# MARC authority management package