Koha/misc/migration_tools/remove_unused_authorities.pl
Fridolin Somers fc4cffe1f0
Bug 21865: ES compatibility of remove_unused_authorities.pl
The script misc/migration_tools/remove_unused_authorities.pl directly checks if Zebra search is OK.

This patch makes that check run only when Zebra is the search engine.
It also adds a test search for any indexed authority number (index 'an').
With Zebra it is: an,alwaysmatches=''
With ES it is: an:*
This test ensures that biblio records are indexed, so that not all authorities get deleted.

Test plan:
1) On a catalog create a new authority
2) Use Zebra in systempreference SearchEngine
3) Stop Zebra server
4) Run misc/migration_tools/remove_unused_authorities.pl -c
5) The script does nothing and says :
   Zebra server seems not to be available. This script needs Zebra runs.
6) Restart Zebra server
7) Delete biblio index base
8) Run misc/migration_tools/remove_unused_authorities.pl -c
9) The script does nothing and says :
   Searching authority number in biblio records seems not to be available : an,alwaysmatches=''
10) Use ElasticSearch in systempreference SearchEngine
11) Delete biblio index base
12) Run misc/migration_tools/remove_unused_authorities.pl -c
13) The script does nothing and says :
    Searching authority number in biblio records seems not to be available : an:*

Signed-off-by: Bernardo Gonzalez Kriegel <bgkriegel@gmail.com>
Signed-off-by: Jonathan Druart <jonathan.druart@bugs.koha-community.org>
Signed-off-by: Martin Renvoize <martin.renvoize@ptfs-europe.com>
2020-04-14 16:54:10 +01:00

141 lines
4.1 KiB
Perl
Executable file

#!/usr/bin/perl
#script to administer Authorities without biblio
# Copyright 2009 BibLibre
# written 2009-05-04 by paul dot poulain at biblibre.com
#
# This file is part of Koha.
#
# Koha is free software; you can redistribute it and/or modify it
# under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 3 of the License, or
# (at your option) any later version.
#
# Koha is distributed in the hope that it will be useful, but
# WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with Koha; if not, see <http://www.gnu.org/licenses>.
use Modern::Perl;
use Koha::Script;
use C4::Context;
use C4::AuthoritiesMarc;
use Getopt::Long;
use Koha::SearchEngine::Search;
# Command-line state shared with the rest of the script.
my @authtypes;    # authority type codes collected from --aut (repeatable)
my $want_help = 0;
my $test      = 0;

# GetOptions warns and returns false when it meets an unknown or malformed
# option. This script deletes records, so a mistyped option (for instance a
# misspelled --test) must never fall through to a real run: show the usage
# text and stop with a non-zero status instead.
my $options_ok = GetOptions(
    'aut|authtypecode:s' => \@authtypes,
    't|test'             => \$test,
    'h|help'             => \$want_help
);
unless ($options_ok) {
    print_usage();
    exit 1;
}

if ($want_help) {
    print_usage();
    exit 0;
}

# Tell the operator which mode and which restriction are in effect.
if ($test) {
    print "*** Testing only, authorities will not be deleted. ***\n";
}
if (@authtypes) {
    print "Restricted to authority type(s) : ".join(',', @authtypes).".\n";
}
# Search object bound to the 'biblios' index; used for the sanity check below
# and for every later lookup in this script.
my $searcher = Koha::SearchEngine::Search->new( { index => 'biblios' } );

# Choose a query that matches any biblio record carrying an authority number,
# written in the syntax of the configured search engine.
my $checksearch;
if ( C4::Context->preference("SearchEngine") eq 'Zebra' ) {
    # Check server state before trusting any search result: error code 10000
    # is reported as "server not available", any other non-zero code is
    # reported verbatim.
    my $errZebraConnection = C4::Context->Zconn("biblioserver",0)->errcode();
    if ( $errZebraConnection == 10000 ) {
        die "Zebra server seems not to be available. This script needs Zebra runs.";
    } elsif ( $errZebraConnection ) {
        die "Error from Zebra: $errZebraConnection";
    }
    $checksearch = q{an,alwaysmatches=''};
}
else {
    # Any engine other than Zebra gets the 'an:*' wildcard form.
    $checksearch = q{an:*};
}

# Check that a search on authority number has at least one result. If it has
# none, the biblio index cannot be trusted and every authority would look
# unused, so refuse to go any further.
my ($err,$res,$nb) = $searcher->simple_search_compat($checksearch,0,10);
unless ( defined $nb && $nb > 0 ) {
    # Surface the search error when there is one instead of dropping it.
    my $reason = defined $err ? " ($err)" : '';
    die "Searching authority number in biblio records seems not to be available : $checksearch$reason";
}
my $dbh = C4::Context->dbh;

# Prepare the request to retrieve all authorities of the requested types.
# The type codes are bound through placeholders (one '?' per code); without
# --aut the query has no WHERE clause and selects every authority.
my $rqsql = q{ SELECT authid,authtypecode FROM auth_header };
$rqsql .= q{ WHERE authtypecode IN (}.join(',',map{ '?' }@authtypes).')' if @authtypes;
my $rqselect = $dbh->prepare($rqsql);
$| = 1;    # flush output after every print so progress is visible immediately
$rqselect->execute(@authtypes);

my $counter      = 0;    # authorities read from the database
my $totdeleted   = 0;    # authorities deleted (or deletable in test mode)
my $totundeleted = 0;    # authorities kept because a biblio uses them

while ( my $data = $rqselect->fetchrow_hashref ) {
    $counter++;
    print 'authid='.$data->{'authid'};
    print ' type='.$data->{'authtypecode'};
    my $bibliosearch = 'an:'.$data->{'authid'};

    # search for biblios mapped
    my ($err,$res,$used) = $searcher->simple_search_compat($bibliosearch,0,10);
    if (defined $err) {
        print "\n";
        warn "Error: $err on search for biblios $bibliosearch\n";
        next;
    }

    # A missing hit count is not evidence that the authority is unused:
    # skip the record rather than delete it on the strength of undef.
    unless (defined $used) {
        print "\n";
        warn "Error: no hit count returned on search for biblios $bibliosearch\n";
        next;
    }

    if ( $used > 0 ) {
        $totundeleted++;
        print " : used $used time(s)";
    }
    else {
        if ($test) {
            print " : can be deleted";
        }
        else {
            DelAuthority({ authid => $data->{'authid'} });
            print " : deleted";
        }
        $totdeleted++;
    }
    print "\n";
}

# Final summary; the wording depends on whether anything was really deleted.
print "$counter authorities parsed\n";
if ($test) {
    print "$totdeleted can be deleted because unused\n";
}
else {
    print "$totdeleted deleted because unused\n";
}
print "$totundeleted unchanged because used\n";
# Print the command-line help text to the currently selected output handle.
# The first line starts with the name the script was invoked under ($0).
# Takes no arguments.
sub print_usage {
    my @help_lines = (
        "$0: Remove unused authority records",
        'This script removes authority records that do not have any biblio',
        'records attached to them.',
        'If the --aut option is supplied, only authority records of that',
        'particular type will be checked for usage. --aut can be repeated.',
        'If --aut is not supplied, all authority records will be checked.',
        'Use --test to perform a test run. This script does not ask the',
        'operator to confirm the deletion of each authority record.',
        'parameters',
        '--aut|authtypecode TYPE the list of authtypes to check',
        q{--test or -t test mode, don't delete really, just count},
        '--help or -h show this message.',
    );

    # Every line, including the last one, is terminated by a newline.
    print join( "\n", @help_lines ) . "\n";
}