From 788e51adb1423806d0e4691e4581f9a55c916a44 Mon Sep 17 00:00:00 2001 From: Robin Sheat Date: Fri, 8 Mar 2013 14:29:39 +1300 Subject: [PATCH] Bug 9035 - delete bulkauthimport.pl Then bulkauthimport.pl? bulkauthimport should not be used ever. it probably should be deleted It should be. Signed-off-by: David Cook I've poked around in bulkmarcimport.pl and it certainly seems to have the functionality that Mason (and Jared and Robin) mention. Signed-off-by: Jonathan Druart Signed-off-by: Jared Camins-Esakov --- misc/migration_tools/bulkauthimport.pl | 154 ------------------------- 1 file changed, 154 deletions(-) delete mode 100755 misc/migration_tools/bulkauthimport.pl diff --git a/misc/migration_tools/bulkauthimport.pl b/misc/migration_tools/bulkauthimport.pl deleted file mode 100755 index 2709db91c9..0000000000 --- a/misc/migration_tools/bulkauthimport.pl +++ /dev/null @@ -1,154 +0,0 @@ -#!/usr/bin/perl -# small script that import an iso2709 file into koha 2.0 - -use strict; -#use warnings; FIXME - Bug 2505 -BEGIN { - # find Koha's Perl modules - # test carefully before changing this - use FindBin; - eval { require "$FindBin::Bin/kohalib.pl" }; -} - -# Koha modules used -use Unicode::Normalize; -use MARC::File::USMARC; -use MARC::File::XML; -use MARC::Record; -use MARC::Batch; -use C4::Context; -use C4::Charset; -use C4::AuthoritiesMarc; -use Time::HiRes qw(gettimeofday); -use Getopt::Long; -use IO::File; - -my ( $input_marc_file, $number) = ('',0); -my ($version, $delete, $test_parameter,$char_encoding, $verbose, $format, $commit); -$| = 1; -GetOptions( - 'file:s' => \$input_marc_file, - 'n:i' => \$number, - 'h' => \$version, - 'd' => \$delete, - 't' => \$test_parameter, - 'c:s' => \$char_encoding, - 'v:s' => \$verbose, - 'm:s' => \$format, - 'commit:f' => \$commit, -); - -if ($version || ($input_marc_file eq '')) { - print <dbh; - -if ($delete) { - print "deleting authorities\n"; - $dbh->do("truncate auth_header"); -} -if ($test_parameter) { - print "TESTING MODE ONLY\n DOING NOTHING\n===============\n"; -} - -my $marcFlavour = C4::Context->preference('marcflavour') || 'MARC21'; -$char_encoding = 'MARC21' unless ($char_encoding); -print "CHAR : $char_encoding\n" if $verbose; -my $starttime = gettimeofday; -my $fh = IO::File->new($input_marc_file); # don't let MARC::Batch open the file, as it applies the ':utf8' IO layer -my $batch; -if ($format =~ /XML/i) { - # ugly hack follows -- MARC::File::XML, when used by MARC::Batch, - # appears to try to convert incoming XML records from MARC-8 - # to UTF-8. Setting the BinaryEncoding key turns that off - # TODO: see what happens to ISO-8859-1 XML files. - # TODO: determine if MARC::Batch can be fixed to handle - # XML records properly -- it probably should be - # be using a proper push or pull XML parser to - # extract the records, not using regexes to look - # for .*. - $MARC::File::XML::_load_args{BinaryEncoding} = 'utf-8'; - $batch = MARC::Batch->new( 'XML', $fh ); -} else { - $batch = MARC::Batch->new( 'USMARC', $fh ); -} -$batch->warnings_off(); -$batch->strict_off(); -my $i=0; - -$dbh->{AutoCommit} = 0; -my $commitnum = 50; -if ($commit) { - $commitnum = $commit; -} - -RECORD: while ( my $record = $batch->next() ) { - $i++; - print "."; - print "\r$i" unless $i % 100; - - if ($record->encoding() eq 'MARC-8') { - my ($guessed_charset, $charset_errors); - ($record, $guessed_charset, $charset_errors) = MarcToUTF8Record($record, $marcFlavour); - if ($guessed_charset eq 'failed') { - warn "ERROR: failed to perform character conversion for record $i\n"; - next RECORD; - } - } - - warn "$i ==>".$record->as_formatted() if $verbose eq 2; - my $authtypecode; - if (C4::Context->preference('marcflavour') eq 'MARC21') { - $authtypecode="PERSO_NAME" if ($record->field('100')); - $authtypecode="CORPO_NAME" if ($record->field('110')); - $authtypecode="MEETI_NAME" if ($record->field('111')); - $authtypecode="UNIF_TITLE" if ($record->field('130')); - $authtypecode="CHRON_TERM" if ($record->field('148') or $record->field('182')); - $authtypecode="TOPIC_TERM" if ($record->field('150') or $record->field('180')); - $authtypecode="GEOGR_NAME" if ($record->field('151') or $record->field('181')); - $authtypecode="GENRE/FORM" if ($record->field('155') or $record->field('185')); - next unless $authtypecode; # skip invalid records FIXME: far too simplistic - } - else { - $authtypecode=substr($record->leader(),9,1); - $authtypecode="NP" if ($authtypecode eq 'a'); # personnes - $authtypecode="CO" if ($authtypecode eq 'b'); # collectivit� - $authtypecode="NG" if ($authtypecode eq 'c'); # g�graphique - $authtypecode="NM" if ($authtypecode eq 'd'); # marque - $authtypecode="NF" if ($authtypecode eq 'e'); # famille - $authtypecode="TI" if ($authtypecode eq 'f'); # Titre uniforme - $authtypecode="TI" if ($authtypecode eq 'h'); # auteur/titre - $authtypecode="MM" if ($authtypecode eq 'j'); # mot mati�e - } - - unless ($test_parameter) { - my ($authid) = AddAuthority($record,0,$authtypecode); - warn "ADDED authority NB $authid in DB\n" if $verbose; - $dbh->commit() if (0 == $i % $commitnum); - } - - last if $i == $number; -} -$dbh->commit(); - -my $timeneeded = gettimeofday - $starttime; -print "\n$i MARC record done in $timeneeded seconds\n"; -- 2.39.5