Koha/Koha/BiblioUtils.pm
Nick Clemens e42b4088ed Bug 26180: Add descending option to rebuild_elasticsearch.pl
While the ES index is incremental and provides results as it commits, we currently index from the oldest records to the newest.

This patch provides the option to go the other direction

To test:
 1 - Have ES setup and running for Koha
 2 - perl misc/search_tools/rebuild_elasticsearch.pl -v -v -b
 3 - Note the biblios index from number 1 the end
 4 - perl misc/search_tools/rebuild_elasticsearch.pl -v -v -a
 5 - Notice the same
 6 - Apply patch
 7 - perl misc/search_tools/rebuild_elasticsearch.pl -v -v -b
 8 - Still in ascending order
 9 - perl misc/search_tools/rebuild_elasticsearch.pl -v -v -b --desc
10 - Now records index in descending order
11 - perl misc/search_tools/rebuild_elasticsearch.pl -v -v -a
12 - Still ascending
13 - perl misc/search_tools/rebuild_elasticsearch.pl -v -v -a --desc
14 - Now descending

Signed-off-by: Séverine QUEUNE <severine.queune@bulac.fr>
Signed-off-by: Martin Renvoize <martin.renvoize@ptfs-europe.com>

JD amended patch: fix typo "inde" vs "index" and add commit body

Signed-off-by: Jonathan Druart <jonathan.druart@bugs.koha-community.org>
2020-11-04 12:59:33 +01:00

197 lines
4.9 KiB
Perl

package Koha::BiblioUtils;
# This contains functions to do with managing biblio records.
# Copyright 2014 Catalyst IT
#
# This file is part of Koha.
#
# Koha is free software; you can redistribute it and/or modify it
# under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 3 of the License, or
# (at your option) any later version.
#
# Koha is distributed in the hope that it will be useful, but
# WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with Koha; if not, see <http://www.gnu.org/licenses>.
=head1 NAME
Koha::BiblioUtils - contains fundamental biblio-related functions
=head1 DESCRIPTION
This contains functions for normal operations on biblio records.
Note: really, C4::Biblio does the main functions, but the Koha namespace is
the new thing that should be used.
=cut
use C4::Biblio; # EmbedItemsInMarcBiblio
use Koha::MetadataIterator;
use Koha::Database;
use Modern::Perl;
use Data::Dumper; # TODO remove
use base qw(Koha::MetadataRecord);
__PACKAGE__->mk_accessors(qw( record schema id datatype ));
=head1 FUNCTIONS
=head2 new
my $biblio = Koha::BiblioUtils->new($marc_record, [$biblionumber]);
Creates an instance of C<Koha::BiblioUtils> based on the marc record. If known,
the biblionumber can be provided too.
=cut
sub new {
my $class = shift;
my $record = shift;
my $biblionumber = shift;
my $self = $class->SUPER::new(
{
'record' => $record,
'schema' => lc C4::Context->preference("marcflavour"),
'id' => $biblionumber,
'datatype' => 'biblio',
}
);
bless $self, $class;
return $self;
}
=head2 get_from_biblionumber
my $biblio = Koha::BiblioUtils->get_from_biblionumber($biblionumber, %options);
This will give you an instance of L<Koha::BiblioUtils> that is the biblio that
you requested.
Options are:
=over 4
=item C<$item_data>
If true, then the item data will be merged into the record when it's loaded.
=back
It will return C<undef> if the biblio doesn't exist.
=cut
sub get_from_biblionumber {
my ($class, $bibnum, %options) = @_;
my $marc = $class->get_marc_biblio($bibnum, %options);
return $class->new($marc, $bibnum);
}
=head2 get_all_biblios_iterator
my $it = Koha::BiblioUtils->get_all_biblios_iterator(%options);
This will provide an iterator object that will, one by one, provide the
Koha::BiblioUtils of each biblio. This will include the item data.
The iterator is a Koha::MetadataIterator object.
Possible options are:
=over 4
=item C<slice>
slice may be defined as a hash of two values: index and count. index
is the slice number to process and count is total number of slices.
With this information the iterator returns just the given slice of
records instead of all.
=back
=cut
sub get_all_biblios_iterator {
my ($self, %options) = @_;
my $search_terms = {};
my ($slice_modulo, $slice_count);
if ($options{slice}) {
$slice_count = $options{slice}->{count};
$slice_modulo = $options{slice}->{index};
$search_terms = \[ 'mod(biblionumber, ?) = ?', $slice_count, $slice_modulo ];
}
my $search_options = { columns => [qw/ biblionumber /] };
if ( $options{desc} ){
$search_options->{order_by} = { -desc => 'biblionumber' };
}
my $database = Koha::Database->new();
my $schema = $database->schema();
my $rs =
$schema->resultset('Biblio')->search(
$search_terms,
$search_options );
my $next_func = sub {
# Warn and skip bad records, otherwise we break the loop
while (1) {
my $row = $rs->next();
return if !$row;
my $marc = C4::Biblio::GetMarcBiblio({
biblionumber => $row->biblionumber,
embed_items => 1 });
my $next = eval {
__PACKAGE__->new($marc, $row->biblionumber);
};
if ($@) {
warn "Something went wrong reading record for biblio $row->biblionumber: $@\n";
next;
}
return $next;
}
};
return Koha::MetadataIterator->new($next_func);
}
=head2 get_marc_biblio
my $marc = Koha::BiblioUtils->get_marc_biblio($bibnum, %options);
This non-class function fetches the MARC::Record for the given biblio number.
Nothing is returned if the biblionumber couldn't be found (or it somehow has no
MARC data.)
Options are:
=over 4
=item item_data
If set to true, item data is embedded in the record. Default is to not do this.
=back
=cut
sub get_marc_biblio {
my ($class, $bibnum, %options) = @_;
return C4::Biblio::GetMarcBiblio({
biblionumber => $bibnum,
embed_items => ($options{item_data} ? 1 : 0 ) });
}
1;