From 89f8e98846f4defbde632abafdb2a019151d6088 Mon Sep 17 00:00:00 2001 From: Mike Rylander Date: Wed, 30 Apr 2014 12:58:11 -0400 Subject: [PATCH] LP#1312945: auth-auth linking: cache less agressively and look for all links There was a logic inversion that was causing miss-use of a per- record cache mechanism. I remove that entirely, as it's not helpful in practice. Also, after finding one use of a linked field we moved on to the next, though it is possible for more than one link to exist for different uses of a name, say. Now we'll loop through all fields to find all possible linkages. Signed-off-by: Mike Rylander Signed-off-by: Srey Seng Signed-off-by: Galen Charlton --- .../authority_authority_linker.pl.in | 45 +++++++++++----------- 1 file changed, 22 insertions(+), 23 deletions(-) diff --git a/Open-ILS/src/support-scripts/authority_authority_linker.pl.in b/Open-ILS/src/support-scripts/authority_authority_linker.pl.in index 5f00f2be9b..d9ba725718 100755 --- a/Open-ILS/src/support-scripts/authority_authority_linker.pl.in +++ b/Open-ILS/src/support-scripts/authority_authority_linker.pl.in @@ -71,9 +71,10 @@ sub marcxml_eg { } sub matchable_string { - my ($field, $sf_list) = @_; + my ($field, $sf_list, $joiner) = @_; + $joiner ||= ' '; - return join("", map { $field->subfield($_) } split "", $sf_list); + return join($joiner, map { $field->subfield($_) } split "", $sf_list); } # ########### main @@ -148,19 +149,17 @@ my $problems = 0; while (my ($src, $links) = $sth->fetchrow_array) { print "src: $src\n" if $options{debug}; - my $per_src_target_cache = {}; try { my $src_rec = $e->retrieve_authority_record_entry($src) or die $e->die_event; my $src_marc = MARC::Record->new_from_xml($src_rec->marc); - LINK: for my $link (split ';', $links) { + for my $link (split ';', $links) { my ($target, $field_id) = split ',', $link; print "target: $target, field_id: $field_id\n" if $options{debug}; - my $target_rec = ($per_src_target_cache->{$src} ||= - $e->retrieve_authority_record_entry($target)) or + my $target_rec = $e->retrieve_authority_record_entry($target) or die $e->die_event; my $target_marc = MARC::Record->new_from_xml($target_rec->marc); my $cni = $target_marc->field('003')->data; @@ -169,31 +168,31 @@ while (my ($src, $links) = $sth->fetchrow_array) { for my $field ($src_marc->field($acsaf->tag)) { my $src_string = matchable_string( - $field, $acsaf->main_entry->display_sf_list + $field, $acsaf->main_entry->display_sf_list, $acsaf->main_entry->joiner ); print("at field ", $acsaf->id, " (", $acsaf->tag, "), trying to match '$src_string'...\n") if $options{debug}; - for my $tfield ($target_marc->field($acsaf->main_entry->tag)) { - my $target_string = matchable_string( - $tfield, $acsaf->main_entry->display_sf_list - ); - - if ($target_string eq $src_string) { - print "got a match ...\n" if $options{debug}; - $field->update('0' => "($cni)$target"); - $src_rec->marc(marcxml_eg($src_marc->as_xml_record)); - - $e->xact_begin; - $e->update_authority_record_entry($src_rec) or - die $e->die_event; - $e->xact_commit; - next LINK; - } + my ($tfield) = $target_marc->field($acsaf->main_entry->tag); + my $target_string = matchable_string( + $tfield, $acsaf->main_entry->display_sf_list, $acsaf->main_entry->joiner + ); + + if ($target_string eq $src_string) { + print "got a match ...\n" if $options{debug}; + $field->update('0' => "($cni)$target"); } } } + + $src_rec->marc(marcxml_eg($src_marc->as_xml_record)); + + $e->xact_begin; + $e->update_authority_record_entry($src_rec) or + die $e->die_event; + $e->xact_commit; + } otherwise { my $err = shift; print STDERR "\nRecord # $src : ", -- 2.11.0