next unless $data;
- postprocess( { bib => $bib, worm_data => $data } );
+ postprocess( { bib => $bib, ingest_data => $data } );
if (!($count % 20)) {
print NEWERR "\r$count\t". $count / (time - $starttime);
my $data = shift;
my $bib = $data->{bib};
- my $full_rec = $data->{worm_data}->{full_rec};
+ my $full_rec = $data->{ingest_data}->{full_rec};
- my $field_entries = $data->{worm_data}->{field_entries} unless ($auth);
- my $fp = $data->{worm_data}->{fingerprint} unless ($auth);
- my $rd = $data->{worm_data}->{descriptor} unless ($auth);
+ my $field_entries = $data->{ingest_data}->{field_entries} unless ($auth);
+ my $fp = $data->{ingest_data}->{fingerprint} unless ($auth);
+ my $rd = $data->{ingest_data}->{descriptor} unless ($auth);
$bib->fingerprint( $fp->{fingerprint} ) unless ($auth);
$bib->quality( $fp->{quality} ) unless ($auth);
use strict;
use Getopt::Long;
-my ($start, $stop, $count, $group, $out, $method) = (1,1,1,50,'dynamic-wormizer-script.sfsh', 'open-ils.worm.wormize.biblio.nomap.noscrub');
+my ($start, $stop, $count, $group, $out, $method) = (1,1,1,50,'dynamic-reindex-script.sfsh', 'open-ils.ingest.full.biblio.record_list');
GetOptions ( "start=i" => \$start,
"end=i" => \$stop,
"groupsize=i" => \$group,
push @list, $i;
next;
}
- print SFSH "request open-ils.storage $method [".join(',', @list)."]\n" if (@list);
- @list = ($i);
+ push @list, $i;
+ print SFSH "request open-ils.ingest $method [".join(',', @list)."]\n" if (@list);
+ @list = ();
}
-print SFSH "request open-ils.storage $method [".join(',', @list)."]\n" if (@list);
+print SFSH "request open-ils.ingest $method [".join(',', @list)."]\n" if (@list);
$apputils->commit_db_session($session);
- $logger->debug("Sending record off to be wormized");
+ $logger->debug("Sending record off to be ingested and indexed");
$client->respond_complete($record);
argc => 1,
);
+# rw_biblio_ingest_record_list
+#
+# Runs the full biblio ingest over a list of record ids.
+#
+# Arguments (after the usual $self / $client pair):
+#   either a single array reference of record ids, or a flat list of ids.
+#
+# Returns:
+#   undef when no ids were supplied or when the cstore search finds no
+#   matching biblio.record_entry rows; otherwise the sum of the first
+#   value returned by "open-ils.ingest.full.biblio.object" for each
+#   record found.
+#   NOTE(review): that first value is presumably a per-record success
+#   flag/count -- confirm against the callee.
+sub rw_biblio_ingest_record_list {
+    my $self = shift;
+    my $client = shift;
+    # Accept both call styles: method([1,2,3]) and method(1,2,3).
+    my @rec = ref($_[0]) ? @{ $_[0] } : @_ ;
+
+    OpenILS::Application::Ingest->post_init();
+
+    # Nothing to look up: avoid opening a cstore session just to search
+    # with an empty id list.
+    return undef unless (@rec);
+
+    my $cstore = OpenSRF::AppSession->connect( 'open-ils.cstore' );
+    $cstore->request('open-ils.cstore.transaction.begin')->gather(1);
+
+    # Pass the id list as an array reference.  The previous code used the
+    # undeclared scalar $rec here instead of the @rec array built above.
+    my $r = $cstore->request( 'open-ils.cstore.direct.biblio.record_entry.search.atomic' => { id => \@rec } )->gather(1);
+
+    # Only a search is issued inside this transaction, so it is rolled
+    # back rather than committed.
+    $cstore->request('open-ils.cstore.transaction.rollback')->gather(1);
+    $cstore->disconnect;
+
+    return undef unless ($r and @$r);
+
+    # Hand each fetched record object to the single-object ingest method
+    # and accumulate the first value each call returns.
+    my $count = 0;
+    $count += ($self->method_lookup("open-ils.ingest.full.biblio.object")->run($_))[0] for (@$r);
+
+    return $count;
+}
+__PACKAGE__->register_method(
+ api_name => "open-ils.ingest.full.biblio.record_list",
+ method => "rw_biblio_ingest_record_list",
+ api_level => 1,
+ argc => 1,
+);
+
sub ro_biblio_ingest_single_object {
my $self = shift;
my $client = shift;
1;
-__END__
-
-sub in_transaction {
- OpenILS::Application::Ingest->post_init();
- return __PACKAGE__->storage_req( 'open-ils.storage.transaction.current' );
-}
-
-sub begin_transaction {
- my $self = shift;
- my $client = shift;
-
- OpenILS::Application::Ingest->post_init();
- my $outer_xact = __PACKAGE__->storage_req( 'open-ils.storage.transaction.current' );
-
- try {
- if (!$outer_xact) {
- $log->debug("Ingest isn't inside a transaction, starting one now.", INFO);
- #__PACKAGE__->st_sess->connect;
- my $r = __PACKAGE__->storage_req( 'open-ils.storage.transaction.begin', $client );
- unless (defined $r and $r) {
- __PACKAGE__->storage_req( 'open-ils.storage.transaction.rollback' );
- #__PACKAGE__->st_sess->disconnect;
- throw OpenSRF::EX::PANIC ("Couldn't BEGIN transaction!")
- }
- }
- } otherwise {
- $log->debug("Ingest Couldn't BEGIN transaction!", ERROR)
- };
-
- return __PACKAGE__->storage_req( 'open-ils.storage.transaction.current' );
-}
-
-sub rollback_transaction {
- my $self = shift;
- my $client = shift;
-
- OpenILS::Application::Ingest->post_init();
- my $outer_xact = __PACKAGE__->storage_req( 'open-ils.storage.transaction.current' );
-
- try {
- if ($outer_xact) {
- __PACKAGE__->storage_req( 'open-ils.storage.transaction.rollback' );
- } else {
- $log->debug("Ingest isn't inside a transaction.", INFO);
- }
- } catch Error with {
- throw OpenSRF::EX::PANIC ("Ingest Couldn't ROLLBACK transaction!")
- };
-
- return 1;
-}
-
-sub commit_transaction {
- my $self = shift;
- my $client = shift;
-
- OpenILS::Application::Ingest->post_init();
- my $outer_xact = __PACKAGE__->storage_req( 'open-ils.storage.transaction.current' );
-
- try {
- #if (__PACKAGE__->st_sess->connected && $outer_xact) {
- if ($outer_xact) {
- my $r = __PACKAGE__->storage_req( 'open-ils.storage.transaction.commit' );
- unless (defined $r and $r) {
- __PACKAGE__->storage_req( 'open-ils.storage.transaction.rollback' );
- throw OpenSRF::EX::PANIC ("Couldn't COMMIT transaction!")
- }
- #__PACKAGE__->st_sess->disconnect;
- } else {
- $log->debug("Ingest isn't inside a transaction.", INFO);
- }
- } catch Error with {
- throw OpenSRF::EX::PANIC ("Ingest Couldn't COMMIT transaction!")
- };
-
- return 1;
-}
-
-sub storage_req {
- my $self = shift;
- my $method = shift;
- my @res = __PACKAGE__->method_lookup( $method )->run( @_ );
- return shift( @res );
-}
-
-sub scrub_authority_record {
- my $self = shift;
- my $client = shift;
- my $rec = shift;
-
- my $commit = 0;
- if (!OpenILS::Application::Ingest->in_transaction) {
- OpenILS::Application::Ingest->begin_transaction($client) || throw OpenSRF::EX::PANIC ("Couldn't BEGIN transaction!");
- $commit = 1;
- }
-
- my $success = 1;
- try {
- OpenILS::Application::Ingest->storage_req( 'open-ils.storage.savepoint.set', 'scrub_authority_record' );
-
- OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.authority.full_rec.mass_delete', { record => $rec } );
- OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.authority.record_descriptor.mass_delete', { record => $rec } );
-
- OpenILS::Application::Ingest->storage_req( 'open-ils.storage.savepoint.release', 'scrub_authority_record' );
- } otherwise {
- $log->debug('Scrubbing failed : '.shift(), ERROR);
- OpenILS::Application::Ingest->storage_req( 'open-ils.storage.savepoint.rollback', 'scrub_authority_record' );
- $success = 0;
- };
-
- OpenILS::Application::Ingest->commit_transaction if ($commit && $success);
- OpenILS::Application::Ingest->rollback_transaction if ($commit && !$success);
- return $success;
-}
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.scrub.authority",
- method => "scrub_authority_record",
- api_level => 1,
- argc => 1,
-);
-
-
-sub scrub_metabib_record {
- my $self = shift;
- my $client = shift;
- my $rec = shift;
-
- if ( ref($rec) && ref($rec) =~ /HASH/o ) {
- $rec = OpenILS::Application::Ingest->storage_req(
- 'open-ils.storage.id_list.biblio.record_entry.search_where', $rec
- );
- }
-
- my $commit = 0;
- if (!OpenILS::Application::Ingest->in_transaction) {
- OpenILS::Application::Ingest->begin_transaction($client) || throw OpenSRF::EX::PANIC ("Couldn't BEGIN transaction!");
- $commit = 1;
- }
-
- my $success = 1;
- try {
- OpenILS::Application::Ingest->storage_req( 'open-ils.storage.savepoint.set', 'scrub_metabib_record' );
-
- OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.metabib.full_rec.mass_delete', { record => $rec } );
- OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.metabib.metarecord_source_map.mass_delete', { source => $rec } );
- OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.metabib.record_descriptor.mass_delete', { record => $rec } );
- OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.metabib.title_field_entry.mass_delete', { source => $rec } );
- OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.metabib.author_field_entry.mass_delete', { source => $rec } );
- OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.metabib.subject_field_entry.mass_delete', { source => $rec } );
- OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.metabib.keyword_field_entry.mass_delete', { source => $rec } );
- OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.metabib.series_field_entry.mass_delete', { source => $rec } );
-
- $log->debug( "Looking for metarecords whose master is $rec", DEBUG);
- my $masters = OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.metabib.metarecord.search.master_record.atomic', $rec );
-
- for my $mr (@$masters) {
- $log->debug( "Found metarecord whose master is $rec", DEBUG);
- my $others = OpenILS::Application::Ingest->storage_req(
- 'open-ils.storage.direct.metabib.metarecord_source_map.search.metarecord.atomic', $mr->id );
-
- if (@$others) {
- $log->debug("Metarecord ".$mr->id." had master of $rec, setting to ".$others->[0]->source, DEBUG);
- $mr->master_record($others->[0]->source);
- OpenILS::Application::Ingest->storage_req(
- 'open-ils.storage.direct.metabib.metarecord.remote_update',
- { id => $mr->id },
- { master_record => $others->[0]->source, mods => undef }
- );
- } else {
- warn "Removing metarecord whose master is $rec";
- $log->debug( "Removing metarecord whose master is $rec", DEBUG);
- OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.metabib.metarecord.delete', $mr->id );
- warn "Metarecord removed";
- $log->debug( "Metarecord removed", DEBUG);
- }
- }
-
- OpenILS::Application::Ingest->storage_req( 'open-ils.storage.savepoint.release', 'scrub_metabib_record' );
-
- } otherwise {
- $log->debug('Scrubbing failed : '.shift(), ERROR);
- OpenILS::Application::Ingest->storage_req( 'open-ils.storage.savepoint.rollback', 'scrub_metabib_record' );
- $success = 0;
- };
-
- OpenILS::Application::Ingest->commit_transaction if ($commit && $success);
- OpenILS::Application::Ingest->rollback_transaction if ($commit && !$success);
- return $success;
-}
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.scrub.biblio",
- method => "scrub_metabib_record",
- api_level => 1,
- argc => 1,
-);
-
-sub wormize_biblio_metarecord {
- my $self = shift;
- my $client = shift;
- my $mrec = shift;
-
- my $recs = OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.metabib.metarecord_source_map.search.metarecord.atomic' => $mrec );
-
- my $count = 0;
- for my $r (@$recs) {
- my $success = 0;
- try {
- $success = wormize_biblio_record($self => $client => $r->source);
- $client->respond(
- { record => $r->source,
- metarecord => $rec->metarecord,
- success => $success,
- }
- );
- } catch Error with {
- my $e = shift;
- $client->respond(
- { record => $r->source,
- metarecord => $rec->metarecord,
- success => $success,
- error => $e,
- }
- );
- };
- }
- return undef;
-}
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.wormize.metarecord",
- method => "wormize_biblio_metarecord",
- api_level => 1,
- argc => 1,
- stream => 1,
-);
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.wormize.metarecord.nomap",
- method => "wormize_biblio_metarecord",
- api_level => 1,
- argc => 1,
- stream => 1,
-);
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.wormize.metarecord.noscrub",
- method => "wormize_biblio_metarecord",
- api_level => 1,
- argc => 1,
- stream => 1,
-);
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.wormize.metarecord.nomap.noscrub",
- method => "wormize_biblio_metarecord",
- api_level => 1,
- argc => 1,
- stream => 1,
-);
-
-
-sub wormize_biblio_record {
- my $self = shift;
- my $client = shift;
- my $rec = shift;
-
- if ( ref($rec) && ref($rec) =~ /HASH/o ) {
- $rec = OpenILS::Application::Ingest->storage_req(
- 'open-ils.storage.id_list.biblio.record_entry.search_where', $rec
- );
- }
-
-
- my $commit = 0;
- if (!OpenILS::Application::Ingest->in_transaction) {
- OpenILS::Application::Ingest->begin_transaction($client) || throw OpenSRF::EX::PANIC ("Couldn't BEGIN transaction!");
- $commit = 1;
- }
-
- my $success = 1;
- try {
- # clean up the cruft
- unless ($self->api_name =~ /noscrub/o) {
- $self->method_lookup( 'open-ils.worm.scrub.biblio' )->run( $rec ) || throw OpenSRF::EX::PANIC ("Couldn't scrub record $rec!");
- }
-
- # now redo 'em
- my $bibs = OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.biblio.record_entry.search.id.atomic', $rec );
-
- my @full_rec = ();
- my @rec_descriptor = ();
- my %field_entry = (
- title => [],
- author => [],
- subject => [],
- keyword => [],
- series => [],
- );
- my %metarecord = ();
- my @source_map = ();
- for my $r (@$bibs) {
- try {
- OpenILS::Application::Ingest->storage_req( 'open-ils.storage.savepoint.set', 'extract_data'.$r->id );
-
- my $xml = $parser->parse_string($r->marc);
-
- #update the fingerprint
- my ($fp) = $self->method_lookup( 'open-ils.worm.fingerprint.marc' )->run( $xml );
- OpenILS::Application::Ingest->storage_req(
- 'open-ils.storage.direct.biblio.record_entry.remote_update',
- { id => $r->id },
- { fingerprint => $fp->{fingerprint},
- quality => int($fp->{quality}) }
- ) if ($fp->{fingerprint} ne $r->fingerprint || int($fp->{quality}) ne $r->quality);
-
- # the full_rec stuff
- for my $fr ( $self->method_lookup( 'open-ils.worm.flat_marc.biblio.xml' )->run( $xml ) ) {
- $fr->record( $r->id );
- push @full_rec, $fr;
- }
-
- # the rec_descriptor stuff
- my ($rd) = $self->method_lookup( 'open-ils.worm.biblio_leader.xml' )->run( $xml );
- $rd->record( $r->id );
- push @rec_descriptor, $rd;
-
- # the indexing field entry stuff
- for my $class ( qw/title author subject keyword series/ ) {
- for my $fe ( $self->method_lookup( 'open-ils.worm.field_entry.class.xml' )->run( $xml, $class ) ) {
- $fe->source( $r->id );
- push @{$field_entry{$class}}, $fe;
- }
- }
-
- unless ($self->api_name =~ /nomap/o) {
- my $mr = OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.metabib.metarecord.search.fingerprint.atomic', $fp->{fingerprint} )->[0];
-
- unless ($mr) {
- $mr = Fieldmapper::metabib::metarecord->new;
- $mr->fingerprint( $fp->{fingerprint} );
- $mr->master_record( $r->id );
- $mr->id( OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.metabib.metarecord.create', $mr) );
- }
-
- my $mr_map = Fieldmapper::metabib::metarecord_source_map->new;
- $mr_map->metarecord( $mr->id );
- $mr_map->source( $r->id );
- push @source_map, $mr_map;
-
- $metarecord{$mr->id} = $mr;
- }
- OpenILS::Application::Ingest->storage_req( 'open-ils.storage.savepoint.release', 'extract_data'.$r->id );
- } otherwise {
- $log->debug('Data extraction failed for record '.$r->id.': '.shift(), ERROR);
- OpenILS::Application::Ingest->storage_req( 'open-ils.storage.savepoint.rollback', 'extract_data'.$r->id );
- };
- }
-
-
- if (@rec_descriptor) {
- OpenILS::Application::Ingest->storage_req( 'open-ils.storage.savepoint.set', 'wormize_record' );
-
- OpenILS::Application::Ingest->storage_req(
- 'open-ils.storage.direct.metabib.metarecord_source_map.batch.create',
- @source_map
- ) if (@source_map);
-
- for my $mr ( values %metarecord ) {
- my $sources = OpenILS::Application::Ingest->storage_req(
- 'open-ils.storage.direct.metabib.metarecord_source_map.search.metarecord.atomic',
- $mr->id
- );
-
- my $bibs = OpenILS::Application::Ingest->storage_req(
- 'open-ils.storage.direct.biblio.record_entry.search.id.atomic',
- [ map { $_->source } @$sources ]
- );
-
- my $master = ( sort { $b->quality <=> $a->quality } @$bibs )[0];
-
- OpenILS::Application::Ingest->storage_req(
- 'open-ils.storage.direct.metabib.metarecord.remote_update',
- { id => $mr->id },
- { master_record => $master->id, mods => undef }
- );
- }
-
- OpenILS::Application::Ingest->storage_req(
- 'open-ils.storage.direct.metabib.record_descriptor.batch.create',
- @rec_descriptor
- ) if (@rec_descriptor);
-
- OpenILS::Application::Ingest->storage_req(
- 'open-ils.storage.direct.metabib.full_rec.batch.create',
- @full_rec
- ) if (@full_rec);
-
- OpenILS::Application::Ingest->storage_req(
- 'open-ils.storage.direct.metabib.title_field_entry.batch.create',
- @{ $field_entry{title} }
- ) if (@{ $field_entry{title} });
-
- OpenILS::Application::Ingest->storage_req(
- 'open-ils.storage.direct.metabib.author_field_entry.batch.create',
- @{ $field_entry{author} }
- ) if (@{ $field_entry{author} });
-
- OpenILS::Application::Ingest->storage_req(
- 'open-ils.storage.direct.metabib.subject_field_entry.batch.create',
- @{ $field_entry{subject} }
- ) if (@{ $field_entry{subject} });
-
- OpenILS::Application::Ingest->storage_req(
- 'open-ils.storage.direct.metabib.keyword_field_entry.batch.create',
- @{ $field_entry{keyword} }
- ) if (@{ $field_entry{keyword} });
-
- OpenILS::Application::Ingest->storage_req(
- 'open-ils.storage.direct.metabib.series_field_entry.batch.create',
- @{ $field_entry{series} }
- ) if (@{ $field_entry{series} });
-
- OpenILS::Application::Ingest->storage_req( 'open-ils.storage.savepoint.release', 'wormize_record' );
- } else {
- $success = 0;
- }
-
- } otherwise {
- $log->debug('Wormization failed : '.shift(), ERROR);
- OpenILS::Application::Ingest->storage_req( 'open-ils.storage.savepoint.rollback', 'wormize_record' );
- $success = 0;
- };
-
- OpenILS::Application::Ingest->commit_transaction if ($commit && $success);
- OpenILS::Application::Ingest->rollback_transaction if ($commit && !$success);
- return $success;
-}
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.wormize.biblio",
- method => "wormize_biblio_record",
- api_level => 1,
- argc => 1,
-);
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.wormize.biblio.nomap",
- method => "wormize_biblio_record",
- api_level => 1,
- argc => 1,
-);
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.wormize.biblio.noscrub",
- method => "wormize_biblio_record",
- api_level => 1,
- argc => 1,
-);
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.wormize.biblio.nomap.noscrub",
- method => "wormize_biblio_record",
- api_level => 1,
- argc => 1,
-);
-
-sub wormize_authority_record {
- my $self = shift;
- my $client = shift;
- my $rec = shift;
-
- my $commit = 0;
- if (!OpenILS::Application::Ingest->in_transaction) {
- OpenILS::Application::Ingest->begin_transaction($client) || throw OpenSRF::EX::PANIC ("Couldn't BEGIN transaction!");
- $commit = 1;
- }
-
- my $success = 1;
- try {
- # clean up the cruft
- unless ($self->api_name =~ /noscrub/o) {
- $self->method_lookup( 'open-ils.worm.scrub.authority' )->run( $rec ) || throw OpenSRF::EX::PANIC ("Couldn't scrub record $rec!");
- }
-
- # now redo 'em
- my $bibs = OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.authority.record_entry.search.id.atomic', $rec );
-
- my @full_rec = ();
- my @rec_descriptor = ();
- for my $r (@$bibs) {
- my $xml = $parser->parse_string($r->marc);
-
- # the full_rec stuff
- for my $fr ( $self->method_lookup( 'open-ils.worm.flat_marc.authority.xml' )->run( $xml ) ) {
- $fr->record( $r->id );
- push @full_rec, $fr;
- }
-
- # the rec_descriptor stuff -- XXX What does this mean for authority records?
- #my ($rd) = $self->method_lookup( 'open-ils.worm.authority_leader.xml' )->run( $xml );
- #$rd->record( $r->id );
- #push @rec_descriptor, $rd;
-
- }
-
- OpenILS::Application::Ingest->storage_req( 'open-ils.storage.savepoint.set', 'wormize_authority_record' );
-
- #OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.authority.record_descriptor.batch.create', @rec_descriptor ) if (@rec_descriptor);
- OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.authority.full_rec.batch.create', @full_rec ) if (@full_rec);
-
- OpenILS::Application::Ingest->storage_req( 'open-ils.storage.savepoint.release', 'wormize_authority_record' );
-
- } otherwise {
- $log->debug('Wormization failed : '.shift(), ERROR);
- OpenILS::Application::Ingest->storage_req( 'open-ils.storage.savepoint.rollback', 'wormize_authority_record' );
- $success = 0;
- };
-
- OpenILS::Application::Ingest->commit_transaction if ($commit && $success);
- OpenILS::Application::Ingest->rollback_transaction if ($commit && !$success);
- return $success;
-}
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.wormize.authority",
- method => "wormize_authority_record",
- api_level => 1,
- argc => 1,
-);
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.wormize.authority.noscrub",
- method => "wormize_authority_record",
- api_level => 1,
- argc => 1,
-);
-
-
-# --------------------------------------------------------------------------------
-# MARC index extraction
-
-package OpenILS::Application::Ingest::XPATH;
-use base qw/OpenILS::Application::Ingest/;
-use Unicode::Normalize;
-
-# give this a MODS documentElement and an XPATH expression
-sub _xpath_to_string {
- my $xml = shift;
- my $xpath = shift;
- my $ns_uri = shift;
- my $ns_prefix = shift;
- my $unique = shift;
-
- $xml->setNamespace( $ns_uri, $ns_prefix, 1 ) if ($ns_uri && $ns_prefix);
-
- my $string = "";
-
- # grab the set of matching nodes
- my @nodes = $xml->findnodes( $xpath );
- for my $value (@nodes) {
-
- # grab all children of the node
- my @children = $value->childNodes();
- for my $child (@children) {
-
- # add the childs content to the growing buffer
- my $content = quotemeta($child->textContent);
- next if ($unique && $string =~ /$content/); # uniquify the values
- $string .= $child->textContent . " ";
- }
- if( ! @children ) {
- $string .= $value->textContent . " ";
- }
- }
- return NFD($string);
-}
-
-sub class_all_index_string_xml {
- my $self = shift;
- my $client = shift;
- my $xml = shift;
- my $class = shift;
-
- OpenILS::Application::Ingest->post_init();
- $xml = $parser->parse_string($xml) unless (ref $xml);
-
- my $class_constructor = "Fieldmapper::metabib::${class}_field_entry";
- for my $type ( keys %{ $xpathset->{$class} } ) {
- my $value = _xpath_to_string(
- $mods_sheet->transform($xml)->documentElement,
- $xpathset->{$class}->{$type}->{xpath},
- "http://www.loc.gov/mods/",
- "mods",
- 1
- );
-
- next unless $value;
-
- $value = NFD($value);
- $value =~ s/\pM+//sgo;
- $value =~ s/\pC+//sgo;
- $value =~ s/\W+$//sgo;
-
- $value =~ s/(\w)\./$1/sgo;
- $value = lc($value);
-
- my $fm = $class_constructor->new;
- $fm->value( $value );
- $fm->field( $xpathset->{$class}->{$type}->{id} );
- $client->respond($fm);
- }
- return undef;
-}
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.field_entry.class.xml",
- method => "class_all_index_string_xml",
- api_level => 1,
- argc => 1,
- stream => 1,
-);
-
-sub class_all_index_string_record {
- my $self = shift;
- my $client = shift;
- my $rec = shift;
- my $class = shift;
-
- OpenILS::Application::Ingest->post_init();
- my $r = OpenILS::Application::Ingest->storage_req( "open-ils.storage.direct.biblio.record_entry.retrieve" => $rec );
-
- for my $fm ($self->method_lookup("open-ils.worm.field_entry.class.xml")->run($r->marc, $class)) {
- $fm->source($rec);
- $client->respond($fm);
- }
- return undef;
-}
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.field_entry.class.record",
- method => "class_all_index_string_record",
- api_level => 1,
- argc => 1,
- stream => 1,
-);
-
-
-sub class_index_string_xml {
- my $self = shift;
- my $client = shift;
- my $xml = shift;
- my $class = shift;
- my $type = shift;
-
- OpenILS::Application::Ingest->post_init();
- $xml = $parser->parse_string($xml) unless (ref $xml);
- return _xpath_to_string( $mods_sheet->transform($xml)->documentElement, $xpathset->{$class}->{$type}->{xpath}, "http://www.loc.gov/mods/", "mods", 1 );
-}
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.class.type.xml",
- method => "class_index_string_xml",
- api_level => 1,
- argc => 1,
-);
-
-sub class_index_string_record {
- my $self = shift;
- my $client = shift;
- my $rec = shift;
- my $class = shift;
- my $type = shift;
-
- OpenILS::Application::Ingest->post_init();
- my $r = OpenILS::Application::Ingest->storage_req( "open-ils.storage.direct.biblio.record_entry.retrieve" => $rec );
-
- my ($d) = $self->method_lookup("open-ils.worm.class.type.xml")->run($r->marc, $class => $type);
- $log->debug("XPath $class->$type for bib rec $rec returns ($d)", DEBUG);
- return $d;
-}
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.class.type.record",
- method => "class_index_string_record",
- api_level => 1,
- argc => 1,
-);
-
-sub xml_xpath {
- my $self = shift;
- my $client = shift;
- my $xml = shift;
- my $xpath = shift;
- my $uri = shift;
- my $prefix = shift;
- my $unique = shift;
-
- OpenILS::Application::Ingest->post_init();
- $xml = $parser->parse_string($xml) unless (ref $xml);
- return _xpath_to_string( $xml->documentElement, $xpath, $uri, $prefix, $unique );
-}
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.xpath.xml",
- method => "xml_xpath",
- api_level => 1,
- argc => 1,
-);
-
-sub record_xpath {
- my $self = shift;
- my $client = shift;
- my $rec = shift;
- my $xpath = shift;
- my $uri = shift;
- my $prefix = shift;
- my $unique = shift;
-
- OpenILS::Application::Ingest->post_init();
- my $r = OpenILS::Application::Ingest->storage_req( "open-ils.storage.direct.biblio.record_entry.retrieve" => $rec );
-
- my ($d) = $self->method_lookup("open-ils.worm.xpath.xml")->run($r->marc, $xpath, $uri, $prefix, $unique );
- $log->debug("XPath [$xpath] bib rec $rec returns ($d)", DEBUG);
- return $d;
-}
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.xpath.record",
- method => "record_xpath",
- api_level => 1,
- argc => 1,
-);
-
-
-# --------------------------------------------------------------------------------
-# MARC Descriptor
-
-package OpenILS::Application::Ingest::Biblio::Leader;
-use base qw/OpenILS::Application::Ingest/;
-use Unicode::Normalize;
-
-our %marc_type_groups = (
- BKS => q/[at]{1}/,
- SER => q/[a]{1}/,
- VIS => q/[gkro]{1}/,
- MIX => q/[p]{1}/,
- MAP => q/[ef]{1}/,
- SCO => q/[cd]{1}/,
- REC => q/[ij]{1}/,
- COM => q/[m]{1}/,
-);
-
-sub _type_re {
- my $re = '^'. join('|', $marc_type_groups{@_}) .'$';
- return qr/$re/;
-}
-
-our %biblio_descriptor_code = (
- item_type => sub { substr($ldr,6,1); },
- item_form =>
- sub {
- if (substr($ldr,6,1) =~ _type_re( qw/MAP VIS/ )) {
- return substr($oo8,29,1);
- } elsif (substr($ldr,6,1) =~ _type_re( qw/BKS SER MIX SCO REC/ )) {
- return substr($oo8,23,1);
- }
- return ' ';
- },
- bib_level => sub { substr($ldr,7,1); },
- control_type => sub { substr($ldr,8,1); },
- char_encoding => sub { substr($ldr,9,1); },
- enc_level => sub { substr($ldr,17,1); },
- cat_form => sub { substr($ldr,18,1); },
- pub_status => sub { substr($ldr,5,1); },
- item_lang => sub { substr($oo8,35,3); },
- lit_form => sub { (substr($ldr,6,1) =~ _type_re('BKS')) ? substr($oo8,33,1) : undef; },
- type_mat => sub { (substr($ldr,6,1) =~ _type_re('VIS')) ? substr($oo8,33,1) : undef; },
- audience => sub { substr($oo8,22,1); },
-);
-
-sub _extract_biblio_descriptors {
- my $xml = shift;
-
- local $ldr = $xml->findvalue('//*[local-name()="leader"]');
- local $oo8 = $xml->findvalue('//*[local-name()="controlfield" and @tag="008"]');
- local $oo7 = $xml->findvalue('//*[local-name()="controlfield" and @tag="007"]');
-
- my $rd_obj = Fieldmapper::metabib::record_descriptor->new;
- for my $rd_field ( keys %biblio_descriptor_code ) {
- $rd_obj->$rd_field( $biblio_descriptor_code{$rd_field}->() );
- }
-
- return $rd_obj;
-}
-
-sub extract_biblio_desc_xml {
- my $self = shift;
- my $client = shift;
- my $xml = shift;
-
- $xml = $parser->parse_string($xml) unless (ref $xml);
-
- return _extract_biblio_descriptors( $xml );
-}
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.biblio_leader.xml",
- method => "extract_biblio_desc_xml",
- api_level => 1,
- argc => 1,
-);
-
-sub extract_biblio_desc_record {
- my $self = shift;
- my $client = shift;
- my $rec = shift;
-
- OpenILS::Application::Ingest->post_init();
- my $r = OpenILS::Application::Ingest->storage_req( "open-ils.storage.direct.biblio.record_entry.retrieve" => $rec );
-
- my ($d) = $self->method_lookup("open-ils.worm.biblio_leader.xml")->run($r->marc);
- $log->debug("Record descriptor for bib rec $rec is ".OpenSRF::Utils::JSON->perl2JSON($d), DEBUG);
- return $d;
-}
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.biblio_leader.record",
- method => "extract_biblio_desc_record",
- api_level => 1,
- argc => 1,
-);
-
-# --------------------------------------------------------------------------------
-# Flat MARC
-
-package OpenILS::Application::Ingest::FlatMARC;
-use base qw/OpenILS::Application::Ingest/;
-use Unicode::Normalize;
-
-
-sub _marcxml_to_full_rows {
-
- my $marcxml = shift;
- my $xmltype = shift || 'metabib';
-
- my $type = "Fieldmapper::${xmltype}::full_rec";
-
- my @ns_list;
-
- my ($root) = $marcxml->findnodes('//*[local-name()="record"]');
-
- for my $tagline ( @{$root->getChildrenByTagName("leader")} ) {
- next unless $tagline;
-
- my $ns = $type->new;
-
- $ns->tag( 'LDR' );
- my $val = $tagline->textContent;
- $val = NFD($val);
- $val =~ s/\pM+//sgo;
- $val =~ s/\pC+//sgo;
- $val =~ s/\W+$//sgo;
- $ns->value( $val );
-
- push @ns_list, $ns;
- }
-
- for my $tagline ( @{$root->getChildrenByTagName("controlfield")} ) {
- next unless $tagline;
-
- my $ns = $type->new;
-
- $ns->tag( $tagline->getAttribute( "tag" ) );
- my $val = $tagline->textContent;
- $val = NFD($val);
- $val =~ s/\pM+//sgo;
- $val =~ s/\pC+//sgo;
- $val =~ s/\W+$//sgo;
- $ns->value( $val );
-
- push @ns_list, $ns;
- }
-
- for my $tagline ( @{$root->getChildrenByTagName("datafield")} ) {
- next unless $tagline;
-
- my $tag = $tagline->getAttribute( "tag" );
- my $ind1 = $tagline->getAttribute( "ind1" );
- my $ind2 = $tagline->getAttribute( "ind2" );
-
- for my $data ( @{$tagline->getChildrenByTagName('subfield')} ) {
- next unless $data;
-
- my $ns = $type->new;
-
- $ns->tag( $tag );
- $ns->ind1( $ind1 );
- $ns->ind2( $ind2 );
- $ns->subfield( $data->getAttribute( "code" ) );
- my $val = $data->textContent;
- $val = NFD($val);
- $val =~ s/\pM+//sgo;
- $val =~ s/\pC+//sgo;
- $val =~ s/\W+$//sgo;
- $ns->value( lc($val) );
-
- push @ns_list, $ns;
- }
- }
-
- $log->debug("Returning ".scalar(@ns_list)." Fieldmapper nodes from $xmltype xml", DEBUG);
- return @ns_list;
-}
-
-sub flat_marc_xml {
- my $self = shift;
- my $client = shift;
- my $xml = shift;
-
- $xml = $parser->parse_string($xml) unless (ref $xml);
-
- my $type = 'metabib';
- $type = 'authority' if ($self->api_name =~ /authority/o);
-
- OpenILS::Application::Ingest->post_init();
-
- $client->respond($_) for (_marcxml_to_full_rows($xml, $type));
- return undef;
-}
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.flat_marc.authority.xml",
- method => "flat_marc_xml",
- api_level => 1,
- argc => 1,
- stream => 1,
-);
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.flat_marc.biblio.xml",
- method => "flat_marc_xml",
- api_level => 1,
- argc => 1,
- stream => 1,
-);
-
-sub flat_marc_record {
- my $self = shift;
- my $client = shift;
- my $rec = shift;
-
- my $type = 'biblio';
- $type = 'authority' if ($self->api_name =~ /authority/o);
-
- OpenILS::Application::Ingest->post_init();
- my $r = OpenILS::Application::Ingest->storage_req( "open-ils.storage.direct.${type}.record_entry.retrieve" => $rec );
-
- $client->respond($_) for ($self->method_lookup("open-ils.worm.flat_marc.$type.xml")->run($r->marc));
- return undef;
-}
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.flat_marc.biblio.record_entry",
- method => "flat_marc_record",
- api_level => 1,
- argc => 1,
- stream => 1,
-);
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.flat_marc.authority.record_entry",
- method => "flat_marc_record",
- api_level => 1,
- argc => 1,
- stream => 1,
-);
-
-
-# --------------------------------------------------------------------------------
-# Fingerprinting
-
-package OpenILS::Application::Ingest::Biblio::Fingerprint;
-use base qw/OpenILS::Application::Ingest/;
-use Unicode::Normalize;
-use OpenSRF::EX qw/:try/;
-
-my @fp_mods_xpath = (
- '//mods:mods/mods:typeOfResource[text()="text"]' => [
- title => {
- xpath => [
- '//mods:mods/mods:titleInfo[mods:title and (@type="uniform")]',
- '//mods:mods/mods:titleInfo[mods:title and (@type="translated")]',
- '//mods:mods/mods:titleInfo[mods:title and (@type="alternative")]',
- '//mods:mods/mods:titleInfo[mods:title and not(@type)]',
- ],
- fixup => sub {
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text = NFD($text);
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text =~ s/\pM+//gso;
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text = lc($text);
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text =~ s/\s+/ /sgo;
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text =~ s/^\s*(.+)\s*$/$1/sgo;
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text =~ s/\b(?:the|an?)\b//sgo;
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text =~ s/\[.[^\]]+\]//sgo;
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text =~ s/\s*[;\/\.]*$//sgo;
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- },
- },
- author => {
- xpath => [
- '//mods:mods/mods:name[mods:role/mods:text/text()="creator" and @type="personal"]/mods:namePart',
- '//mods:mods/mods:name[mods:role/mods:text/text()="creator"]/mods:namePart',
- ],
- fixup => sub {
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text = NFD($text);
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text =~ s/\pM+//gso;
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text = lc($text);
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text =~ s/\s+/ /sgo;
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text =~ s/^\s*(.+)\s*$/$1/sgo;
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text =~ s/,?\s+.*$//sgo;
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- },
- },
- ],
-
- '//mods:mods/mods:relatedItem[@type!="host" and @type!="series"]' => [
- title => {
- xpath => [
- '//mods:mods/mods:relatedItem/mods:titleInfo[mods:title and (@type="uniform")]',
- '//mods:mods/mods:relatedItem/mods:titleInfo[mods:title and (@type="translated")]',
- '//mods:mods/mods:relatedItem/mods:titleInfo[mods:title and (@type="alternative")]',
- '//mods:mods/mods:relatedItem/mods:titleInfo[mods:title and not(@type)]',
- '//mods:mods/mods:titleInfo[mods:title and (@type="uniform")]',
- '//mods:mods/mods:titleInfo[mods:title and (@type="translated")]',
- '//mods:mods/mods:titleInfo[mods:title and (@type="alternative")]',
- '//mods:mods/mods:titleInfo[mods:title and not(@type)]',
- ],
- fixup => sub {
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text = NFD($text);
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text =~ s/\pM+//gso;
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text = lc($text);
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text =~ s/\s+/ /sgo;
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text =~ s/^\s*(.+)\s*$/$1/sgo;
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text =~ s/\b(?:the|an?)\b//sgo;
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text =~ s/\[.[^\]]+\]//sgo;
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text =~ s/\s*[;\/\.]*$//sgo;
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- },
- },
- author => {
- xpath => [
- '//mods:mods/mods:relatedItem/mods:name[mods:role/mods:text/text()="creator" and @type="personal"]/mods:namePart',
- '//mods:mods/mods:relatedItem/mods:name[mods:role/mods:text/text()="creator"]/mods:namePart',
- '//mods:mods/mods:name[mods:role/mods:text/text()="creator" and @type="personal"]/mods:namePart',
- '//mods:mods/mods:name[mods:role/mods:text/text()="creator"]/mods:namePart',
- ],
- fixup => sub {
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text = NFD($text);
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text =~ s/\pM+//gso;
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text = lc($text);
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text =~ s/\s+/ /sgo;
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text =~ s/^\s*(.+)\s*$/$1/sgo;
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text =~ s/,?\s+.*$//sgo;
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- },
- },
- ],
-
-);
-
-push @fp_mods_xpath, '//mods:mods/mods:titleInfo' => $fp_mods_xpath[1];
-
-sub _fp_mods {
- my $mods = shift;
- $mods->setNamespace( "http://www.loc.gov/mods/", "mods", 1 );
-
- my $fp_string = '';
-
- my $match_index = 0;
- my $block_index = 1;
- while ( my $match_xpath = $fp_mods_xpath[$match_index] ) {
- if ( my @nodes = $mods->findnodes( $match_xpath ) ) {
-
- my $block_name_index = 0;
- my $block_value_index = 1;
- my $block = $fp_mods_xpath[$block_index];
- while ( my $part = $$block[$block_value_index] ) {
- local $text;
- for my $xpath ( @{ $part->{xpath} } ) {
- $text = $mods->findvalue( $xpath );
- last if ($text);
- }
-
- $log->debug("Found fingerprint text using $$block[$block_name_index] : [$text]", DEBUG);
-
- if ($text) {
- $$part{fixup}->();
- $log->debug("Fingerprint text after fixup : [$text]", DEBUG);
- $fp_string .= $text;
- }
-
- $block_name_index += 2;
- $block_value_index += 2;
- }
- }
- if ($fp_string) {
- $fp_string =~ s/\W+//gso;
- $log->debug("Fingerprint is [$fp_string]", INFO);;
- return $fp_string;
- }
-
- $match_index += 2;
- $block_index += 2;
- }
- return undef;
-}
-
-sub refingerprint_bibrec {
- my $self = shift;
- my $client = shift;
- my $rec = shift;
-
- my $commit = 0;
- if (!OpenILS::Application::Ingest->in_transaction) {
- OpenILS::Application::Ingest->begin_transaction($client) || throw OpenSRF::EX::PANIC ("Couldn't BEGIN transaction!");
- $commit = 1;
- }
-
- my $success = 1;
- try {
- my $bibs = OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.biblio.record_entry.search.id.atomic', $rec );
- for my $b (@$bibs) {
- my ($fp) = $self->method_lookup( 'open-ils.worm.fingerprint.marc' )->run( $b->marc );
-
- if ($b->fingerprint ne $fp->{fingerprint} || $b->quality != $fp->{quality}) {
-
- $log->debug("Updating ".$b->id." with fingerprint [$fp->{fingerprint}], quality [$fp->{quality}]", INFO);;
-
- OpenILS::Application::Ingest->storage_req(
- 'open-ils.storage.direct.biblio.record_entry.remote_update',
- { id => $b->id },
- { fingerprint => $fp->{fingerprint},
- quality => $fp->{quality} }
- );
-
- if ($self->api_name !~ /nomap/o) {
- my $old_source_map = OpenILS::Application::Ingest->storage_req(
- 'open-ils.storage.direct.metabib.metarecord_source_map.search.source.atomic',
- $b->id
- );
-
- my $old_mrid;
- if (ref($old_source_map) and @$old_source_map) {
- for my $m (@$old_source_map) {
- $old_mrid = $m->metarecord;
- OpenILS::Application::Ingest->storage_req(
- 'open-ils.storage.direct.metabib.metarecord_source_map.delete',
- $m->id
- );
- }
- }
-
- my $old_sm = OpenILS::Application::Ingest->storage_req(
- 'open-ils.storage.direct.metabib.metarecord_source_map.search.atomic',
- { metarecord => $old_mrid }
- ) if ($old_mrid);
-
- if (ref($old_sm) and @$old_sm == 0) {
- OpenILS::Application::Ingest->storage_req(
- 'open-ils.storage.direct.metabib.metarecord.delete',
- $old_mrid
- );
- }
-
- my $mr = OpenILS::Application::Ingest->storage_req(
- 'open-ils.storage.direct.metabib.metarecord.search.fingerprint.atomic',
- { fingerprint => $fp->{fingerprint} }
- )->[0];
-
- unless ($mr) {
- $mr = Fieldmapper::metabib::metarecord->new;
- $mr->fingerprint( $fp->{fingerprint} );
- $mr->master_record( $b->id );
- $mr->id( OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.metabib.metarecord.create', $mr) );
- }
-
- my $mr_map = Fieldmapper::metabib::metarecord_source_map->new;
- $mr_map->metarecord( $mr->id );
- $mr_map->source( $b->id );
- OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.metabib.metarecord_source_map.create', $mr_map );
-
- }
- }
- $client->respond($b->id);
- }
-
- } otherwise {
- $log->debug('Fingerprinting failed : '.shift(), ERROR);
- $success = 0;
- };
-
- OpenILS::Application::Ingest->commit_transaction if ($commit && $success);
- OpenILS::Application::Ingest->rollback_transaction if ($commit && !$success);
- return undef;
-}
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.fingerprint.record.update",
- method => "refingerprint_bibrec",
- api_level => 1,
- argc => 1,
- stream => 1,
-);
-
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.fingerprint.record.update.nomap",
- method => "refingerprint_bibrec",
- api_level => 1,
- argc => 1,
-);
-
-=comment
-
-sub fingerprint_bibrec {
- my $self = shift;
- my $client = shift;
- my $rec = shift;
-
- OpenILS::Application::Ingest->post_init();
- my $r = OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.biblio.record_entry.retrieve' => $rec );
-
- my ($fp) = $self->method_lookup('open-ils.worm.fingerprint.marc')->run($r->marc);
- $log->debug("Returning [$fp] as fingerprint for record $rec", INFO);
- return $fp;
-
-}
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.fingerprint.record",
- method => "fingerprint_bibrec",
- api_level => 0,
- argc => 1,
-);
-
-
-sub fingerprint_mods {
- my $self = shift;
- my $client = shift;
- my $xml = shift;
-
- OpenILS::Application::Ingest->post_init();
- my $mods = $parser->parse_string($xml)->documentElement;
-
- return _fp_mods( $mods );
-}
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.fingerprint.mods",
- method => "fingerprint_mods",
- api_level => 1,
- argc => 1,
-);
-
-sub fingerprint_marc {
- my $self = shift;
- my $client = shift;
- my $xml = shift;
-
- $xml = $parser->parse_string($xml) unless (ref $xml);
-
- OpenILS::Application::Ingest->post_init();
- my $fp = _fp_mods( $mods_sheet->transform($xml)->documentElement );
- $log->debug("Returning [$fp] as fingerprint", INFO);
- return $fp;
-}
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.fingerprint.marc",
- method => "fingerprint_marc",
- api_level => 1,
- argc => 1,
-);
-
-
-=cut
-
-sub biblio_fingerprint_record {
- my $self = shift;
- my $client = shift;
- my $rec = shift;
-
- OpenILS::Application::Ingest->post_init();
-
- my $marc = OpenILS::Application::Ingest
- ->storage_req( 'open-ils.storage.direct.biblio.record_entry.retrieve' => $rec )
- ->marc;
-
- my ($fp) = $self->method_lookup('open-ils.worm.fingerprint.marc')->run($marc);
- $log->debug("Returning [$fp] as fingerprint for record $rec", INFO);
- return $fp;
-}
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.fingerprint.record",
- method => "biblio_fingerprint_record",
- api_level => 1,
- argc => 1,
-);
-
-our $fp_script;
-sub biblio_fingerprint {
- my $self = shift;
- my $client = shift;
- my $marc = shift;
-
- OpenILS::Application::Ingest->post_init();
-
- $marc = $parser->parse_string($marc) unless (ref $marc);
-
- my $mods = OpenILS::Application::Ingest::entityize(
- $mods_sheet
- ->transform( $marc )
- ->documentElement
- ->toString,
- 'D'
- );
-
- $marc = OpenILS::Application::Ingest::entityize( $marc->documentElement->toString => 'D' );
-
- warn $marc;
- $log->internal("Got MARC [$marc]");
- $log->internal("Created MODS [$mods]");
-
- if(!$fp_script) {
- my @pfx = ( "apps", "open-ils.storage","app_settings" );
- my $conf = OpenSRF::Utils::SettingsClient->new;
-
- my $libs = $conf->config_value(@pfx, 'script_path');
- my $script_file = $conf->config_value(@pfx, 'scripts', 'biblio_fingerprint');
- my $script_libs = (ref($libs)) ? $libs : [$libs];
-
- $log->debug("Loading script $script_file for biblio fingerprinting...");
-
- $fp_script = new OpenILS::Utils::ScriptRunner
- ( file => $script_file,
- paths => $script_libs,
- reset_count => 1000 );
- }
-
- $log->debug("Applying environment for biblio fingerprinting...");
-
- my $env = {marc => $marc, mods => $mods};
- #my $res = {fingerprint => '', quality => '0'};
-
- $fp_script->insert('environment' => $env);
- #$fp_script->insert('result' => $res);
-
- $log->debug("Running script for biblio fingerprinting...");
-
- my $res = $fp_script->run || ($log->error( "Fingerprint script died! $@" ) && return 0);
-
- $log->debug("Script for biblio fingerprinting completed successfully...");
-
- return $res;
-}
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.fingerprint.marc",
- method => "biblio_fingerprint",
- api_level => 1,
- argc => 1,
-);
-
-# --------------------------------------------------------------------------------
-
-1;
-
-__END__
-my $in_xact;
-my $begin;
-my $commit;
-my $rollback;
-my $lookup;
-my $update_entry;
-my $mr_lookup;
-my $mr_update;
-my $mr_create;
-my $create_source_map;
-my $sm_lookup;
-my $rm_old_rd;
-my $rm_old_sm;
-my $rm_old_fr;
-my $rm_old_tr;
-my $rm_old_ar;
-my $rm_old_sr;
-my $rm_old_kr;
-my $rm_old_ser;
-
-my $fr_create;
-my $rd_create;
-my $create = {};
-
-my %descriptor_code = (
- item_type => 'substr($ldr,6,1)',
- item_form => '(substr($ldr,6,1) =~ /^(?:f|g|i|m|o|p|r)$/) ? substr($oo8,29,1) : substr($oo8,23,1)',
- bib_level => 'substr($ldr,7,1)',
- control_type => 'substr($ldr,8,1)',
- char_encoding => 'substr($ldr,9,1)',
- enc_level => 'substr($ldr,17,1)',
- cat_form => 'substr($ldr,18,1)',
- pub_status => 'substr($ldr,5,1)',
- item_lang => 'substr($oo8,35,3)',
- #lit_form => '(substr($ldr,6,1) =~ /^(?:f|g|i|m|o|p|r)$/) ? substr($oo8,33,1) : "0"',
- audience => 'substr($oo8,22,1)',
-);
-
-sub wormize {
-
- my $self = shift;
- my $client = shift;
- my @docids = @_;
-
- my $no_map = 0;
- if ($self->api_name =~ /no_map/o) {
- $no_map = 1;
- }
-
- $in_xact = $self->method_lookup( 'open-ils.storage.transaction.current')
- unless ($in_xact);
- $begin = $self->method_lookup( 'open-ils.storage.transaction.begin')
- unless ($begin);
- $commit = $self->method_lookup( 'open-ils.storage.transaction.commit')
- unless ($commit);
- $rollback = $self->method_lookup( 'open-ils.storage.transaction.rollback')
- unless ($rollback);
- $sm_lookup = $self->method_lookup('open-ils.storage.direct.metabib.metarecord_source_map.search.source')
- unless ($sm_lookup);
- $mr_lookup = $self->method_lookup('open-ils.storage.direct.metabib.metarecord.search.fingerprint')
- unless ($mr_lookup);
- $mr_update = $self->method_lookup('open-ils.storage.direct.metabib.metarecord.batch.update')
- unless ($mr_update);
- $lookup = $self->method_lookup('open-ils.storage.direct.biblio.record_entry.batch.retrieve')
- unless ($lookup);
- $update_entry = $self->method_lookup('open-ils.storage.direct.biblio.record_entry.batch.update')
- unless ($update_entry);
- $rm_old_sm = $self->method_lookup( 'open-ils.storage.direct.metabib.metarecord_source_map.mass_delete')
- unless ($rm_old_sm);
- $rm_old_rd = $self->method_lookup( 'open-ils.storage.direct.metabib.record_descriptor.mass_delete')
- unless ($rm_old_rd);
- $rm_old_fr = $self->method_lookup( 'open-ils.storage.direct.metabib.full_rec.mass_delete')
- unless ($rm_old_fr);
- $rm_old_tr = $self->method_lookup( 'open-ils.storage.direct.metabib.title_field_entry.mass_delete')
- unless ($rm_old_tr);
- $rm_old_ar = $self->method_lookup( 'open-ils.storage.direct.metabib.author_field_entry.mass_delete')
- unless ($rm_old_ar);
- $rm_old_sr = $self->method_lookup( 'open-ils.storage.direct.metabib.subject_field_entry.mass_delete')
- unless ($rm_old_sr);
- $rm_old_kr = $self->method_lookup( 'open-ils.storage.direct.metabib.keyword_field_entry.mass_delete')
- unless ($rm_old_kr);
- $rm_old_ser = $self->method_lookup( 'open-ils.storage.direct.metabib.series_field_entry.mass_delete')
- unless ($rm_old_ser);
- $mr_create = $self->method_lookup('open-ils.storage.direct.metabib.metarecord.create')
- unless ($mr_create);
- $create_source_map = $self->method_lookup('open-ils.storage.direct.metabib.metarecord_source_map.batch.create')
- unless ($create_source_map);
- $rd_create = $self->method_lookup( 'open-ils.storage.direct.metabib.record_descriptor.batch.create')
- unless ($rd_create);
- $fr_create = $self->method_lookup( 'open-ils.storage.direct.metabib.full_rec.batch.create')
- unless ($fr_create);
- $$create{title} = $self->method_lookup( 'open-ils.storage.direct.metabib.title_field_entry.batch.create')
- unless ($$create{title});
- $$create{author} = $self->method_lookup( 'open-ils.storage.direct.metabib.author_field_entry.batch.create')
- unless ($$create{author});
- $$create{subject} = $self->method_lookup( 'open-ils.storage.direct.metabib.subject_field_entry.batch.create')
- unless ($$create{subject});
- $$create{keyword} = $self->method_lookup( 'open-ils.storage.direct.metabib.keyword_field_entry.batch.create')
- unless ($$create{keyword});
- $$create{series} = $self->method_lookup( 'open-ils.storage.direct.metabib.series_field_entry.batch.create')
- unless ($$create{series});
-
-
- my ($outer_xact) = $in_xact->run;
- try {
- unless ($outer_xact) {
- $log->debug("Ingest isn't inside a transaction, starting one now.", INFO);
- my ($r) = $begin->run($client);
- unless (defined $r and $r) {
- $rollback->run;
- throw OpenSRF::EX::PANIC ("Couldn't BEGIN transaction!")
- }
- }
- } catch Error with {
- throw OpenSRF::EX::PANIC ("Ingest Couldn't BEGIN transaction!")
- };
-
- my @source_maps;
- my @entry_list;
- my @mr_list;
- my @rd_list;
- my @ns_list;
- my @mods_data;
- my $ret = 0;
- for my $entry ( $lookup->run(@docids) ) {
- # step -1: grab the doc from storage
- next unless ($entry);
-
- if(!$mods_sheet) {
- my $xslt_doc = $parser->parse_file(
- OpenSRF::Utils::SettingsClient->new->config_value(dirs => 'xsl') . "/MARC21slim2MODS.xsl");
- $mods_sheet = $xslt->parse_stylesheet( $xslt_doc );
- }
-
- my $xml = $entry->marc;
- my $docid = $entry->id;
- my $marcdoc = $parser->parse_string($xml);
- my $modsdoc = $mods_sheet->transform($marcdoc);
-
- my $mods = $modsdoc->documentElement;
- $mods->setNamespace( "http://www.loc.gov/mods/", "mods", 1 );
-
- $entry->fingerprint( fingerprint_mods( $mods ) );
- push @entry_list, $entry;
-
- $log->debug("Fingerprint for Record Entry ".$docid." is [".$entry->fingerprint."]", INFO);
-
- unless ($no_map) {
- my ($mr) = $mr_lookup->run( $entry->fingerprint );
- if (!$mr || !@$mr) {
- $log->debug("No metarecord found for fingerprint [".$entry->fingerprint."]; Creating a new one", INFO);
- $mr = new Fieldmapper::metabib::metarecord;
- $mr->fingerprint( $entry->fingerprint );
- $mr->master_record( $entry->id );
- my ($new_mr) = $mr_create->run($mr);
- $mr->id($new_mr);
- unless (defined $mr) {
- throw OpenSRF::EX::PANIC ("Couldn't run open-ils.storage.direct.metabib.metarecord.create!")
- }
- } else {
- $log->debug("Retrieved metarecord, id is ".$mr->id, INFO);
- $mr->mods('');
- push @mr_list, $mr;
- }
-
- my $sm = new Fieldmapper::metabib::metarecord_source_map;
- $sm->metarecord( $mr->id );
- $sm->source( $entry->id );
- push @source_maps, $sm;
- }
-
- my $ldr = $marcdoc->documentElement->getChildrenByTagName('leader')->pop->textContent;
- my $oo8 = $marcdoc->documentElement->findvalue('//*[local-name()="controlfield" and @tag="008"]');
-
- my $rd_obj = Fieldmapper::metabib::record_descriptor->new;
- for my $rd_field ( keys %descriptor_code ) {
- $rd_obj->$rd_field( eval "$descriptor_code{$rd_field};" );
- }
- $rd_obj->record( $docid );
- push @rd_list, $rd_obj;
-
- push @mods_data, { $docid => $self->modsdoc_to_values( $mods ) };
-
- # step 2: build the KOHA rows
- my @tmp_list = _marcxml_to_full_rows( $marcdoc );
- $_->record( $docid ) for (@tmp_list);
- push @ns_list, @tmp_list;
-
- $ret++;
-
- last unless ($self->api_name =~ /batch$/o);
- }
-
- $rm_old_rd->run( { record => \@docids } );
- $rm_old_fr->run( { record => \@docids } );
- $rm_old_sm->run( { source => \@docids } ) unless ($no_map);
- $rm_old_tr->run( { source => \@docids } );
- $rm_old_ar->run( { source => \@docids } );
- $rm_old_sr->run( { source => \@docids } );
- $rm_old_kr->run( { source => \@docids } );
- $rm_old_ser->run( { source => \@docids } );
-
- unless ($no_map) {
- my ($sm) = $create_source_map->run(@source_maps);
- unless (defined $sm) {
- throw OpenSRF::EX::PANIC ("Couldn't run open-ils.storage.direct.metabib.metarecord_source_map.batch.create!")
- }
- my ($mr) = $mr_update->run(@mr_list);
- unless (defined $mr) {
- throw OpenSRF::EX::PANIC ("Couldn't run open-ils.storage.direct.metabib.metarecord.batch.update!")
- }
- }
-
- my ($re) = $update_entry->run(@entry_list);
- unless (defined $re) {
- throw OpenSRF::EX::PANIC ("Couldn't run open-ils.storage.direct.biblio.record_entry.batch.update!")
- }
-
- my ($rd) = $rd_create->run(@rd_list);
- unless (defined $rd) {
- throw OpenSRF::EX::PANIC ("Couldn't run open-ils.storage.direct.metabib.record_descriptor.batch.create!")
- }
-
- my ($fr) = $fr_create->run(@ns_list);
- unless (defined $fr) {
- throw OpenSRF::EX::PANIC ("Couldn't run open-ils.storage.direct.metabib.full_rec.batch.create!")
- }
-
- # step 5: insert the new metadata
- for my $class ( qw/title author subject keyword series/ ) {
- my @md_list = ();
- for my $doc ( @mods_data ) {
- my ($did) = keys %$doc;
- my ($data) = values %$doc;
-
- my $fm_constructor = "Fieldmapper::metabib::${class}_field_entry";
- for my $row ( keys %{ $$data{$class} } ) {
- next unless (exists $$data{$class}{$row});
- next unless ($$data{$class}{$row}{value});
- my $fm_obj = $fm_constructor->new;
- $fm_obj->value( $$data{$class}{$row}{value} );
- $fm_obj->field( $$data{$class}{$row}{field_id} );
- $fm_obj->source( $did );
- $log->debug("$class entry: ".$fm_obj->source." => ".$fm_obj->field." : ".$fm_obj->value, DEBUG);
-
- push @md_list, $fm_obj;
- }
- }
-
- my ($cr) = $$create{$class}->run(@md_list);
- unless (defined $cr) {
- throw OpenSRF::EX::PANIC ("Couldn't run open-ils.storage.direct.metabib.${class}_field_entry.batch.create!")
- }
- }
-
- unless ($outer_xact) {
- $log->debug("Commiting transaction started by the Ingest.", INFO);
- my ($c) = $commit->run;
- unless (defined $c and $c) {
- $rollback->run;
- throw OpenSRF::EX::PANIC ("Couldn't COMMIT changes!")
- }
- }
-
- return $ret;
-}
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.wormize",
- method => "wormize",
- api_level => 1,
- argc => 1,
-);
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.wormize.no_map",
- method => "wormize",
- api_level => 1,
- argc => 1,
-);
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.wormize.batch",
- method => "wormize",
- api_level => 1,
- argc => 1,
-);
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.wormize.no_map.batch",
- method => "wormize",
- api_level => 1,
- argc => 1,
-);
-
-
-my $ain_xact;
-my $abegin;
-my $acommit;
-my $arollback;
-my $alookup;
-my $aupdate_entry;
-my $amr_lookup;
-my $amr_update;
-my $amr_create;
-my $acreate_source_map;
-my $asm_lookup;
-my $arm_old_rd;
-my $arm_old_sm;
-my $arm_old_fr;
-my $arm_old_tr;
-my $arm_old_ar;
-my $arm_old_sr;
-my $arm_old_kr;
-my $arm_old_ser;
-
-my $afr_create;
-my $ard_create;
-my $acreate = {};
-
-sub authority_wormize {
-
- my $self = shift;
- my $client = shift;
- my @docids = @_;
-
- my $no_map = 0;
- if ($self->api_name =~ /no_map/o) {
- $no_map = 1;
- }
-
- $in_xact = $self->method_lookup( 'open-ils.storage.transaction.current')
- unless ($in_xact);
- $begin = $self->method_lookup( 'open-ils.storage.transaction.begin')
- unless ($begin);
- $commit = $self->method_lookup( 'open-ils.storage.transaction.commit')
- unless ($commit);
- $rollback = $self->method_lookup( 'open-ils.storage.transaction.rollback')
- unless ($rollback);
- $alookup = $self->method_lookup('open-ils.storage.direct.authority.record_entry.batch.retrieve')
- unless ($alookup);
- $aupdate_entry = $self->method_lookup('open-ils.storage.direct.authority.record_entry.batch.update')
- unless ($aupdate_entry);
- $arm_old_rd = $self->method_lookup( 'open-ils.storage.direct.authority.record_descriptor.mass_delete')
- unless ($arm_old_rd);
- $arm_old_fr = $self->method_lookup( 'open-ils.storage.direct.authority.full_rec.mass_delete')
- unless ($arm_old_fr);
- $ard_create = $self->method_lookup( 'open-ils.storage.direct.authority.record_descriptor.batch.create')
- unless ($ard_create);
- $afr_create = $self->method_lookup( 'open-ils.storage.direct.authority.full_rec.batch.create')
- unless ($afr_create);
-
-
- my ($outer_xact) = $in_xact->run;
- try {
- unless ($outer_xact) {
- $log->debug("Ingest isn't inside a transaction, starting one now.", INFO);
- my ($r) = $begin->run($client);
- unless (defined $r and $r) {
- $rollback->run;
- throw OpenSRF::EX::PANIC ("Couldn't BEGIN transaction!")
- }
- }
- } catch Error with {
- throw OpenSRF::EX::PANIC ("Ingest Couldn't BEGIN transaction!")
- };
-
- my @source_maps;
- my @entry_list;
- my @mr_list;
- my @rd_list;
- my @ns_list;
- my @mads_data;
- my $ret = 0;
- for my $entry ( $lookup->run(@docids) ) {
- # step -1: grab the doc from storage
- next unless ($entry);
-
- #if(!$mads_sheet) {
- # my $xslt_doc = $parser->parse_file(
- # OpenSRF::Utils::SettingsClient->new->config_value(dirs => 'xsl') . "/MARC21slim2MODS.xsl");
- # $mads_sheet = $xslt->parse_stylesheet( $xslt_doc );
- #}
-
- my $xml = $entry->marc;
- my $docid = $entry->id;
- my $marcdoc = $parser->parse_string($xml);
- #my $madsdoc = $mads_sheet->transform($marcdoc);
-
- #my $mads = $madsdoc->documentElement;
- #$mads->setNamespace( "http://www.loc.gov/mads/", "mads", 1 );
-
- push @entry_list, $entry;
-
- my $ldr = $marcdoc->documentElement->getChildrenByTagName('leader')->pop->textContent;
- my $oo8 = $marcdoc->documentElement->findvalue('//*[local-name()="controlfield" and @tag="008"]');
-
- my $rd_obj = Fieldmapper::authority::record_descriptor->new;
- for my $rd_field ( keys %descriptor_code ) {
- $rd_obj->$rd_field( eval "$descriptor_code{$rd_field};" );
- }
- $rd_obj->record( $docid );
- push @rd_list, $rd_obj;
-
- # step 2: build the KOHA rows
- my @tmp_list = _marcxml_to_full_rows( $marcdoc, 'Fieldmapper::authority::full_rec' );
- $_->record( $docid ) for (@tmp_list);
- push @ns_list, @tmp_list;
-
- $ret++;
-
- last unless ($self->api_name =~ /batch$/o);
- }
-
- $arm_old_rd->run( { record => \@docids } );
- $arm_old_fr->run( { record => \@docids } );
-
- my ($rd) = $ard_create->run(@rd_list);
- unless (defined $rd) {
- throw OpenSRF::EX::PANIC ("Couldn't run open-ils.storage.direct.authority.record_descriptor.batch.create!")
- }
-
- my ($fr) = $fr_create->run(@ns_list);
- unless (defined $fr) {
- throw OpenSRF::EX::PANIC ("Couldn't run open-ils.storage.direct.authority.full_rec.batch.create!")
- }
-
- unless ($outer_xact) {
- $log->debug("Commiting transaction started by Ingest.", INFO);
- my ($c) = $commit->run;
- unless (defined $c and $c) {
- $rollback->run;
- throw OpenSRF::EX::PANIC ("Couldn't COMMIT changes!")
- }
- }
-
- return $ret;
-}
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.authortiy.wormize",
- method => "wormize",
- api_level => 1,
- argc => 1,
-);
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.authority.wormize.batch",
- method => "wormize",
- api_level => 1,
- argc => 1,
-);
-
-
-# --------------------------------------------------------------------------------
-
-
-sub _marcxml_to_full_rows {
-
- my $marcxml = shift;
- my $type = shift || 'Fieldmapper::metabib::full_rec';
-
- my @ns_list;
-
- my $root = $marcxml->documentElement;
-
- for my $tagline ( @{$root->getChildrenByTagName("leader")} ) {
- next unless $tagline;
-
- my $ns = new Fieldmapper::metabib::full_rec;
-
- $ns->tag( 'LDR' );
- my $val = NFD($tagline->textContent);
- $val =~ s/(\pM+)//gso;
- $ns->value( $val );
-
- push @ns_list, $ns;
- }
-
- for my $tagline ( @{$root->getChildrenByTagName("controlfield")} ) {
- next unless $tagline;
-
- my $ns = new Fieldmapper::metabib::full_rec;
-
- $ns->tag( $tagline->getAttribute( "tag" ) );
- my $val = NFD($tagline->textContent);
- $val =~ s/(\pM+)//gso;
- $ns->value( $val );
-
- push @ns_list, $ns;
- }
-
- for my $tagline ( @{$root->getChildrenByTagName("datafield")} ) {
- next unless $tagline;
-
- my $tag = $tagline->getAttribute( "tag" );
- my $ind1 = $tagline->getAttribute( "ind1" );
- my $ind2 = $tagline->getAttribute( "ind2" );
-
- for my $data ( $tagline->childNodes ) {
- next unless $data;
-
- my $ns = $type->new;
-
- $ns->tag( $tag );
- $ns->ind1( $ind1 );
- $ns->ind2( $ind2 );
- $ns->subfield( $data->getAttribute( "code" ) );
- my $val = NFD($data->textContent);
- $val =~ s/(\pM+)//gso;
- $ns->value( lc($val) );
-
- push @ns_list, $ns;
- }
- }
- return @ns_list;
-}
-
-sub _get_field_value {
-
- my( $root, $xpath ) = @_;
-
- my $string = "";
-
- # grab the set of matching nodes
- my @nodes = $root->findnodes( $xpath );
- for my $value (@nodes) {
-
- # grab all children of the node
- my @children = $value->childNodes();
- for my $child (@children) {
-
- # add the childs content to the growing buffer
- my $content = quotemeta($child->textContent);
- next if ($string =~ /$content/); # uniquify the values
- $string .= $child->textContent . " ";
- }
- if( ! @children ) {
- $string .= $value->textContent . " ";
- }
- }
- $string = NFD($string);
- $string =~ s/(\pM)//gso;
- return lc($string);
-}
-
-
-sub modsdoc_to_values {
- my( $self, $mods ) = @_;
- my $data = {};
- for my $class (keys %$xpathset) {
- $data->{$class} = {};
- for my $type (keys %{$xpathset->{$class}}) {
- $data->{$class}->{$type} = {};
- $data->{$class}->{$type}->{field_id} = $xpathset->{$class}->{$type}->{id};
- }
- }
- return $data;
-}
-
-
-1;
-
-
throw OpenSRF::EX::PANIC ( "FAILURE LOADING Publisher! : $@" );
}
- OpenILS::Application::WoRM->use;
- if ($@) {
- $log->debug("FAILURE LOADING WORM! $@", ERROR);
- throw OpenSRF::EX::PANIC ( "FAILURE LOADING WoRM! : $@" );
- }
-
$log->debug("We seem to be OK...",DEBUG);
}
);
if (OpenILS::Application::Storage::CDBI->db_Main()) {
- #OpenILS::Application::Storage::WORM->child_init();
- OpenILS::Application::WoRM->child_init();
$log->debug("Success initializing driver!", DEBUG);
return 1;
}
+
$log->debug("FAILURE initializing driver!", ERROR);
return 0;
}
+++ /dev/null
-package OpenILS::Application::Storage::WORM;
-use base qw/OpenILS::Application::Storage/;
-use strict; use warnings;
-
-use Unicode::Normalize;
-use OpenSRF::EX qw/:try/;
-
-use OpenSRF::Utils::SettingsClient;
-use OpenSRF::Utils::Logger qw/:level/;
-my $log = 'OpenSRF::Utils::Logger';
-
-use OpenILS::Utils::FlatXML;
-use OpenILS::Utils::Fieldmapper;
-use OpenSRF::Utils::JSON;
-
-use XML::LibXML;
-use XML::LibXSLT;
-use Time::HiRes qw(time);
-
-my $xml_util = OpenILS::Utils::FlatXML->new();
-
-my $parser = XML::LibXML->new();
-my $xslt = XML::LibXSLT->new();
-my $mods_sheet;
-my $mads_sheet;
-
-use open qw/:utf8/;
-
-my $xpathset = {};
-
-sub child_init {
- my $meth = __PACKAGE__->method_lookup('open-ils.storage.direct.config.metabib_field.retrieve.all');
- for my $f ($meth->run) {
- $xpathset->{ $f->field_class }->{ $f->name }->{xpath} = $f->xpath;
- $xpathset->{ $f->field_class }->{ $f->name }->{id} = $f->id;
- $log->debug("Loaded XPath from DB: ".$f->field_class." => ".$f->name." : ".$f->xpath, DEBUG);
- }
-}
-
-# --------------------------------------------------------------------------------
-# Fingerprinting
-
-# Fingerprint recipe table, consumed two elements at a time by
-# fingerprint_mods():
-#
-#   even index : an XPath that decides whether the recipe applies
-#   odd index  : an array ref of (part name => spec) pairs, where each spec has
-#                  xpath => candidate XPaths, tried in order until one yields text
-#                  fixup => Perl source, run with string eval, that normalizes
-#                           the lexical $text in place
-#
-# The fixup strings are code, not comments: do not edit them casually.
-my @fp_mods_xpath = (
-# Recipe 1: records whose typeOfResource is "text".
- '//mods:mods/mods:typeOfResource[text()="text"]' => [
- title => {
- xpath => [
- '//mods:mods/mods:titleInfo[mods:title and (@type="uniform")]',
- '//mods:mods/mods:titleInfo[mods:title and (@type="translated")]',
- '//mods:mods/mods:titleInfo[mods:title and (@type="alternative")]',
- '//mods:mods/mods:titleInfo[mods:title and not(@type)]',
- ],
- fixup => '
- do {
- $text = lc(NFD($text));
- $text =~ s/\pM+//gso;
- $text =~ s/\s+/ /sgo;
- $text =~ s/^\s*(.+)\s*$/$1/sgo;
- $text =~ s/\b(?:the|an?)\b//sgo;
- $text =~ s/\[.[^\]]+\]//sgo;
- $text =~ s/\s*[;\/\.]*$//sgo;
- };
- ',
- },
- author => {
- xpath => [
- '//mods:mods/mods:name[mods:role/mods:text/text()="creator" and @type="personal"]/mods:namePart',
- '//mods:mods/mods:name[mods:role/mods:text/text()="creator"]/mods:namePart',
- ],
- fixup => '
- do {
- $text = lc(NFD($text));
- $text =~ s/\pM+//gso;
- $text =~ s/\s+/ /sgo;
- $text =~ s/^\s*(.+)\s*$/$1/sgo;
- $text =~ s/,?\s+.*$//sgo;
- $text =~ s/\pM+//gso;
- };
- ',
- },
- ],
-
-# Recipe 2: records with a relatedItem that is neither "host" nor "series";
-# relatedItem titles/names are tried before the record's own.
- '//mods:mods/mods:relatedItem[@type!="host" and @type!="series"]' => [
- title => {
- xpath => [
- '//mods:mods/mods:relatedItem/mods:titleInfo[mods:title and (@type="uniform")]',
- '//mods:mods/mods:relatedItem/mods:titleInfo[mods:title and (@type="translated")]',
- '//mods:mods/mods:relatedItem/mods:titleInfo[mods:title and (@type="alternative")]',
- '//mods:mods/mods:relatedItem/mods:titleInfo[mods:title and not(@type)]',
- '//mods:mods/mods:titleInfo[mods:title and (@type="uniform")]',
- '//mods:mods/mods:titleInfo[mods:title and (@type="translated")]',
- '//mods:mods/mods:titleInfo[mods:title and (@type="alternative")]',
- '//mods:mods/mods:titleInfo[mods:title and not(@type)]',
- ],
- fixup => '
- do {
- $text = lc(NFD($text));
- $text =~ s/\pM+//gso;
- $text =~ s/\s+/ /sgo;
- $text =~ s/^\s*(.+)\s*$/$1/sgo;
- $text =~ s/\b(?:the|an?)\b//sgo;
- $text =~ s/\[.[^\]]+\]//sgo;
- $text =~ s/\s*[;\/\.]*$//sgo;
- $text =~ s/\pM+//gso;
- };
- ',
- },
- author => {
- xpath => [
- '//mods:mods/mods:relatedItem/mods:name[mods:role/mods:text/text()="creator" and @type="personal"]/mods:namePart',
- '//mods:mods/mods:relatedItem/mods:name[mods:role/mods:text/text()="creator"]/mods:namePart',
- '//mods:mods/mods:name[mods:role/mods:text/text()="creator" and @type="personal"]/mods:namePart',
- '//mods:mods/mods:name[mods:role/mods:text/text()="creator"]/mods:namePart',
- ],
- fixup => '
- do {
- $text = lc(NFD($text));
- $text =~ s/\pM+//gso;
- $text =~ s/\s+/ /sgo;
- $text =~ s/^\s*(.+)\s*$/$1/sgo;
- $text =~ s/,?\s+.*$//sgo;
- $text =~ s/\pM+//gso;
- };
- ',
- },
- ],
-
-);
-
-# Recipe 3 (fallback): any record with a titleInfo reuses recipe 1's part
-# specs (element 1 of the table, shared by reference).
-push @fp_mods_xpath, '//mods:mods/mods:titleInfo' => $fp_mods_xpath[1];
-
-# Build the fingerprint string for a MODS document element.
-#
-# Walks @fp_mods_xpath as (match XPath, recipe) pairs. For each pair whose
-# match XPath selects at least one node, every part of the recipe contributes
-# the first non-empty value found by its XPath list, normalized by the part's
-# fixup code. The first pair that produces any text wins.
-#
-# Param:   $mods - node object supporting findnodes() and findvalue()
-# Returns: the concatenated text with all non-word characters removed, or
-#          undef when no recipe produced any text.
-sub fingerprint_mods {
-	my $mods = shift;
-
-	my $fp_string = '';
-
-	# The table is a flat list: even slots hold match XPaths, odd slots recipes.
-	my $match_index = 0;
-	my $block_index = 1;
-	while ( my $match_xpath = $fp_mods_xpath[$match_index] ) {
-		if ( my @nodes = $mods->findnodes( $match_xpath ) ) {
-
-			# A recipe is itself a flat (name => spec) list, walked the same way.
-			my $block_name_index = 0;
-			my $block_value_index = 1;
-			my $block = $fp_mods_xpath[$block_index];
-			while ( my $part = $$block[$block_value_index] ) {
-				my $text;
-				for my $xpath ( @{ $part->{xpath} } ) {
-					$text = $mods->findvalue( $xpath );
-					last if ($text);
-				}
-
-				$log->debug("Found fingerprint text using $$block[$block_name_index] : [$text]", DEBUG);
-
-				if ($text) {
-					# The fixup is Perl source that rewrites $text in place.
-					eval $$part{fixup};
-					# A fixup that fails to compile or dies would otherwise go
-					# unnoticed and leave un-normalized text in the fingerprint.
-					$log->debug("Fingerprint fixup for $$block[$block_name_index] failed: $@", ERROR) if ($@);
-					$fp_string .= $text;
-				}
-
-				$block_name_index += 2;
-				$block_value_index += 2;
-			}
-		}
-		if ($fp_string) {
-			$fp_string =~ s/\W+//gso;
-			$log->debug("Fingerprint is [$fp_string]", INFO);;
-			return $fp_string;
-		}
-
-		$match_index += 2;
-		$block_index += 2;
-	}
-	return undef;
-}
-
-
-
-# --------------------------------------------------------------------------------
-
-# File-scoped cache of storage method handles. wormize() fills each one with
-# method_lookup() on first use and reuses it on later calls.
-my $in_xact;
-my $begin;
-my $commit;
-my $rollback;
-my $lookup;
-my $update_entry;
-my $mr_lookup;
-my $mr_update;
-my $mr_create;
-my $create_source_map;
-my $sm_lookup;
-my $rm_old_rd;
-my $rm_old_sm;
-my $rm_old_fr;
-my $rm_old_tr;
-my $rm_old_ar;
-my $rm_old_sr;
-my $rm_old_kr;
-my $rm_old_ser;
-
-my $fr_create;
-my $rd_create;
-# Per-class field_entry batch.create handles, keyed by class name.
-my $create = {};
-
-# Record descriptor extraction rules. Each key is the name of a
-# record_descriptor accessor; each value is a Perl expression (as a string)
-# that wormize()/authority_wormize() evaluate with string eval while lexicals
-# $ldr (leader text) and $oo8 (008 controlfield text) are in scope.
-my %descriptor_code = (
- item_type => 'substr($ldr,6,1)',
- item_form => '(substr($ldr,6,1) =~ /^(?:f|g|i|m|o|p|r)$/) ? substr($oo8,29,1) : substr($oo8,23,1)',
- bib_level => 'substr($ldr,7,1)',
- control_type => 'substr($ldr,8,1)',
- char_encoding => 'substr($ldr,9,1)',
- enc_level => 'substr($ldr,17,1)',
- cat_form => 'substr($ldr,18,1)',
- pub_status => 'substr($ldr,5,1)',
- item_lang => 'substr($oo8,35,3)',
- #lit_form => '(substr($ldr,6,1) =~ /^(?:f|g|i|m|o|p|r)$/) ? substr($oo8,33,1) : "0"',
- audience => 'substr($oo8,22,1)',
-);
-
-# Re-derive all indexing data for one or more biblio records.
-#
-# For each record: transform the MARCXML to MODS, compute and store the
-# fingerprint, optionally map the record to a metarecord (creating one when
-# no metarecord has that fingerprint), build the record descriptor, the
-# flattened full_rec rows and the per-class field entries. Existing derived
-# rows for the supplied ids are then deleted and the new rows inserted.
-#
-# Params:  $self   - method object; its api_name selects behaviour:
-#                      contains "no_map" -> skip metarecord mapping
-#                      ends in "batch"   -> process every id, else only the first
-#          $client - passed to transaction.begin when a transaction is started here
-#          @docids - biblio.record_entry ids
-# Returns: the number of records processed.
-# Throws:  OpenSRF::EX::PANIC when a transaction or storage call fails.
-sub wormize {
-
- my $self = shift;
- my $client = shift;
- my @docids = @_;
-
- my $no_map = 0;
- if ($self->api_name =~ /no_map/o) {
- $no_map = 1;
- }
-
- # Resolve each storage method once and keep the handle in the file-scoped
- # cache variables.
- $in_xact = $self->method_lookup( 'open-ils.storage.transaction.current')
- unless ($in_xact);
- $begin = $self->method_lookup( 'open-ils.storage.transaction.begin')
- unless ($begin);
- $commit = $self->method_lookup( 'open-ils.storage.transaction.commit')
- unless ($commit);
- $rollback = $self->method_lookup( 'open-ils.storage.transaction.rollback')
- unless ($rollback);
- $sm_lookup = $self->method_lookup('open-ils.storage.direct.metabib.metarecord_source_map.search.source')
- unless ($sm_lookup);
- $mr_lookup = $self->method_lookup('open-ils.storage.direct.metabib.metarecord.search.fingerprint')
- unless ($mr_lookup);
- $mr_update = $self->method_lookup('open-ils.storage.direct.metabib.metarecord.batch.update')
- unless ($mr_update);
- $mr_create = $self->method_lookup('open-ils.storage.direct.metabib.metarecord.create')
- unless ($mr_create);
- $create_source_map = $self->method_lookup('open-ils.storage.direct.metabib.metarecord_source_map.batch.create')
- unless ($create_source_map);
- $lookup = $self->method_lookup('open-ils.storage.direct.biblio.record_entry.batch.retrieve')
- unless ($lookup);
- $update_entry = $self->method_lookup('open-ils.storage.direct.biblio.record_entry.batch.update')
- unless ($update_entry);
- $rm_old_sm = $self->method_lookup( 'open-ils.storage.direct.metabib.metarecord_source_map.mass_delete')
- unless ($rm_old_sm);
- $rm_old_rd = $self->method_lookup( 'open-ils.storage.direct.metabib.record_descriptor.mass_delete')
- unless ($rm_old_rd);
- $rm_old_fr = $self->method_lookup( 'open-ils.storage.direct.metabib.full_rec.mass_delete')
- unless ($rm_old_fr);
- $rm_old_tr = $self->method_lookup( 'open-ils.storage.direct.metabib.title_field_entry.mass_delete')
- unless ($rm_old_tr);
- $rm_old_ar = $self->method_lookup( 'open-ils.storage.direct.metabib.author_field_entry.mass_delete')
- unless ($rm_old_ar);
- $rm_old_sr = $self->method_lookup( 'open-ils.storage.direct.metabib.subject_field_entry.mass_delete')
- unless ($rm_old_sr);
- $rm_old_kr = $self->method_lookup( 'open-ils.storage.direct.metabib.keyword_field_entry.mass_delete')
- unless ($rm_old_kr);
- $rm_old_ser = $self->method_lookup( 'open-ils.storage.direct.metabib.series_field_entry.mass_delete')
- unless ($rm_old_ser);
- $rd_create = $self->method_lookup( 'open-ils.storage.direct.metabib.record_descriptor.batch.create')
- unless ($rd_create);
- $fr_create = $self->method_lookup( 'open-ils.storage.direct.metabib.full_rec.batch.create')
- unless ($fr_create);
- $$create{title} = $self->method_lookup( 'open-ils.storage.direct.metabib.title_field_entry.batch.create')
- unless ($$create{title});
- $$create{author} = $self->method_lookup( 'open-ils.storage.direct.metabib.author_field_entry.batch.create')
- unless ($$create{author});
- $$create{subject} = $self->method_lookup( 'open-ils.storage.direct.metabib.subject_field_entry.batch.create')
- unless ($$create{subject});
- $$create{keyword} = $self->method_lookup( 'open-ils.storage.direct.metabib.keyword_field_entry.batch.create')
- unless ($$create{keyword});
- $$create{series} = $self->method_lookup( 'open-ils.storage.direct.metabib.series_field_entry.batch.create')
- unless ($$create{series});
-
-
- # Only open (and later commit) a transaction when the caller has not
- # already opened one.
- my ($outer_xact) = $in_xact->run;
- try {
- unless ($outer_xact) {
- $log->debug("WoRM isn't inside a transaction, starting one now.", INFO);
- my ($r) = $begin->run($client);
- unless (defined $r and $r) {
- $rollback->run;
- throw OpenSRF::EX::PANIC ("Couldn't BEGIN transaction!")
- }
- }
- } catch Error with {
- throw OpenSRF::EX::PANIC ("WoRM Couldn't BEGIN transaction!")
- };
-
- my @source_maps;
- my @entry_list;
- my @mr_list;
- my @rd_list;
- my @ns_list;
- my @mods_data;
- my $ret = 0;
- for my $entry ( $lookup->run(@docids) ) {
- # step -1: grab the doc from storage
- next unless ($entry);
-
- # Compile the MARC -> MODS stylesheet on first use.
- if(!$mods_sheet) {
- my $xslt_doc = $parser->parse_file(
- OpenSRF::Utils::SettingsClient->new->config_value(dirs => 'xsl') . "/MARC21slim2MODS.xsl");
- $mods_sheet = $xslt->parse_stylesheet( $xslt_doc );
- }
-
- my $xml = $entry->marc;
- my $docid = $entry->id;
- my $marcdoc = $parser->parse_string($xml);
- my $modsdoc = $mods_sheet->transform($marcdoc);
-
- my $mods = $modsdoc->documentElement;
- $mods->setNamespace( "http://www.loc.gov/mods/", "mods", 1 );
-
- $entry->fingerprint( fingerprint_mods( $mods ) );
- push @entry_list, $entry;
-
- $log->debug("Fingerprint for Record Entry ".$docid." is [".$entry->fingerprint."]", INFO);
-
- unless ($no_map) {
- # NOTE(review): $mr is tested as an array ref here but used as an
- # object in the else branch -- confirm what the search returns.
- my ($mr) = $mr_lookup->run( $entry->fingerprint );
- if (!$mr || !@$mr) {
- $log->debug("No metarecord found for fingerprint [".$entry->fingerprint."]; Creating a new one", INFO);
- $mr = new Fieldmapper::metabib::metarecord;
- $mr->fingerprint( $entry->fingerprint );
- $mr->master_record( $entry->id );
- my ($new_mr) = $mr_create->run($mr);
- # Check the create call's result, not the local object (which is
- # always defined), so a failed create is actually detected.
- unless (defined $new_mr) {
- throw OpenSRF::EX::PANIC ("Couldn't run open-ils.storage.direct.metabib.metarecord.create!")
- }
- $mr->id($new_mr);
- } else {
- $log->debug("Retrieved metarecord, id is ".$mr->id, INFO);
- $mr->mods('');
- push @mr_list, $mr;
- }
-
- my $sm = new Fieldmapper::metabib::metarecord_source_map;
- $sm->metarecord( $mr->id );
- $sm->source( $entry->id );
- push @source_maps, $sm;
- }
-
- # $ldr and $oo8 are read by the %descriptor_code expressions below.
- my $ldr = $marcdoc->documentElement->getChildrenByTagName('leader')->pop->textContent;
- my $oo8 = $marcdoc->documentElement->findvalue('//*[local-name()="controlfield" and @tag="008"]');
-
- my $rd_obj = Fieldmapper::metabib::record_descriptor->new;
- for my $rd_field ( keys %descriptor_code ) {
- $rd_obj->$rd_field( eval "$descriptor_code{$rd_field};" );
- }
- $rd_obj->record( $docid );
- push @rd_list, $rd_obj;
-
- push @mods_data, { $docid => $self->modsdoc_to_values( $mods ) };
-
- # step 2: build the KOHA rows
- my @tmp_list = _marcxml_to_full_rows( $marcdoc );
- $_->record( $docid ) for (@tmp_list);
- push @ns_list, @tmp_list;
-
- $ret++;
-
- # Non-batch API names handle only the first record.
- last unless ($self->api_name =~ /batch$/o);
- }
-
- # Drop previously derived rows for every supplied id before re-inserting.
- $rm_old_rd->run( { record => \@docids } );
- $rm_old_fr->run( { record => \@docids } );
- $rm_old_sm->run( { source => \@docids } ) unless ($no_map);
- $rm_old_tr->run( { source => \@docids } );
- $rm_old_ar->run( { source => \@docids } );
- $rm_old_sr->run( { source => \@docids } );
- $rm_old_kr->run( { source => \@docids } );
- $rm_old_ser->run( { source => \@docids } );
-
- unless ($no_map) {
- my ($sm) = $create_source_map->run(@source_maps);
- unless (defined $sm) {
- throw OpenSRF::EX::PANIC ("Couldn't run open-ils.storage.direct.metabib.metarecord_source_map.batch.create!")
- }
- my ($mr) = $mr_update->run(@mr_list);
- unless (defined $mr) {
- throw OpenSRF::EX::PANIC ("Couldn't run open-ils.storage.direct.metabib.metarecord.batch.update!")
- }
- }
-
- my ($re) = $update_entry->run(@entry_list);
- unless (defined $re) {
- throw OpenSRF::EX::PANIC ("Couldn't run open-ils.storage.direct.biblio.record_entry.batch.update!")
- }
-
- my ($rd) = $rd_create->run(@rd_list);
- unless (defined $rd) {
- throw OpenSRF::EX::PANIC ("Couldn't run open-ils.storage.direct.metabib.record_descriptor.batch.create!")
- }
-
- my ($fr) = $fr_create->run(@ns_list);
- unless (defined $fr) {
- throw OpenSRF::EX::PANIC ("Couldn't run open-ils.storage.direct.metabib.full_rec.batch.create!")
- }
-
- # step 5: insert the new metadata
- for my $class ( qw/title author subject keyword series/ ) {
- my @md_list = ();
- for my $doc ( @mods_data ) {
- # Each @mods_data element is a single-pair hash: { docid => values }.
- my ($did) = keys %$doc;
- my ($data) = values %$doc;
-
- my $fm_constructor = "Fieldmapper::metabib::${class}_field_entry";
- for my $row ( keys %{ $$data{$class} } ) {
- next unless (exists $$data{$class}{$row});
- next unless ($$data{$class}{$row}{value});
- my $fm_obj = $fm_constructor->new;
- $fm_obj->value( $$data{$class}{$row}{value} );
- $fm_obj->field( $$data{$class}{$row}{field_id} );
- $fm_obj->source( $did );
- $log->debug("$class entry: ".$fm_obj->source." => ".$fm_obj->field." : ".$fm_obj->value, DEBUG);
-
- push @md_list, $fm_obj;
- }
- }
-
- my ($cr) = $$create{$class}->run(@md_list);
- unless (defined $cr) {
- throw OpenSRF::EX::PANIC ("Couldn't run open-ils.storage.direct.metabib.${class}_field_entry.batch.create!")
- }
- }
-
- unless ($outer_xact) {
- $log->debug("Commiting transaction started by the WoRM.", INFO);
- my ($c) = $commit->run;
- unless (defined $c and $c) {
- $rollback->run;
- throw OpenSRF::EX::PANIC ("Couldn't COMMIT changes!")
- }
- }
-
- return $ret;
-}
-# Publish wormize() under every supported API name. The name itself selects
-# the variant: wormize() inspects api_name for "no_map" and a trailing "batch".
-for my $wormize_api (
-	"open-ils.worm.wormize",
-	"open-ils.worm.wormize.no_map",
-	"open-ils.worm.wormize.batch",
-	"open-ils.worm.wormize.no_map.batch",
-) {
-	__PACKAGE__->register_method(
-		api_name	=> $wormize_api,
-		method		=> "wormize",
-		api_level	=> 1,
-		argc		=> 1,
-	);
-}
-
-
-# File-scoped cache of storage method handles for authority_wormize().
-# Several are declared but not used by the code below; they are kept so the
-# set of file-level names is unchanged.
-my $ain_xact;
-my $abegin;
-my $acommit;
-my $arollback;
-my $alookup;
-my $aupdate_entry;
-my $amr_lookup;
-my $amr_update;
-my $amr_create;
-my $acreate_source_map;
-my $asm_lookup;
-my $arm_old_rd;
-my $arm_old_sm;
-my $arm_old_fr;
-my $arm_old_tr;
-my $arm_old_ar;
-my $arm_old_sr;
-my $arm_old_kr;
-my $arm_old_ser;
-
-my $afr_create;
-my $ard_create;
-my $acreate = {};
-
-# Re-derive the record descriptor and flattened full_rec rows for one or more
-# authority records.
-#
-# Params:  $self   - method object; an api_name ending in "batch" processes
-#                    every id, otherwise only the first record is handled
-#          $client - passed to transaction.begin when a transaction is started here
-#          @docids - authority.record_entry ids
-# Returns: the number of records processed.
-# Throws:  OpenSRF::EX::PANIC when a transaction or storage call fails.
-sub authority_wormize {
-
- my $self = shift;
- my $client = shift;
- my @docids = @_;
-
- # The transaction handles are shared with wormize().
- $in_xact = $self->method_lookup( 'open-ils.storage.transaction.current')
- unless ($in_xact);
- $begin = $self->method_lookup( 'open-ils.storage.transaction.begin')
- unless ($begin);
- $commit = $self->method_lookup( 'open-ils.storage.transaction.commit')
- unless ($commit);
- $rollback = $self->method_lookup( 'open-ils.storage.transaction.rollback')
- unless ($rollback);
- $alookup = $self->method_lookup('open-ils.storage.direct.authority.record_entry.batch.retrieve')
- unless ($alookup);
- $aupdate_entry = $self->method_lookup('open-ils.storage.direct.authority.record_entry.batch.update')
- unless ($aupdate_entry);
- $arm_old_rd = $self->method_lookup( 'open-ils.storage.direct.authority.record_descriptor.mass_delete')
- unless ($arm_old_rd);
- $arm_old_fr = $self->method_lookup( 'open-ils.storage.direct.authority.full_rec.mass_delete')
- unless ($arm_old_fr);
- $ard_create = $self->method_lookup( 'open-ils.storage.direct.authority.record_descriptor.batch.create')
- unless ($ard_create);
- $afr_create = $self->method_lookup( 'open-ils.storage.direct.authority.full_rec.batch.create')
- unless ($afr_create);
-
-
- # Only open (and later commit) a transaction when the caller has not
- # already opened one.
- my ($outer_xact) = $in_xact->run;
- try {
- unless ($outer_xact) {
- $log->debug("WoRM isn't inside a transaction, starting one now.", INFO);
- my ($r) = $begin->run($client);
- unless (defined $r and $r) {
- $rollback->run;
- throw OpenSRF::EX::PANIC ("Couldn't BEGIN transaction!")
- }
- }
- } catch Error with {
- throw OpenSRF::EX::PANIC ("WoRM Couldn't BEGIN transaction!")
- };
-
- my @rd_list;
- my @ns_list;
- my $ret = 0;
- # Use the authority lookup handle; the biblio $lookup handle is either
- # unset or fetches the wrong record type.
- for my $entry ( $alookup->run(@docids) ) {
- # step -1: grab the doc from storage
- next unless ($entry);
-
- #if(!$mads_sheet) {
- # my $xslt_doc = $parser->parse_file(
- # OpenSRF::Utils::SettingsClient->new->config_value(dirs => 'xsl') . "/MARC21slim2MODS.xsl");
- # $mads_sheet = $xslt->parse_stylesheet( $xslt_doc );
- #}
-
- my $xml = $entry->marc;
- my $docid = $entry->id;
- my $marcdoc = $parser->parse_string($xml);
- #my $madsdoc = $mads_sheet->transform($marcdoc);
-
- #my $mads = $madsdoc->documentElement;
- #$mads->setNamespace( "http://www.loc.gov/mads/", "mads", 1 );
-
- # $ldr and $oo8 are read by the %descriptor_code expressions below.
- my $ldr = $marcdoc->documentElement->getChildrenByTagName('leader')->pop->textContent;
- my $oo8 = $marcdoc->documentElement->findvalue('//*[local-name()="controlfield" and @tag="008"]');
-
- my $rd_obj = Fieldmapper::authority::record_descriptor->new;
- for my $rd_field ( keys %descriptor_code ) {
- $rd_obj->$rd_field( eval "$descriptor_code{$rd_field};" );
- }
- $rd_obj->record( $docid );
- push @rd_list, $rd_obj;
-
- # step 2: build the KOHA rows
- my @tmp_list = _marcxml_to_full_rows( $marcdoc, 'Fieldmapper::authority::full_rec' );
- $_->record( $docid ) for (@tmp_list);
- push @ns_list, @tmp_list;
-
- $ret++;
-
- # Non-batch API names handle only the first record.
- last unless ($self->api_name =~ /batch$/o);
- }
-
- # Drop previously derived rows for every supplied id before re-inserting.
- $arm_old_rd->run( { record => \@docids } );
- $arm_old_fr->run( { record => \@docids } );
-
- my ($rd) = $ard_create->run(@rd_list);
- unless (defined $rd) {
- throw OpenSRF::EX::PANIC ("Couldn't run open-ils.storage.direct.authority.record_descriptor.batch.create!")
- }
-
- # Use the authority full_rec handle, not the biblio $fr_create.
- my ($fr) = $afr_create->run(@ns_list);
- unless (defined $fr) {
- throw OpenSRF::EX::PANIC ("Couldn't run open-ils.storage.direct.authority.full_rec.batch.create!")
- }
-
- unless ($outer_xact) {
- $log->debug("Commiting transaction started by the WoRM.", INFO);
- my ($c) = $commit->run;
- unless (defined $c and $c) {
- $rollback->run;
- throw OpenSRF::EX::PANIC ("Couldn't COMMIT changes!")
- }
- }
-
- return $ret;
-}
-# Authority API names, bound to authority_wormize (the original registrations
-# pointed at the biblio wormize sub).
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.authority.wormize",
- method => "authority_wormize",
- api_level => 1,
- argc => 1,
-);
-# Misspelled name from the original registration, kept as an alias so that
-# existing callers still resolve.
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.authortiy.wormize",
- method => "authority_wormize",
- api_level => 1,
- argc => 1,
-);
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.authority.wormize.batch",
- method => "authority_wormize",
- api_level => 1,
- argc => 1,
-);
-
-
-# --------------------------------------------------------------------------------
-
-
-# Flatten a MARCXML document into one row object per leader, controlfield
-# and datafield child node.
-#
-# Params:  $marcxml - parsed document (documentElement() is called on it)
-#          $type    - class to instantiate for each row; defaults to
-#                     'Fieldmapper::metabib::full_rec'
-# Returns: list of row objects with tag/value set (plus ind1, ind2 and
-#          subfield for datafield rows). Values are NFD-normalized with
-#          combining marks stripped; datafield values are also lower-cased.
-#          The caller is expected to set record() on each row.
-sub _marcxml_to_full_rows {
-
-	my $marcxml = shift;
-	my $type = shift || 'Fieldmapper::metabib::full_rec';
-
-	my @ns_list;
-
-	my $root = $marcxml->documentElement;
-
-	for my $tagline ( @{$root->getChildrenByTagName("leader")} ) {
-		next unless $tagline;
-
-		# Honour the requested row class; the leader rows used to be
-		# hard-wired to the metabib class even for authority records.
-		my $ns = $type->new;
-
-		$ns->tag( 'LDR' );
-		my $val = NFD($tagline->textContent);
-		$val =~ s/(\pM+)//gso;
-		$ns->value( $val );
-
-		push @ns_list, $ns;
-	}
-
-	for my $tagline ( @{$root->getChildrenByTagName("controlfield")} ) {
-		next unless $tagline;
-
-		# Same fix as above for controlfield rows.
-		my $ns = $type->new;
-
-		$ns->tag( $tagline->getAttribute( "tag" ) );
-		my $val = NFD($tagline->textContent);
-		$val =~ s/(\pM+)//gso;
-		$ns->value( $val );
-
-		push @ns_list, $ns;
-	}
-
-	for my $tagline ( @{$root->getChildrenByTagName("datafield")} ) {
-		next unless $tagline;
-
-		my $tag = $tagline->getAttribute( "tag" );
-		my $ind1 = $tagline->getAttribute( "ind1" );
-		my $ind2 = $tagline->getAttribute( "ind2" );
-
-		# NOTE(review): every child node is treated as a subfield element;
-		# presumably the stored MARCXML has no whitespace text nodes here.
-		for my $data ( $tagline->childNodes ) {
-			next unless $data;
-
-			my $ns = $type->new;
-
-			$ns->tag( $tag );
-			$ns->ind1( $ind1 );
-			$ns->ind2( $ind2 );
-			$ns->subfield( $data->getAttribute( "code" ) );
-			my $val = NFD($data->textContent);
-			$val =~ s/(\pM+)//gso;
-			$ns->value( lc($val) );
-
-			push @ns_list, $ns;
-		}
-	}
-	return @ns_list;
-}
-
-# Collect the text selected by $xpath under $root into one space-separated,
-# lower-cased string with combining marks removed.
-#
-# For a matched node with children, each child's text is appended unless the
-# text gathered so far already contains it; a childless node contributes its
-# own text unconditionally.
-sub _get_field_value {
-
-	my( $root, $xpath ) = @_;
-
-	my $buffer = "";
-
-	foreach my $node ( $root->findnodes( $xpath ) ) {
-
-		my @kids = $node->childNodes();
-
-		# Childless match: take the node's own text as-is.
-		unless (@kids) {
-			$buffer .= $node->textContent . " ";
-			next;
-		}
-
-		foreach my $kid (@kids) {
-			# Skip text that is already present in the buffer.
-			my $escaped = quotemeta($kid->textContent);
-			next if ($buffer =~ /$escaped/);
-			$buffer .= $kid->textContent . " ";
-		}
-	}
-
-	$buffer = NFD($buffer);
-	$buffer =~ s/(\pM)//gso;
-	return lc($buffer);
-}
-
-
-# Evaluate every configured XPath in $xpathset against a MODS element.
-#
-# Returns a hash ref shaped { class => { field name => { value, field_id } } },
-# where value comes from _get_field_value() and field_id is the cached id.
-sub modsdoc_to_values {
-	my( $self, $mods ) = @_;
-	my %extracted;
-	foreach my $class (keys %$xpathset) {
-		my $fields = $xpathset->{$class};
-		$extracted{$class} = {
-			map {
-				( $_ => {
-					value		=> _get_field_value( $mods, $fields->{$_}->{xpath} ),
-					field_id	=> $fields->{$_}->{id},
-				} )
-			} keys %$fields
-		};
-	}
-	return \%extracted;
-}
-
-
-1;
-
-
+++ /dev/null
-package OpenILS::Application::WoRM;
-use base qw/OpenSRF::Application/;
-use open qw/:utf8/;
-
-use Unicode::Normalize;
-use OpenSRF::EX qw/:try/;
-
-use OpenSRF::Utils::SettingsClient;
-use OpenSRF::Utils::Logger qw/:level/;
-
-use OpenILS::Utils::FlatXML;
-use OpenILS::Utils::Fieldmapper;
-use OpenSRF::Utils::JSON;
-
-use OpenILS::Utils::Fieldmapper;
-
-use XML::LibXML;
-use XML::LibXSLT;
-use Time::HiRes qw(time);
-
-
-our $log = 'OpenSRF::Utils::Logger';
-our $xml_util = OpenILS::Utils::FlatXML->new();
-
-our $parser = XML::LibXML->new();
-our $xslt = XML::LibXSLT->new();
-our $mods_sheet;
-our $mads_sheet;
-
-our $st_sess;
-# Accessor for the package-wide cached session: a true argument replaces the
-# cached value; the current value is always returned.
-sub st_sess {
-	my (undef, $replacement) = @_;
-	if ($replacement) {
-		$st_sess = $replacement;
-	}
-	return $st_sess;
-}
-
-our $xpathset = {};
-
-# Intentionally empty hooks; this package does its setup in post_init().
-sub initialize {}
-sub child_init {}
-
-# Lazy one-time setup, called at the top of the transaction helpers:
-# compiles the MARC -> MODS stylesheet and loads the metabib field XPaths
-# into $xpathset. Each part is skipped once it has been populated.
-sub post_init {
-	$log->debug("Running post_init", DEBUG);
-
-	if (!$mods_sheet) {
-		$log->debug("Loading MODS XSLT", DEBUG);
-		my $xsl_dir = OpenSRF::Utils::SettingsClient->new->config_value(dirs => 'xsl');
-		my $xslt_doc = $parser->parse_file( $xsl_dir . "/MARC21slim2MODS.xsl" );
-		$mods_sheet = $xslt->parse_stylesheet( $xslt_doc );
-	}
-
-	# Disabled: cached storage session.
-	#if (!__PACKAGE__->st_sess()) {
-	#	$log->debug("Creating cached storage server session", DEBUG);
-	#	__PACKAGE__->st_sess( OpenSRF::AppSession->create('open-ils.storage') );
-	#}
-
-	unless (keys %$xpathset) {
-		my $fields = __PACKAGE__->storage_req('open-ils.storage.direct.config.metabib_field.retrieve.all.atomic');
-		foreach my $field (@$fields) {
-			my $slot = $xpathset->{ $field->field_class }->{ $field->name } ||= {};
-			$slot->{xpath} = $field->xpath;
-			$slot->{id} = $field->id;
-			$log->debug("Loaded XPath from DB: ".$field->field_class." => ".$field->name." : ".$field->xpath, DEBUG);
-		}
-	}
-}
-
-# Normalize a string and replace every character in U+0080..U+FFFD with a
-# hexadecimal numeric character reference.
-#
-# Params:  $stuff - text to convert
-#          $form  - 'D' selects NFD normalization; anything else selects NFC
-# Returns: the converted string.
-sub entityize {
-	my ($stuff, $form) = @_;
-
-	$stuff = ($form eq 'D') ? NFD($stuff) : NFC($stuff);
-
-	$stuff =~ s/([\x{0080}-\x{fffd}])/sprintf('&#x%X;',ord($1))/sgoe;
-	return $stuff;
-}
-
-
-# Returns whatever the storage layer reports as the current transaction.
-sub in_transaction {
-	OpenILS::Application::WoRM->post_init();
-	my $current = __PACKAGE__->storage_req( 'open-ils.storage.transaction.current' );
-	return $current;
-}
-
-# Start a storage transaction unless one is already open.
-#
-# Failures while starting are logged, not rethrown; the caller learns the
-# outcome from the return value, which is the storage layer's report of the
-# current transaction after the attempt.
-sub begin_transaction {
-	my ($self, $client) = @_;
-
-	OpenILS::Application::WoRM->post_init();
-	my $already_open = __PACKAGE__->storage_req( 'open-ils.storage.transaction.current' );
-
-	try {
-		unless ($already_open) {
-			$log->debug("WoRM isn't inside a transaction, starting one now.", INFO);
-			#__PACKAGE__->st_sess->connect;
-			my $began = __PACKAGE__->storage_req( 'open-ils.storage.transaction.begin', $client );
-			if (!$began) {
-				__PACKAGE__->storage_req( 'open-ils.storage.transaction.rollback' );
-				#__PACKAGE__->st_sess->disconnect;
-				throw OpenSRF::EX::PANIC ("Couldn't BEGIN transaction!")
-			}
-		}
-	} otherwise {
-		$log->debug("WoRM Couldn't BEGIN transaction!", ERROR)
-	};
-
-	return __PACKAGE__->storage_req( 'open-ils.storage.transaction.current' );
-}
-
-# Roll back the current storage transaction, if there is one.
-# Returns 1; throws OpenSRF::EX::PANIC when the rollback raises an Error.
-sub rollback_transaction {
-	my ($self, $client) = @_;
-
-	OpenILS::Application::WoRM->post_init();
-	my $open_xact = __PACKAGE__->storage_req( 'open-ils.storage.transaction.current' );
-
-	try {
-		if (!$open_xact) {
-			$log->debug("WoRM isn't inside a transaction.", INFO);
-		} else {
-			__PACKAGE__->storage_req( 'open-ils.storage.transaction.rollback' );
-		}
-	} catch Error with {
-		throw OpenSRF::EX::PANIC ("WoRM Couldn't ROLLBACK transaction!")
-	};
-
-	return 1;
-}
-
-# Commit the current storage transaction, if there is one. A commit that
-# reports failure is rolled back and raised as a PANIC.
-# Returns 1; throws OpenSRF::EX::PANIC on failure.
-sub commit_transaction {
-	my ($self, $client) = @_;
-
-	OpenILS::Application::WoRM->post_init();
-	my $open_xact = __PACKAGE__->storage_req( 'open-ils.storage.transaction.current' );
-
-	try {
-		#if (__PACKAGE__->st_sess->connected && $outer_xact) {
-		if (!$open_xact) {
-			$log->debug("WoRM isn't inside a transaction.", INFO);
-		} else {
-			my $committed = __PACKAGE__->storage_req( 'open-ils.storage.transaction.commit' );
-			if (!$committed) {
-				__PACKAGE__->storage_req( 'open-ils.storage.transaction.rollback' );
-				throw OpenSRF::EX::PANIC ("Couldn't COMMIT transaction!")
-			}
-			#__PACKAGE__->st_sess->disconnect;
-		}
-	} catch Error with {
-		throw OpenSRF::EX::PANIC ("WoRM Couldn't COMMIT transaction!")
-	};
-
-	return 1;
-}
-
-# Look up the named method on this package, run it with the remaining
-# arguments, and return only the first value it produced.
-sub storage_req {
-	my ($self, $method, @args) = @_;
-	my ($first) = __PACKAGE__->method_lookup( $method )->run( @args );
-	return $first;
-}
-
-# Delete the derived full_rec and record_descriptor rows of an authority
-# record, inside a savepoint.
-#
-# A transaction is opened here when none is active; in that case it is
-# committed on success and rolled back on failure.
-# Returns 1 on success, 0 when the deletes failed.
-sub scrub_authority_record {
-	my ($self, $client, $rec) = @_;
-
-	my $own_xact = 0;
-	unless (OpenILS::Application::WoRM->in_transaction) {
-		OpenILS::Application::WoRM->begin_transaction($client) || throw OpenSRF::EX::PANIC ("Couldn't BEGIN transaction!");
-		$own_xact = 1;
-	}
-
-	my $ok = 1;
-	try {
-		OpenILS::Application::WoRM->storage_req( 'open-ils.storage.savepoint.set', 'scrub_authority_record' );
-
-		OpenILS::Application::WoRM->storage_req( 'open-ils.storage.direct.authority.full_rec.mass_delete', { record => $rec } );
-		OpenILS::Application::WoRM->storage_req( 'open-ils.storage.direct.authority.record_descriptor.mass_delete', { record => $rec } );
-
-		OpenILS::Application::WoRM->storage_req( 'open-ils.storage.savepoint.release', 'scrub_authority_record' );
-	} otherwise {
-		$log->debug('Scrubbing failed : '.shift(), ERROR);
-		OpenILS::Application::WoRM->storage_req( 'open-ils.storage.savepoint.rollback', 'scrub_authority_record' );
-		$ok = 0;
-	};
-
-	# Only finish a transaction that was started here.
-	if ($own_xact) {
-		if ($ok) {
-			OpenILS::Application::WoRM->commit_transaction;
-		} else {
-			OpenILS::Application::WoRM->rollback_transaction;
-		}
-	}
-	return $ok;
-}
-__PACKAGE__->register_method(
-	api_name	=> "open-ils.worm.scrub.authority",
-	method		=> "scrub_authority_record",
-	api_level	=> 1,
-	argc		=> 1,
-);
-
-
-# Delete every derived metabib row for a biblio record and repair any
-# metarecord that had it as master, all inside a savepoint.
-#
-# Params:  $self, $client - method object and client ($client is passed to
-#                           begin_transaction when a transaction is started here)
-#          $rec           - record id, or a hash ref that is first resolved
-#                           through the record_entry search_where id_list call
-# Returns: 1 on success, 0 when scrubbing failed.
-sub scrub_metabib_record {
- my $self = shift;
- my $client = shift;
- my $rec = shift;
-
- if ( ref($rec) && ref($rec) =~ /HASH/o ) {
- $rec = OpenILS::Application::WoRM->storage_req(
- 'open-ils.storage.id_list.biblio.record_entry.search_where', $rec
- );
- }
-
- # Remember whether the transaction was opened here, so that only a
- # locally opened transaction is committed or rolled back at the end.
- my $commit = 0;
- if (!OpenILS::Application::WoRM->in_transaction) {
- OpenILS::Application::WoRM->begin_transaction($client) || throw OpenSRF::EX::PANIC ("Couldn't BEGIN transaction!");
- $commit = 1;
- }
-
- my $success = 1;
- try {
- OpenILS::Application::WoRM->storage_req( 'open-ils.storage.savepoint.set', 'scrub_metabib_record' );
-
- OpenILS::Application::WoRM->storage_req( 'open-ils.storage.direct.metabib.full_rec.mass_delete', { record => $rec } );
- OpenILS::Application::WoRM->storage_req( 'open-ils.storage.direct.metabib.metarecord_source_map.mass_delete', { source => $rec } );
- OpenILS::Application::WoRM->storage_req( 'open-ils.storage.direct.metabib.record_descriptor.mass_delete', { record => $rec } );
- OpenILS::Application::WoRM->storage_req( 'open-ils.storage.direct.metabib.title_field_entry.mass_delete', { source => $rec } );
- OpenILS::Application::WoRM->storage_req( 'open-ils.storage.direct.metabib.author_field_entry.mass_delete', { source => $rec } );
- OpenILS::Application::WoRM->storage_req( 'open-ils.storage.direct.metabib.subject_field_entry.mass_delete', { source => $rec } );
- OpenILS::Application::WoRM->storage_req( 'open-ils.storage.direct.metabib.keyword_field_entry.mass_delete', { source => $rec } );
- OpenILS::Application::WoRM->storage_req( 'open-ils.storage.direct.metabib.series_field_entry.mass_delete', { source => $rec } );
-
- $log->debug( "Looking for metarecords whose master is $rec", DEBUG);
- my $masters = OpenILS::Application::WoRM->storage_req( 'open-ils.storage.direct.metabib.metarecord.search.master_record.atomic', $rec );
-
- for my $mr (@$masters) {
- $log->debug( "Found metarecord whose master is $rec", DEBUG);
- # The source map rows for $rec were deleted above, so anything found
- # here belongs to other records.
- my $others = OpenILS::Application::WoRM->storage_req(
- 'open-ils.storage.direct.metabib.metarecord_source_map.search.metarecord.atomic', $mr->id );
-
- if (@$others) {
- # Promote the first remaining source to master and clear the mods value.
- $log->debug("Metarecord ".$mr->id." had master of $rec, setting to ".$others->[0]->source, DEBUG);
- $mr->master_record($others->[0]->source);
- OpenILS::Application::WoRM->storage_req(
- 'open-ils.storage.direct.metabib.metarecord.remote_update',
- { id => $mr->id },
- { master_record => $others->[0]->source, mods => undef }
- );
- } else {
- # No sources remain: remove the metarecord itself.
- warn "Removing metarecord whose master is $rec";
- $log->debug( "Removing metarecord whose master is $rec", DEBUG);
- OpenILS::Application::WoRM->storage_req( 'open-ils.storage.direct.metabib.metarecord.delete', $mr->id );
- warn "Metarecord removed";
- $log->debug( "Metarecord removed", DEBUG);
- }
- }
-
- OpenILS::Application::WoRM->storage_req( 'open-ils.storage.savepoint.release', 'scrub_metabib_record' );
-
- } otherwise {
- $log->debug('Scrubbing failed : '.shift(), ERROR);
- OpenILS::Application::WoRM->storage_req( 'open-ils.storage.savepoint.rollback', 'scrub_metabib_record' );
- $success = 0;
- };
-
- OpenILS::Application::WoRM->commit_transaction if ($commit && $success);
- OpenILS::Application::WoRM->rollback_transaction if ($commit && !$success);
- return $success;
-}
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.scrub.biblio",
- method => "scrub_metabib_record",
- api_level => 1,
- argc => 1,
-);
-
-# Re-wormize every biblio record mapped to a metarecord, streaming one
-# status hash per record back to the client.
-#
-# Params:  $self   - method object; passed on to wormize_biblio_record, which
-#                    reads its api_name for the nomap/noscrub variants
-#          $client - receives a respond() call per record
-#          $mrec   - metarecord id
-# Each response is { record, metarecord, success } with an extra `error` key
-# when processing that record raised an Error.
-# Returns: undef (results are delivered through $client->respond).
-sub wormize_biblio_metarecord {
-	my $self = shift;
-	my $client = shift;
-	my $mrec = shift;
-
-	my $recs = OpenILS::Application::WoRM->storage_req( 'open-ils.storage.direct.metabib.metarecord_source_map.search.metarecord.atomic' => $mrec );
-
-	for my $r (@$recs) {
-		my $success = 0;
-		try {
-			$success = wormize_biblio_record($self => $client => $r->source);
-			# Report from the source map row in hand ($r); the code used to
-			# read an undeclared $rec, which died on every record.
-			$client->respond(
-				{ record	=> $r->source,
-				  metarecord	=> $r->metarecord,
-				  success	=> $success,
-				}
-			);
-		} catch Error with {
-			my $e = shift;
-			$client->respond(
-				{ record	=> $r->source,
-				  metarecord	=> $r->metarecord,
-				  success	=> $success,
-				  error		=> $e,
-				}
-			);
-		};
-	}
-	return undef;
-}
-__PACKAGE__->register_method(
-	api_name	=> "open-ils.worm.wormize.metarecord",
-	method		=> "wormize_biblio_metarecord",
-	api_level	=> 1,
-	argc		=> 1,
-	stream		=> 1,
-);
-__PACKAGE__->register_method(
-	api_name	=> "open-ils.worm.wormize.metarecord.nomap",
-	method		=> "wormize_biblio_metarecord",
-	api_level	=> 1,
-	argc		=> 1,
-	stream		=> 1,
-);
-__PACKAGE__->register_method(
-	api_name	=> "open-ils.worm.wormize.metarecord.noscrub",
-	method		=> "wormize_biblio_metarecord",
-	api_level	=> 1,
-	argc		=> 1,
-	stream		=> 1,
-);
-__PACKAGE__->register_method(
-	api_name	=> "open-ils.worm.wormize.metarecord.nomap.noscrub",
-	method		=> "wormize_biblio_metarecord",
-	api_level	=> 1,
-	argc		=> 1,
-	stream		=> 1,
-);
-
-
-sub wormize_biblio_record {
- my $self = shift;
- my $client = shift;
- my $rec = shift;
-
- if ( ref($rec) && ref($rec) =~ /HASH/o ) {
- $rec = OpenILS::Application::WoRM->storage_req(
- 'open-ils.storage.id_list.biblio.record_entry.search_where', $rec
- );
- }
-
-
- my $commit = 0;
- if (!OpenILS::Application::WoRM->in_transaction) {
- OpenILS::Application::WoRM->begin_transaction($client) || throw OpenSRF::EX::PANIC ("Couldn't BEGIN transaction!");
- $commit = 1;
- }
-
- my $success = 1;
- try {
- # clean up the cruft
- unless ($self->api_name =~ /noscrub/o) {
- $self->method_lookup( 'open-ils.worm.scrub.biblio' )->run( $rec ) || throw OpenSRF::EX::PANIC ("Couldn't scrub record $rec!");
- }
-
- # now redo 'em
- my $bibs = OpenILS::Application::WoRM->storage_req( 'open-ils.storage.direct.biblio.record_entry.search.id.atomic', $rec );
-
- my @full_rec = ();
- my @rec_descriptor = ();
- my %field_entry = (
- title => [],
- author => [],
- subject => [],
- keyword => [],
- series => [],
- );
- my %metarecord = ();
- my @source_map = ();
- for my $r (@$bibs) {
- try {
- OpenILS::Application::WoRM->storage_req( 'open-ils.storage.savepoint.set', 'extract_data'.$r->id );
-
- my $xml = $parser->parse_string($r->marc);
-
- #update the fingerprint
- my ($fp) = $self->method_lookup( 'open-ils.worm.fingerprint.marc' )->run( $xml );
- OpenILS::Application::WoRM->storage_req(
- 'open-ils.storage.direct.biblio.record_entry.remote_update',
- { id => $r->id },
- { fingerprint => $fp->{fingerprint},
- quality => int($fp->{quality}) }
- ) if ($fp->{fingerprint} ne $r->fingerprint || int($fp->{quality}) ne $r->quality);
-
- # the full_rec stuff
- for my $fr ( $self->method_lookup( 'open-ils.worm.flat_marc.biblio.xml' )->run( $xml ) ) {
- $fr->record( $r->id );
- push @full_rec, $fr;
- }
-
- # the rec_descriptor stuff
- my ($rd) = $self->method_lookup( 'open-ils.worm.biblio_leader.xml' )->run( $xml );
- $rd->record( $r->id );
- push @rec_descriptor, $rd;
-
- # the indexing field entry stuff
- for my $class ( qw/title author subject keyword series/ ) {
- for my $fe ( $self->method_lookup( 'open-ils.worm.field_entry.class.xml' )->run( $xml, $class ) ) {
- $fe->source( $r->id );
- push @{$field_entry{$class}}, $fe;
- }
- }
-
- unless ($self->api_name =~ /nomap/o) {
- my $mr = OpenILS::Application::WoRM->storage_req( 'open-ils.storage.direct.metabib.metarecord.search.fingerprint.atomic', $fp->{fingerprint} )->[0];
-
- unless ($mr) {
- $mr = Fieldmapper::metabib::metarecord->new;
- $mr->fingerprint( $fp->{fingerprint} );
- $mr->master_record( $r->id );
- $mr->id( OpenILS::Application::WoRM->storage_req( 'open-ils.storage.direct.metabib.metarecord.create', $mr) );
- }
-
- my $mr_map = Fieldmapper::metabib::metarecord_source_map->new;
- $mr_map->metarecord( $mr->id );
- $mr_map->source( $r->id );
- push @source_map, $mr_map;
-
- $metarecord{$mr->id} = $mr;
- }
- OpenILS::Application::WoRM->storage_req( 'open-ils.storage.savepoint.release', 'extract_data'.$r->id );
- } otherwise {
- $log->debug('Data extraction failed for record '.$r->id.': '.shift(), ERROR);
- OpenILS::Application::WoRM->storage_req( 'open-ils.storage.savepoint.rollback', 'extract_data'.$r->id );
- };
- }
-
-
- if (@rec_descriptor) {
- OpenILS::Application::WoRM->storage_req( 'open-ils.storage.savepoint.set', 'wormize_record' );
-
- OpenILS::Application::WoRM->storage_req(
- 'open-ils.storage.direct.metabib.metarecord_source_map.batch.create',
- @source_map
- ) if (@source_map);
-
- for my $mr ( values %metarecord ) {
- my $sources = OpenILS::Application::WoRM->storage_req(
- 'open-ils.storage.direct.metabib.metarecord_source_map.search.metarecord.atomic',
- $mr->id
- );
-
- my $bibs = OpenILS::Application::WoRM->storage_req(
- 'open-ils.storage.direct.biblio.record_entry.search.id.atomic',
- [ map { $_->source } @$sources ]
- );
-
- my $master = ( sort { $b->quality <=> $a->quality } @$bibs )[0];
-
- OpenILS::Application::WoRM->storage_req(
- 'open-ils.storage.direct.metabib.metarecord.remote_update',
- { id => $mr->id },
- { master_record => $master->id, mods => undef }
- );
- }
-
- OpenILS::Application::WoRM->storage_req(
- 'open-ils.storage.direct.metabib.record_descriptor.batch.create',
- @rec_descriptor
- ) if (@rec_descriptor);
-
- OpenILS::Application::WoRM->storage_req(
- 'open-ils.storage.direct.metabib.full_rec.batch.create',
- @full_rec
- ) if (@full_rec);
-
- OpenILS::Application::WoRM->storage_req(
- 'open-ils.storage.direct.metabib.title_field_entry.batch.create',
- @{ $field_entry{title} }
- ) if (@{ $field_entry{title} });
-
- OpenILS::Application::WoRM->storage_req(
- 'open-ils.storage.direct.metabib.author_field_entry.batch.create',
- @{ $field_entry{author} }
- ) if (@{ $field_entry{author} });
-
- OpenILS::Application::WoRM->storage_req(
- 'open-ils.storage.direct.metabib.subject_field_entry.batch.create',
- @{ $field_entry{subject} }
- ) if (@{ $field_entry{subject} });
-
- OpenILS::Application::WoRM->storage_req(
- 'open-ils.storage.direct.metabib.keyword_field_entry.batch.create',
- @{ $field_entry{keyword} }
- ) if (@{ $field_entry{keyword} });
-
- OpenILS::Application::WoRM->storage_req(
- 'open-ils.storage.direct.metabib.series_field_entry.batch.create',
- @{ $field_entry{series} }
- ) if (@{ $field_entry{series} });
-
- OpenILS::Application::WoRM->storage_req( 'open-ils.storage.savepoint.release', 'wormize_record' );
- } else {
- $success = 0;
- }
-
- } otherwise {
- $log->debug('Wormization failed : '.shift(), ERROR);
- OpenILS::Application::WoRM->storage_req( 'open-ils.storage.savepoint.rollback', 'wormize_record' );
- $success = 0;
- };
-
- OpenILS::Application::WoRM->commit_transaction if ($commit && $success);
- OpenILS::Application::WoRM->rollback_transaction if ($commit && !$success);
- return $success;
-}
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.wormize.biblio",
- method => "wormize_biblio_record",
- api_level => 1,
- argc => 1,
-);
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.wormize.biblio.nomap",
- method => "wormize_biblio_record",
- api_level => 1,
- argc => 1,
-);
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.wormize.biblio.noscrub",
- method => "wormize_biblio_record",
- api_level => 1,
- argc => 1,
-);
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.wormize.biblio.nomap.noscrub",
- method => "wormize_biblio_record",
- api_level => 1,
- argc => 1,
-);
-
-sub wormize_authority_record {
- my $self = shift;
- my $client = shift;
- my $rec = shift;
-
- my $commit = 0;
- if (!OpenILS::Application::WoRM->in_transaction) {
- OpenILS::Application::WoRM->begin_transaction($client) || throw OpenSRF::EX::PANIC ("Couldn't BEGIN transaction!");
- $commit = 1;
- }
-
- my $success = 1;
- try {
- # clean up the cruft
- unless ($self->api_name =~ /noscrub/o) {
- $self->method_lookup( 'open-ils.worm.scrub.authority' )->run( $rec ) || throw OpenSRF::EX::PANIC ("Couldn't scrub record $rec!");
- }
-
- # now redo 'em
- my $bibs = OpenILS::Application::WoRM->storage_req( 'open-ils.storage.direct.authority.record_entry.search.id.atomic', $rec );
-
- my @full_rec = ();
- my @rec_descriptor = ();
- for my $r (@$bibs) {
- my $xml = $parser->parse_string($r->marc);
-
- # the full_rec stuff
- for my $fr ( $self->method_lookup( 'open-ils.worm.flat_marc.authority.xml' )->run( $xml ) ) {
- $fr->record( $r->id );
- push @full_rec, $fr;
- }
-
- # the rec_descriptor stuff -- XXX What does this mean for authority records?
- #my ($rd) = $self->method_lookup( 'open-ils.worm.authority_leader.xml' )->run( $xml );
- #$rd->record( $r->id );
- #push @rec_descriptor, $rd;
-
- }
-
- OpenILS::Application::WoRM->storage_req( 'open-ils.storage.savepoint.set', 'wormize_authority_record' );
-
- #OpenILS::Application::WoRM->storage_req( 'open-ils.storage.direct.authority.record_descriptor.batch.create', @rec_descriptor ) if (@rec_descriptor);
- OpenILS::Application::WoRM->storage_req( 'open-ils.storage.direct.authority.full_rec.batch.create', @full_rec ) if (@full_rec);
-
- OpenILS::Application::WoRM->storage_req( 'open-ils.storage.savepoint.release', 'wormize_authority_record' );
-
- } otherwise {
- $log->debug('Wormization failed : '.shift(), ERROR);
- OpenILS::Application::WoRM->storage_req( 'open-ils.storage.savepoint.rollback', 'wormize_authority_record' );
- $success = 0;
- };
-
- OpenILS::Application::WoRM->commit_transaction if ($commit && $success);
- OpenILS::Application::WoRM->rollback_transaction if ($commit && !$success);
- return $success;
-}
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.wormize.authority",
- method => "wormize_authority_record",
- api_level => 1,
- argc => 1,
-);
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.wormize.authority.noscrub",
- method => "wormize_authority_record",
- api_level => 1,
- argc => 1,
-);
-
-
-# --------------------------------------------------------------------------------
-# MARC index extraction
-
-package OpenILS::Application::WoRM::XPATH;
-use base qw/OpenILS::Application::WoRM/;
-use Unicode::Normalize;
-
-# give this a MODS documentElement and an XPATH expression
-sub _xpath_to_string {
- my $xml = shift;
- my $xpath = shift;
- my $ns_uri = shift;
- my $ns_prefix = shift;
- my $unique = shift;
-
- $xml->setNamespace( $ns_uri, $ns_prefix, 1 ) if ($ns_uri && $ns_prefix);
-
- my $string = "";
-
- # grab the set of matching nodes
- my @nodes = $xml->findnodes( $xpath );
- for my $value (@nodes) {
-
- # grab all children of the node
- my @children = $value->childNodes();
- for my $child (@children) {
-
- # add the childs content to the growing buffer
- my $content = quotemeta($child->textContent);
- next if ($unique && $string =~ /$content/); # uniquify the values
- $string .= $child->textContent . " ";
- }
- if( ! @children ) {
- $string .= $value->textContent . " ";
- }
- }
- return NFD($string);
-}
-
-sub class_all_index_string_xml {
- my $self = shift;
- my $client = shift;
- my $xml = shift;
- my $class = shift;
-
- OpenILS::Application::WoRM->post_init();
- $xml = $parser->parse_string($xml) unless (ref $xml);
-
- my $class_constructor = "Fieldmapper::metabib::${class}_field_entry";
- for my $type ( keys %{ $xpathset->{$class} } ) {
- my $value = _xpath_to_string(
- $mods_sheet->transform($xml)->documentElement,
- $xpathset->{$class}->{$type}->{xpath},
- "http://www.loc.gov/mods/",
- "mods",
- 1
- );
-
- next unless $value;
-
- $value =~ s/\pM+//sgo;
- $value =~ s/\pC+//sgo;
- #$value =~ s/[\x{0080}-\x{fffd}]//sgoe;
-
- $value =~ s/(\w)\./$1/sgo;
- $value = lc($value);
-
- my $fm = $class_constructor->new;
- $fm->value( $value );
- $fm->field( $xpathset->{$class}->{$type}->{id} );
- $client->respond($fm);
- }
- return undef;
-}
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.field_entry.class.xml",
- method => "class_all_index_string_xml",
- api_level => 1,
- argc => 1,
- stream => 1,
-);
-
-sub class_all_index_string_record {
- my $self = shift;
- my $client = shift;
- my $rec = shift;
- my $class = shift;
-
- OpenILS::Application::WoRM->post_init();
- my $r = OpenILS::Application::WoRM->storage_req( "open-ils.storage.direct.biblio.record_entry.retrieve" => $rec );
-
- for my $fm ($self->method_lookup("open-ils.worm.field_entry.class.xml")->run($r->marc, $class)) {
- $fm->source($rec);
- $client->respond($fm);
- }
- return undef;
-}
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.field_entry.class.record",
- method => "class_all_index_string_record",
- api_level => 1,
- argc => 1,
- stream => 1,
-);
-
-
-sub class_index_string_xml {
- my $self = shift;
- my $client = shift;
- my $xml = shift;
- my $class = shift;
- my $type = shift;
-
- OpenILS::Application::WoRM->post_init();
- $xml = $parser->parse_string($xml) unless (ref $xml);
- return _xpath_to_string( $mods_sheet->transform($xml)->documentElement, $xpathset->{$class}->{$type}->{xpath}, "http://www.loc.gov/mods/", "mods", 1 );
-}
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.class.type.xml",
- method => "class_index_string_xml",
- api_level => 1,
- argc => 1,
-);
-
-sub class_index_string_record {
- my $self = shift;
- my $client = shift;
- my $rec = shift;
- my $class = shift;
- my $type = shift;
-
- OpenILS::Application::WoRM->post_init();
- my $r = OpenILS::Application::WoRM->storage_req( "open-ils.storage.direct.biblio.record_entry.retrieve" => $rec );
-
- my ($d) = $self->method_lookup("open-ils.worm.class.type.xml")->run($r->marc, $class => $type);
- $log->debug("XPath $class->$type for bib rec $rec returns ($d)", DEBUG);
- return $d;
-}
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.class.type.record",
- method => "class_index_string_record",
- api_level => 1,
- argc => 1,
-);
-
-sub xml_xpath {
- my $self = shift;
- my $client = shift;
- my $xml = shift;
- my $xpath = shift;
- my $uri = shift;
- my $prefix = shift;
- my $unique = shift;
-
- OpenILS::Application::WoRM->post_init();
- $xml = $parser->parse_string($xml) unless (ref $xml);
- return _xpath_to_string( $xml->documentElement, $xpath, $uri, $prefix, $unique );
-}
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.xpath.xml",
- method => "xml_xpath",
- api_level => 1,
- argc => 1,
-);
-
-sub record_xpath {
- my $self = shift;
- my $client = shift;
- my $rec = shift;
- my $xpath = shift;
- my $uri = shift;
- my $prefix = shift;
- my $unique = shift;
-
- OpenILS::Application::WoRM->post_init();
- my $r = OpenILS::Application::WoRM->storage_req( "open-ils.storage.direct.biblio.record_entry.retrieve" => $rec );
-
- my ($d) = $self->method_lookup("open-ils.worm.xpath.xml")->run($r->marc, $xpath, $uri, $prefix, $unique );
- $log->debug("XPath [$xpath] bib rec $rec returns ($d)", DEBUG);
- return $d;
-}
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.xpath.record",
- method => "record_xpath",
- api_level => 1,
- argc => 1,
-);
-
-
-# --------------------------------------------------------------------------------
-# MARC Descriptor
-
-package OpenILS::Application::WoRM::Biblio::Leader;
-use base qw/OpenILS::Application::WoRM/;
-use Unicode::Normalize;
-
-our %marc_type_groups = (
- BKS => q/[at]{1}/,
- SER => q/[a]{1}/,
- VIS => q/[gkro]{1}/,
- MIX => q/[p]{1}/,
- MAP => q/[ef]{1}/,
- SCO => q/[cd]{1}/,
- REC => q/[ij]{1}/,
- COM => q/[m]{1}/,
-);
-
-sub _type_re {
- my $re = '^'. join('|', $marc_type_groups{@_}) .'$';
- return qr/$re/;
-}
-
-our %biblio_descriptor_code = (
- item_type => sub { substr($ldr,6,1); },
- item_form =>
- sub {
- if (substr($ldr,6,1) =~ _type_re( qw/MAP VIS/ )) {
- return substr($oo8,29,1);
- } elsif (substr($ldr,6,1) =~ _type_re( qw/BKS SER MIX SCO REC/ )) {
- return substr($oo8,23,1);
- }
- return ' ';
- },
- bib_level => sub { substr($ldr,7,1); },
- control_type => sub { substr($ldr,8,1); },
- char_encoding => sub { substr($ldr,9,1); },
- enc_level => sub { substr($ldr,17,1); },
- cat_form => sub { substr($ldr,18,1); },
- pub_status => sub { substr($ldr,5,1); },
- item_lang => sub { substr($oo8,35,3); },
- lit_form => sub { (substr($ldr,6,1) =~ _type_re('BKS')) ? substr($oo8,33,1) : undef; },
- type_mat => sub { (substr($ldr,6,1) =~ _type_re('VIS')) ? substr($oo8,33,1) : undef; },
- audience => sub { substr($oo8,22,1); },
-);
-
-sub _extract_biblio_descriptors {
- my $xml = shift;
-
- local $ldr = $xml->findvalue('//*[local-name()="leader"]');
- local $oo8 = $xml->findvalue('//*[local-name()="controlfield" and @tag="008"]');
- local $oo7 = $xml->findvalue('//*[local-name()="controlfield" and @tag="007"]');
-
- my $rd_obj = Fieldmapper::metabib::record_descriptor->new;
- for my $rd_field ( keys %biblio_descriptor_code ) {
- $rd_obj->$rd_field( $biblio_descriptor_code{$rd_field}->() );
- }
-
- return $rd_obj;
-}
-
-sub extract_biblio_desc_xml {
- my $self = shift;
- my $client = shift;
- my $xml = shift;
-
- $xml = $parser->parse_string($xml) unless (ref $xml);
-
- return _extract_biblio_descriptors( $xml );
-}
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.biblio_leader.xml",
- method => "extract_biblio_desc_xml",
- api_level => 1,
- argc => 1,
-);
-
-sub extract_biblio_desc_record {
- my $self = shift;
- my $client = shift;
- my $rec = shift;
-
- OpenILS::Application::WoRM->post_init();
- my $r = OpenILS::Application::WoRM->storage_req( "open-ils.storage.direct.biblio.record_entry.retrieve" => $rec );
-
- my ($d) = $self->method_lookup("open-ils.worm.biblio_leader.xml")->run($r->marc);
- $log->debug("Record descriptor for bib rec $rec is ".OpenSRF::Utils::JSON->perl2JSON($d), DEBUG);
- return $d;
-}
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.biblio_leader.record",
- method => "extract_biblio_desc_record",
- api_level => 1,
- argc => 1,
-);
-
-# --------------------------------------------------------------------------------
-# Flat MARC
-
-package OpenILS::Application::WoRM::FlatMARC;
-use base qw/OpenILS::Application::WoRM/;
-use Unicode::Normalize;
-
-
-sub _marcxml_to_full_rows {
-
- my $marcxml = shift;
- my $xmltype = shift || 'metabib';
-
- my $type = "Fieldmapper::${xmltype}::full_rec";
-
- my @ns_list;
-
- my ($root) = $marcxml->findnodes('//*[local-name()="record"]');
-
- for my $tagline ( @{$root->getChildrenByTagName("leader")} ) {
- next unless $tagline;
-
- my $ns = $type->new;
-
- $ns->tag( 'LDR' );
- my $val = $tagline->textContent;
- $val = NFD($val);
- $val =~ s/(\pM+)//gso;
- $ns->value( $val );
-
- push @ns_list, $ns;
- }
-
- for my $tagline ( @{$root->getChildrenByTagName("controlfield")} ) {
- next unless $tagline;
-
- my $ns = $type->new;
-
- $ns->tag( $tagline->getAttribute( "tag" ) );
- my $val = $tagline->textContent;
- $val = NFD($val);
- $val =~ s/(\pM+)//gso;
- $ns->value( $val );
-
- push @ns_list, $ns;
- }
-
- for my $tagline ( @{$root->getChildrenByTagName("datafield")} ) {
- next unless $tagline;
-
- my $tag = $tagline->getAttribute( "tag" );
- my $ind1 = $tagline->getAttribute( "ind1" );
- my $ind2 = $tagline->getAttribute( "ind2" );
-
- for my $data ( @{$tagline->getChildrenByTagName('subfield')} ) {
- next unless $data;
-
- my $ns = $type->new;
-
- $ns->tag( $tag );
- $ns->ind1( $ind1 );
- $ns->ind2( $ind2 );
- $ns->subfield( $data->getAttribute( "code" ) );
- my $val = $data->textContent;
- $val = NFD($val);
- $val =~ s/(\pM+)//gso;
- $ns->value( lc($val) );
-
- push @ns_list, $ns;
- }
- }
-
- $log->debug("Returning ".scalar(@ns_list)." Fieldmapper nodes from $xmltype xml", DEBUG);
- return @ns_list;
-}
-
-sub flat_marc_xml {
- my $self = shift;
- my $client = shift;
- my $xml = shift;
-
- $xml = $parser->parse_string($xml) unless (ref $xml);
-
- my $type = 'metabib';
- $type = 'authority' if ($self->api_name =~ /authority/o);
-
- OpenILS::Application::WoRM->post_init();
-
- $client->respond($_) for (_marcxml_to_full_rows($xml, $type));
- return undef;
-}
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.flat_marc.authority.xml",
- method => "flat_marc_xml",
- api_level => 1,
- argc => 1,
- stream => 1,
-);
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.flat_marc.biblio.xml",
- method => "flat_marc_xml",
- api_level => 1,
- argc => 1,
- stream => 1,
-);
-
-sub flat_marc_record {
- my $self = shift;
- my $client = shift;
- my $rec = shift;
-
- my $type = 'biblio';
- $type = 'authority' if ($self->api_name =~ /authority/o);
-
- OpenILS::Application::WoRM->post_init();
- my $r = OpenILS::Application::WoRM->storage_req( "open-ils.storage.direct.${type}.record_entry.retrieve" => $rec );
-
- $client->respond($_) for ($self->method_lookup("open-ils.worm.flat_marc.$type.xml")->run($r->marc));
- return undef;
-}
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.flat_marc.biblio.record_entry",
- method => "flat_marc_record",
- api_level => 1,
- argc => 1,
- stream => 1,
-);
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.flat_marc.authority.record_entry",
- method => "flat_marc_record",
- api_level => 1,
- argc => 1,
- stream => 1,
-);
-
-
-# --------------------------------------------------------------------------------
-# Fingerprinting
-
-package OpenILS::Application::WoRM::Biblio::Fingerprint;
-use base qw/OpenILS::Application::WoRM/;
-use Unicode::Normalize;
-use OpenSRF::EX qw/:try/;
-
-my @fp_mods_xpath = (
- '//mods:mods/mods:typeOfResource[text()="text"]' => [
- title => {
- xpath => [
- '//mods:mods/mods:titleInfo[mods:title and (@type="uniform")]',
- '//mods:mods/mods:titleInfo[mods:title and (@type="translated")]',
- '//mods:mods/mods:titleInfo[mods:title and (@type="alternative")]',
- '//mods:mods/mods:titleInfo[mods:title and not(@type)]',
- ],
- fixup => sub {
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text = NFD($text);
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text =~ s/\pM+//gso;
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text = lc($text);
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text =~ s/\s+/ /sgo;
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text =~ s/^\s*(.+)\s*$/$1/sgo;
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text =~ s/\b(?:the|an?)\b//sgo;
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text =~ s/\[.[^\]]+\]//sgo;
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text =~ s/\s*[;\/\.]*$//sgo;
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- },
- },
- author => {
- xpath => [
- '//mods:mods/mods:name[mods:role/mods:text/text()="creator" and @type="personal"]/mods:namePart',
- '//mods:mods/mods:name[mods:role/mods:text/text()="creator"]/mods:namePart',
- ],
- fixup => sub {
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text = NFD($text);
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text =~ s/\pM+//gso;
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text = lc($text);
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text =~ s/\s+/ /sgo;
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text =~ s/^\s*(.+)\s*$/$1/sgo;
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text =~ s/,?\s+.*$//sgo;
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- },
- },
- ],
-
- '//mods:mods/mods:relatedItem[@type!="host" and @type!="series"]' => [
- title => {
- xpath => [
- '//mods:mods/mods:relatedItem/mods:titleInfo[mods:title and (@type="uniform")]',
- '//mods:mods/mods:relatedItem/mods:titleInfo[mods:title and (@type="translated")]',
- '//mods:mods/mods:relatedItem/mods:titleInfo[mods:title and (@type="alternative")]',
- '//mods:mods/mods:relatedItem/mods:titleInfo[mods:title and not(@type)]',
- '//mods:mods/mods:titleInfo[mods:title and (@type="uniform")]',
- '//mods:mods/mods:titleInfo[mods:title and (@type="translated")]',
- '//mods:mods/mods:titleInfo[mods:title and (@type="alternative")]',
- '//mods:mods/mods:titleInfo[mods:title and not(@type)]',
- ],
- fixup => sub {
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text = NFD($text);
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text =~ s/\pM+//gso;
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text = lc($text);
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text =~ s/\s+/ /sgo;
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text =~ s/^\s*(.+)\s*$/$1/sgo;
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text =~ s/\b(?:the|an?)\b//sgo;
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text =~ s/\[.[^\]]+\]//sgo;
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text =~ s/\s*[;\/\.]*$//sgo;
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- },
- },
- author => {
- xpath => [
- '//mods:mods/mods:relatedItem/mods:name[mods:role/mods:text/text()="creator" and @type="personal"]/mods:namePart',
- '//mods:mods/mods:relatedItem/mods:name[mods:role/mods:text/text()="creator"]/mods:namePart',
- '//mods:mods/mods:name[mods:role/mods:text/text()="creator" and @type="personal"]/mods:namePart',
- '//mods:mods/mods:name[mods:role/mods:text/text()="creator"]/mods:namePart',
- ],
- fixup => sub {
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text = NFD($text);
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text =~ s/\pM+//gso;
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text = lc($text);
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text =~ s/\s+/ /sgo;
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text =~ s/^\s*(.+)\s*$/$1/sgo;
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- $text =~ s/,?\s+.*$//sgo;
- $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
- },
- },
- ],
-
-);
-
-push @fp_mods_xpath, '//mods:mods/mods:titleInfo' => $fp_mods_xpath[1];
-
-sub _fp_mods {
- my $mods = shift;
- $mods->setNamespace( "http://www.loc.gov/mods/", "mods", 1 );
-
- my $fp_string = '';
-
- my $match_index = 0;
- my $block_index = 1;
- while ( my $match_xpath = $fp_mods_xpath[$match_index] ) {
- if ( my @nodes = $mods->findnodes( $match_xpath ) ) {
-
- my $block_name_index = 0;
- my $block_value_index = 1;
- my $block = $fp_mods_xpath[$block_index];
- while ( my $part = $$block[$block_value_index] ) {
- local $text;
- for my $xpath ( @{ $part->{xpath} } ) {
- $text = $mods->findvalue( $xpath );
- last if ($text);
- }
-
- $log->debug("Found fingerprint text using $$block[$block_name_index] : [$text]", DEBUG);
-
- if ($text) {
- $$part{fixup}->();
- $log->debug("Fingerprint text after fixup : [$text]", DEBUG);
- $fp_string .= $text;
- }
-
- $block_name_index += 2;
- $block_value_index += 2;
- }
- }
- if ($fp_string) {
- $fp_string =~ s/\W+//gso;
- $log->debug("Fingerprint is [$fp_string]", INFO);;
- return $fp_string;
- }
-
- $match_index += 2;
- $block_index += 2;
- }
- return undef;
-}
-
-sub refingerprint_bibrec {
- my $self = shift;
- my $client = shift;
- my $rec = shift;
-
- my $commit = 0;
- if (!OpenILS::Application::WoRM->in_transaction) {
- OpenILS::Application::WoRM->begin_transaction($client) || throw OpenSRF::EX::PANIC ("Couldn't BEGIN transaction!");
- $commit = 1;
- }
-
- my $success = 1;
- try {
- my $bibs = OpenILS::Application::WoRM->storage_req( 'open-ils.storage.direct.biblio.record_entry.search.id.atomic', $rec );
- for my $b (@$bibs) {
- my ($fp) = $self->method_lookup( 'open-ils.worm.fingerprint.marc' )->run( $b->marc );
-
- if ($b->fingerprint ne $fp->{fingerprint} || $b->quality != $fp->{quality}) {
-
- $log->debug("Updating ".$b->id." with fingerprint [$fp->{fingerprint}], quality [$fp->{quality}]", INFO);;
-
- OpenILS::Application::WoRM->storage_req(
- 'open-ils.storage.direct.biblio.record_entry.remote_update',
- { id => $b->id },
- { fingerprint => $fp->{fingerprint},
- quality => $fp->{quality} }
- );
-
- if ($self->api_name !~ /nomap/o) {
- my $old_source_map = OpenILS::Application::WoRM->storage_req(
- 'open-ils.storage.direct.metabib.metarecord_source_map.search.source.atomic',
- $b->id
- );
-
- my $old_mrid;
- if (ref($old_source_map) and @$old_source_map) {
- for my $m (@$old_source_map) {
- $old_mrid = $m->metarecord;
- OpenILS::Application::WoRM->storage_req(
- 'open-ils.storage.direct.metabib.metarecord_source_map.delete',
- $m->id
- );
- }
- }
-
- my $old_sm = OpenILS::Application::WoRM->storage_req(
- 'open-ils.storage.direct.metabib.metarecord_source_map.search.atomic',
- { metarecord => $old_mrid }
- ) if ($old_mrid);
-
- if (ref($old_sm) and @$old_sm == 0) {
- OpenILS::Application::WoRM->storage_req(
- 'open-ils.storage.direct.metabib.metarecord.delete',
- $old_mrid
- );
- }
-
- my $mr = OpenILS::Application::WoRM->storage_req(
- 'open-ils.storage.direct.metabib.metarecord.search.fingerprint.atomic',
- { fingerprint => $fp->{fingerprint} }
- )->[0];
-
- unless ($mr) {
- $mr = Fieldmapper::metabib::metarecord->new;
- $mr->fingerprint( $fp->{fingerprint} );
- $mr->master_record( $b->id );
- $mr->id( OpenILS::Application::WoRM->storage_req( 'open-ils.storage.direct.metabib.metarecord.create', $mr) );
- }
-
- my $mr_map = Fieldmapper::metabib::metarecord_source_map->new;
- $mr_map->metarecord( $mr->id );
- $mr_map->source( $b->id );
- OpenILS::Application::WoRM->storage_req( 'open-ils.storage.direct.metabib.metarecord_source_map.create', $mr_map );
-
- }
- }
- $client->respond($b->id);
- }
-
- } otherwise {
- $log->debug('Fingerprinting failed : '.shift(), ERROR);
- $success = 0;
- };
-
- OpenILS::Application::WoRM->commit_transaction if ($commit && $success);
- OpenILS::Application::WoRM->rollback_transaction if ($commit && !$success);
- return undef;
-}
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.fingerprint.record.update",
- method => "refingerprint_bibrec",
- api_level => 1,
- argc => 1,
- stream => 1,
-);
-
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.fingerprint.record.update.nomap",
- method => "refingerprint_bibrec",
- api_level => 1,
- argc => 1,
-);
-
-=comment
-
-sub fingerprint_bibrec {
- my $self = shift;
- my $client = shift;
- my $rec = shift;
-
- OpenILS::Application::WoRM->post_init();
- my $r = OpenILS::Application::WoRM->storage_req( 'open-ils.storage.direct.biblio.record_entry.retrieve' => $rec );
-
- my ($fp) = $self->method_lookup('open-ils.worm.fingerprint.marc')->run($r->marc);
- $log->debug("Returning [$fp] as fingerprint for record $rec", INFO);
- return $fp;
-
-}
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.fingerprint.record",
- method => "fingerprint_bibrec",
- api_level => 0,
- argc => 1,
-);
-
-
-sub fingerprint_mods {
- my $self = shift;
- my $client = shift;
- my $xml = shift;
-
- OpenILS::Application::WoRM->post_init();
- my $mods = $parser->parse_string($xml)->documentElement;
-
- return _fp_mods( $mods );
-}
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.fingerprint.mods",
- method => "fingerprint_mods",
- api_level => 1,
- argc => 1,
-);
-
-sub fingerprint_marc {
- my $self = shift;
- my $client = shift;
- my $xml = shift;
-
- $xml = $parser->parse_string($xml) unless (ref $xml);
-
- OpenILS::Application::WoRM->post_init();
- my $fp = _fp_mods( $mods_sheet->transform($xml)->documentElement );
- $log->debug("Returning [$fp] as fingerprint", INFO);
- return $fp;
-}
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.fingerprint.marc",
- method => "fingerprint_marc",
- api_level => 1,
- argc => 1,
-);
-
-
-=cut
-
-sub biblio_fingerprint_record {
- my $self = shift;
- my $client = shift;
- my $rec = shift;
-
- OpenILS::Application::WoRM->post_init();
-
- my $marc = OpenILS::Application::WoRM
- ->storage_req( 'open-ils.storage.direct.biblio.record_entry.retrieve' => $rec )
- ->marc;
-
- my ($fp) = $self->method_lookup('open-ils.worm.fingerprint.marc')->run($marc);
- $log->debug("Returning [$fp] as fingerprint for record $rec", INFO);
- return $fp;
-}
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.fingerprint.record",
- method => "biblio_fingerprint_record",
- api_level => 1,
- argc => 1,
-);
-
-our $fp_script;
-sub biblio_fingerprint {
- my $self = shift;
- my $client = shift;
- my $marc = shift;
-
- OpenILS::Application::WoRM->post_init();
-
- $marc = $parser->parse_string($marc) unless (ref $marc);
-
- my $mods = OpenILS::Application::WoRM::entityize(
- $mods_sheet
- ->transform( $marc )
- ->documentElement
- ->toString,
- 'D'
- );
-
- $marc = OpenILS::Application::WoRM::entityize( $marc->documentElement->toString => 'D' );
-
- warn $marc;
- $log->internal("Got MARC [$marc]");
- $log->internal("Created MODS [$mods]");
-
- if(!$fp_script) {
- my @pfx = ( "apps", "open-ils.storage","app_settings" );
- my $conf = OpenSRF::Utils::SettingsClient->new;
-
- my $libs = $conf->config_value(@pfx, 'script_path');
- my $script_file = $conf->config_value(@pfx, 'scripts', 'biblio_fingerprint');
- my $script_libs = (ref($libs)) ? $libs : [$libs];
-
- $log->debug("Loading script $script_file for biblio fingerprinting...");
-
- $fp_script = new OpenILS::Utils::ScriptRunner
- ( file => $script_file,
- paths => $script_libs,
- reset_count => 1000 );
- }
-
- $log->debug("Applying environment for biblio fingerprinting...");
-
- my $env = {marc => $marc, mods => $mods};
- #my $res = {fingerprint => '', quality => '0'};
-
- $fp_script->insert('environment' => $env);
- #$fp_script->insert('result' => $res);
-
- $log->debug("Running script for biblio fingerprinting...");
-
- my $res = $fp_script->run || ($log->error( "Fingerprint script died! $@" ) && return 0);
-
- $log->debug("Script for biblio fingerprinting completed successfully...");
-
- return $res;
-}
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.fingerprint.marc",
- method => "biblio_fingerprint",
- api_level => 1,
- argc => 1,
-);
-
-# --------------------------------------------------------------------------------
-
-1;
-
-__END__
-my $in_xact;
-my $begin;
-my $commit;
-my $rollback;
-my $lookup;
-my $update_entry;
-my $mr_lookup;
-my $mr_update;
-my $mr_create;
-my $create_source_map;
-my $sm_lookup;
-my $rm_old_rd;
-my $rm_old_sm;
-my $rm_old_fr;
-my $rm_old_tr;
-my $rm_old_ar;
-my $rm_old_sr;
-my $rm_old_kr;
-my $rm_old_ser;
-
-my $fr_create;
-my $rd_create;
-my $create = {};
-
-my %descriptor_code = (
- item_type => 'substr($ldr,6,1)',
- item_form => '(substr($ldr,6,1) =~ /^(?:f|g|i|m|o|p|r)$/) ? substr($oo8,29,1) : substr($oo8,23,1)',
- bib_level => 'substr($ldr,7,1)',
- control_type => 'substr($ldr,8,1)',
- char_encoding => 'substr($ldr,9,1)',
- enc_level => 'substr($ldr,17,1)',
- cat_form => 'substr($ldr,18,1)',
- pub_status => 'substr($ldr,5,1)',
- item_lang => 'substr($oo8,35,3)',
- #lit_form => '(substr($ldr,6,1) =~ /^(?:f|g|i|m|o|p|r)$/) ? substr($oo8,33,1) : "0"',
- audience => 'substr($oo8,22,1)',
-);
-
-sub wormize {
-
- my $self = shift;
- my $client = shift;
- my @docids = @_;
-
- my $no_map = 0;
- if ($self->api_name =~ /no_map/o) {
- $no_map = 1;
- }
-
- $in_xact = $self->method_lookup( 'open-ils.storage.transaction.current')
- unless ($in_xact);
- $begin = $self->method_lookup( 'open-ils.storage.transaction.begin')
- unless ($begin);
- $commit = $self->method_lookup( 'open-ils.storage.transaction.commit')
- unless ($commit);
- $rollback = $self->method_lookup( 'open-ils.storage.transaction.rollback')
- unless ($rollback);
- $sm_lookup = $self->method_lookup('open-ils.storage.direct.metabib.metarecord_source_map.search.source')
- unless ($sm_lookup);
- $mr_lookup = $self->method_lookup('open-ils.storage.direct.metabib.metarecord.search.fingerprint')
- unless ($mr_lookup);
- $mr_update = $self->method_lookup('open-ils.storage.direct.metabib.metarecord.batch.update')
- unless ($mr_update);
- $lookup = $self->method_lookup('open-ils.storage.direct.biblio.record_entry.batch.retrieve')
- unless ($lookup);
- $update_entry = $self->method_lookup('open-ils.storage.direct.biblio.record_entry.batch.update')
- unless ($update_entry);
- $rm_old_sm = $self->method_lookup( 'open-ils.storage.direct.metabib.metarecord_source_map.mass_delete')
- unless ($rm_old_sm);
- $rm_old_rd = $self->method_lookup( 'open-ils.storage.direct.metabib.record_descriptor.mass_delete')
- unless ($rm_old_rd);
- $rm_old_fr = $self->method_lookup( 'open-ils.storage.direct.metabib.full_rec.mass_delete')
- unless ($rm_old_fr);
- $rm_old_tr = $self->method_lookup( 'open-ils.storage.direct.metabib.title_field_entry.mass_delete')
- unless ($rm_old_tr);
- $rm_old_ar = $self->method_lookup( 'open-ils.storage.direct.metabib.author_field_entry.mass_delete')
- unless ($rm_old_ar);
- $rm_old_sr = $self->method_lookup( 'open-ils.storage.direct.metabib.subject_field_entry.mass_delete')
- unless ($rm_old_sr);
- $rm_old_kr = $self->method_lookup( 'open-ils.storage.direct.metabib.keyword_field_entry.mass_delete')
- unless ($rm_old_kr);
- $rm_old_ser = $self->method_lookup( 'open-ils.storage.direct.metabib.series_field_entry.mass_delete')
- unless ($rm_old_ser);
- $mr_create = $self->method_lookup('open-ils.storage.direct.metabib.metarecord.create')
- unless ($mr_create);
- $create_source_map = $self->method_lookup('open-ils.storage.direct.metabib.metarecord_source_map.batch.create')
- unless ($create_source_map);
- $rd_create = $self->method_lookup( 'open-ils.storage.direct.metabib.record_descriptor.batch.create')
- unless ($rd_create);
- $fr_create = $self->method_lookup( 'open-ils.storage.direct.metabib.full_rec.batch.create')
- unless ($fr_create);
- $$create{title} = $self->method_lookup( 'open-ils.storage.direct.metabib.title_field_entry.batch.create')
- unless ($$create{title});
- $$create{author} = $self->method_lookup( 'open-ils.storage.direct.metabib.author_field_entry.batch.create')
- unless ($$create{author});
- $$create{subject} = $self->method_lookup( 'open-ils.storage.direct.metabib.subject_field_entry.batch.create')
- unless ($$create{subject});
- $$create{keyword} = $self->method_lookup( 'open-ils.storage.direct.metabib.keyword_field_entry.batch.create')
- unless ($$create{keyword});
- $$create{series} = $self->method_lookup( 'open-ils.storage.direct.metabib.series_field_entry.batch.create')
- unless ($$create{series});
-
-
- my ($outer_xact) = $in_xact->run;
- try {
- unless ($outer_xact) {
- $log->debug("WoRM isn't inside a transaction, starting one now.", INFO);
- my ($r) = $begin->run($client);
- unless (defined $r and $r) {
- $rollback->run;
- throw OpenSRF::EX::PANIC ("Couldn't BEGIN transaction!")
- }
- }
- } catch Error with {
- throw OpenSRF::EX::PANIC ("WoRM Couldn't BEGIN transaction!")
- };
-
- my @source_maps;
- my @entry_list;
- my @mr_list;
- my @rd_list;
- my @ns_list;
- my @mods_data;
- my $ret = 0;
- for my $entry ( $lookup->run(@docids) ) {
- # step -1: grab the doc from storage
- next unless ($entry);
-
- if(!$mods_sheet) {
- my $xslt_doc = $parser->parse_file(
- OpenSRF::Utils::SettingsClient->new->config_value(dirs => 'xsl') . "/MARC21slim2MODS.xsl");
- $mods_sheet = $xslt->parse_stylesheet( $xslt_doc );
- }
-
- my $xml = $entry->marc;
- my $docid = $entry->id;
- my $marcdoc = $parser->parse_string($xml);
- my $modsdoc = $mods_sheet->transform($marcdoc);
-
- my $mods = $modsdoc->documentElement;
- $mods->setNamespace( "http://www.loc.gov/mods/", "mods", 1 );
-
- $entry->fingerprint( fingerprint_mods( $mods ) );
- push @entry_list, $entry;
-
- $log->debug("Fingerprint for Record Entry ".$docid." is [".$entry->fingerprint."]", INFO);
-
- unless ($no_map) {
- my ($mr) = $mr_lookup->run( $entry->fingerprint );
- if (!$mr || !@$mr) {
- $log->debug("No metarecord found for fingerprint [".$entry->fingerprint."]; Creating a new one", INFO);
- $mr = new Fieldmapper::metabib::metarecord;
- $mr->fingerprint( $entry->fingerprint );
- $mr->master_record( $entry->id );
- my ($new_mr) = $mr_create->run($mr);
- $mr->id($new_mr);
- unless (defined $mr) {
- throw OpenSRF::EX::PANIC ("Couldn't run open-ils.storage.direct.metabib.metarecord.create!")
- }
- } else {
- $log->debug("Retrieved metarecord, id is ".$mr->id, INFO);
- $mr->mods('');
- push @mr_list, $mr;
- }
-
- my $sm = new Fieldmapper::metabib::metarecord_source_map;
- $sm->metarecord( $mr->id );
- $sm->source( $entry->id );
- push @source_maps, $sm;
- }
-
- my $ldr = $marcdoc->documentElement->getChildrenByTagName('leader')->pop->textContent;
- my $oo8 = $marcdoc->documentElement->findvalue('//*[local-name()="controlfield" and @tag="008"]');
-
- my $rd_obj = Fieldmapper::metabib::record_descriptor->new;
- for my $rd_field ( keys %descriptor_code ) {
- $rd_obj->$rd_field( eval "$descriptor_code{$rd_field};" );
- }
- $rd_obj->record( $docid );
- push @rd_list, $rd_obj;
-
- push @mods_data, { $docid => $self->modsdoc_to_values( $mods ) };
-
- # step 2: build the KOHA rows
- my @tmp_list = _marcxml_to_full_rows( $marcdoc );
- $_->record( $docid ) for (@tmp_list);
- push @ns_list, @tmp_list;
-
- $ret++;
-
- last unless ($self->api_name =~ /batch$/o);
- }
-
- $rm_old_rd->run( { record => \@docids } );
- $rm_old_fr->run( { record => \@docids } );
- $rm_old_sm->run( { source => \@docids } ) unless ($no_map);
- $rm_old_tr->run( { source => \@docids } );
- $rm_old_ar->run( { source => \@docids } );
- $rm_old_sr->run( { source => \@docids } );
- $rm_old_kr->run( { source => \@docids } );
- $rm_old_ser->run( { source => \@docids } );
-
- unless ($no_map) {
- my ($sm) = $create_source_map->run(@source_maps);
- unless (defined $sm) {
- throw OpenSRF::EX::PANIC ("Couldn't run open-ils.storage.direct.metabib.metarecord_source_map.batch.create!")
- }
- my ($mr) = $mr_update->run(@mr_list);
- unless (defined $mr) {
- throw OpenSRF::EX::PANIC ("Couldn't run open-ils.storage.direct.metabib.metarecord.batch.update!")
- }
- }
-
- my ($re) = $update_entry->run(@entry_list);
- unless (defined $re) {
- throw OpenSRF::EX::PANIC ("Couldn't run open-ils.storage.direct.biblio.record_entry.batch.update!")
- }
-
- my ($rd) = $rd_create->run(@rd_list);
- unless (defined $rd) {
- throw OpenSRF::EX::PANIC ("Couldn't run open-ils.storage.direct.metabib.record_descriptor.batch.create!")
- }
-
- my ($fr) = $fr_create->run(@ns_list);
- unless (defined $fr) {
- throw OpenSRF::EX::PANIC ("Couldn't run open-ils.storage.direct.metabib.full_rec.batch.create!")
- }
-
- # step 5: insert the new metadata
- for my $class ( qw/title author subject keyword series/ ) {
- my @md_list = ();
- for my $doc ( @mods_data ) {
- my ($did) = keys %$doc;
- my ($data) = values %$doc;
-
- my $fm_constructor = "Fieldmapper::metabib::${class}_field_entry";
- for my $row ( keys %{ $$data{$class} } ) {
- next unless (exists $$data{$class}{$row});
- next unless ($$data{$class}{$row}{value});
- my $fm_obj = $fm_constructor->new;
- $fm_obj->value( $$data{$class}{$row}{value} );
- $fm_obj->field( $$data{$class}{$row}{field_id} );
- $fm_obj->source( $did );
- $log->debug("$class entry: ".$fm_obj->source." => ".$fm_obj->field." : ".$fm_obj->value, DEBUG);
-
- push @md_list, $fm_obj;
- }
- }
-
- my ($cr) = $$create{$class}->run(@md_list);
- unless (defined $cr) {
- throw OpenSRF::EX::PANIC ("Couldn't run open-ils.storage.direct.metabib.${class}_field_entry.batch.create!")
- }
- }
-
- unless ($outer_xact) {
- $log->debug("Commiting transaction started by the WoRM.", INFO);
- my ($c) = $commit->run;
- unless (defined $c and $c) {
- $rollback->run;
- throw OpenSRF::EX::PANIC ("Couldn't COMMIT changes!")
- }
- }
-
- return $ret;
-}
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.wormize",
- method => "wormize",
- api_level => 1,
- argc => 1,
-);
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.wormize.no_map",
- method => "wormize",
- api_level => 1,
- argc => 1,
-);
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.wormize.batch",
- method => "wormize",
- api_level => 1,
- argc => 1,
-);
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.wormize.no_map.batch",
- method => "wormize",
- api_level => 1,
- argc => 1,
-);
-
-
-my $ain_xact;
-my $abegin;
-my $acommit;
-my $arollback;
-my $alookup;
-my $aupdate_entry;
-my $amr_lookup;
-my $amr_update;
-my $amr_create;
-my $acreate_source_map;
-my $asm_lookup;
-my $arm_old_rd;
-my $arm_old_sm;
-my $arm_old_fr;
-my $arm_old_tr;
-my $arm_old_ar;
-my $arm_old_sr;
-my $arm_old_kr;
-my $arm_old_ser;
-
-my $afr_create;
-my $ard_create;
-my $acreate = {};
-
-sub authority_wormize {
-
- my $self = shift;
- my $client = shift;
- my @docids = @_;
-
- my $no_map = 0;
- if ($self->api_name =~ /no_map/o) {
- $no_map = 1;
- }
-
- $in_xact = $self->method_lookup( 'open-ils.storage.transaction.current')
- unless ($in_xact);
- $begin = $self->method_lookup( 'open-ils.storage.transaction.begin')
- unless ($begin);
- $commit = $self->method_lookup( 'open-ils.storage.transaction.commit')
- unless ($commit);
- $rollback = $self->method_lookup( 'open-ils.storage.transaction.rollback')
- unless ($rollback);
- $alookup = $self->method_lookup('open-ils.storage.direct.authority.record_entry.batch.retrieve')
- unless ($alookup);
- $aupdate_entry = $self->method_lookup('open-ils.storage.direct.authority.record_entry.batch.update')
- unless ($aupdate_entry);
- $arm_old_rd = $self->method_lookup( 'open-ils.storage.direct.authority.record_descriptor.mass_delete')
- unless ($arm_old_rd);
- $arm_old_fr = $self->method_lookup( 'open-ils.storage.direct.authority.full_rec.mass_delete')
- unless ($arm_old_fr);
- $ard_create = $self->method_lookup( 'open-ils.storage.direct.authority.record_descriptor.batch.create')
- unless ($ard_create);
- $afr_create = $self->method_lookup( 'open-ils.storage.direct.authority.full_rec.batch.create')
- unless ($afr_create);
-
-
- my ($outer_xact) = $in_xact->run;
- try {
- unless ($outer_xact) {
- $log->debug("WoRM isn't inside a transaction, starting one now.", INFO);
- my ($r) = $begin->run($client);
- unless (defined $r and $r) {
- $rollback->run;
- throw OpenSRF::EX::PANIC ("Couldn't BEGIN transaction!")
- }
- }
- } catch Error with {
- throw OpenSRF::EX::PANIC ("WoRM Couldn't BEGIN transaction!")
- };
-
- my @source_maps;
- my @entry_list;
- my @mr_list;
- my @rd_list;
- my @ns_list;
- my @mads_data;
- my $ret = 0;
- for my $entry ( $lookup->run(@docids) ) {
- # step -1: grab the doc from storage
- next unless ($entry);
-
- #if(!$mads_sheet) {
- # my $xslt_doc = $parser->parse_file(
- # OpenSRF::Utils::SettingsClient->new->config_value(dirs => 'xsl') . "/MARC21slim2MODS.xsl");
- # $mads_sheet = $xslt->parse_stylesheet( $xslt_doc );
- #}
-
- my $xml = $entry->marc;
- my $docid = $entry->id;
- my $marcdoc = $parser->parse_string($xml);
- #my $madsdoc = $mads_sheet->transform($marcdoc);
-
- #my $mads = $madsdoc->documentElement;
- #$mads->setNamespace( "http://www.loc.gov/mads/", "mads", 1 );
-
- push @entry_list, $entry;
-
- my $ldr = $marcdoc->documentElement->getChildrenByTagName('leader')->pop->textContent;
- my $oo8 = $marcdoc->documentElement->findvalue('//*[local-name()="controlfield" and @tag="008"]');
-
- my $rd_obj = Fieldmapper::authority::record_descriptor->new;
- for my $rd_field ( keys %descriptor_code ) {
- $rd_obj->$rd_field( eval "$descriptor_code{$rd_field};" );
- }
- $rd_obj->record( $docid );
- push @rd_list, $rd_obj;
-
- # step 2: build the KOHA rows
- my @tmp_list = _marcxml_to_full_rows( $marcdoc, 'Fieldmapper::authority::full_rec' );
- $_->record( $docid ) for (@tmp_list);
- push @ns_list, @tmp_list;
-
- $ret++;
-
- last unless ($self->api_name =~ /batch$/o);
- }
-
- $arm_old_rd->run( { record => \@docids } );
- $arm_old_fr->run( { record => \@docids } );
-
- my ($rd) = $ard_create->run(@rd_list);
- unless (defined $rd) {
- throw OpenSRF::EX::PANIC ("Couldn't run open-ils.storage.direct.authority.record_descriptor.batch.create!")
- }
-
- my ($fr) = $fr_create->run(@ns_list);
- unless (defined $fr) {
- throw OpenSRF::EX::PANIC ("Couldn't run open-ils.storage.direct.authority.full_rec.batch.create!")
- }
-
- unless ($outer_xact) {
- $log->debug("Commiting transaction started by the WoRM.", INFO);
- my ($c) = $commit->run;
- unless (defined $c and $c) {
- $rollback->run;
- throw OpenSRF::EX::PANIC ("Couldn't COMMIT changes!")
- }
- }
-
- return $ret;
-}
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.authortiy.wormize",
- method => "wormize",
- api_level => 1,
- argc => 1,
-);
-__PACKAGE__->register_method(
- api_name => "open-ils.worm.authority.wormize.batch",
- method => "wormize",
- api_level => 1,
- argc => 1,
-);
-
-
-# --------------------------------------------------------------------------------
-
-
-sub _marcxml_to_full_rows {
-
- my $marcxml = shift;
- my $type = shift || 'Fieldmapper::metabib::full_rec';
-
- my @ns_list;
-
- my $root = $marcxml->documentElement;
-
- for my $tagline ( @{$root->getChildrenByTagName("leader")} ) {
- next unless $tagline;
-
- my $ns = new Fieldmapper::metabib::full_rec;
-
- $ns->tag( 'LDR' );
- my $val = NFD($tagline->textContent);
- $val =~ s/(\pM+)//gso;
- $ns->value( $val );
-
- push @ns_list, $ns;
- }
-
- for my $tagline ( @{$root->getChildrenByTagName("controlfield")} ) {
- next unless $tagline;
-
- my $ns = new Fieldmapper::metabib::full_rec;
-
- $ns->tag( $tagline->getAttribute( "tag" ) );
- my $val = NFD($tagline->textContent);
- $val =~ s/(\pM+)//gso;
- $ns->value( $val );
-
- push @ns_list, $ns;
- }
-
- for my $tagline ( @{$root->getChildrenByTagName("datafield")} ) {
- next unless $tagline;
-
- my $tag = $tagline->getAttribute( "tag" );
- my $ind1 = $tagline->getAttribute( "ind1" );
- my $ind2 = $tagline->getAttribute( "ind2" );
-
- for my $data ( $tagline->childNodes ) {
- next unless $data;
-
- my $ns = $type->new;
-
- $ns->tag( $tag );
- $ns->ind1( $ind1 );
- $ns->ind2( $ind2 );
- $ns->subfield( $data->getAttribute( "code" ) );
- my $val = NFD($data->textContent);
- $val =~ s/(\pM+)//gso;
- $ns->value( lc($val) );
-
- push @ns_list, $ns;
- }
- }
- return @ns_list;
-}
-
-sub _get_field_value {
-
- my( $root, $xpath ) = @_;
-
- my $string = "";
-
- # grab the set of matching nodes
- my @nodes = $root->findnodes( $xpath );
- for my $value (@nodes) {
-
- # grab all children of the node
- my @children = $value->childNodes();
- for my $child (@children) {
-
- # add the childs content to the growing buffer
- my $content = quotemeta($child->textContent);
- next if ($string =~ /$content/); # uniquify the values
- $string .= $child->textContent . " ";
- }
- if( ! @children ) {
- $string .= $value->textContent . " ";
- }
- }
- $string = NFD($string);
- $string =~ s/(\pM)//gso;
- return lc($string);
-}
-
-
-sub modsdoc_to_values {
- my( $self, $mods ) = @_;
- my $data = {};
- for my $class (keys %$xpathset) {
- $data->{$class} = {};
- for my $type (keys %{$xpathset->{$class}}) {
- $data->{$class}->{$type} = {};
- $data->{$class}->{$type}->{field_id} = $xpathset->{$class}->{$type}->{id};
- }
- }
- return $data;
-}
-
-
-1;
-
-
* Copyright (C) 2005 Georgia Public Library Service
* Mike Rylander <mrylander@gmail.com>
*
- * XPath used for WoRMing
+ * XPath used for record indexing ingest
*
* This table contains the XPath used to chop up MODS into it's
* indexable parts. Each XPath entry is named and assigned to