new non-saving worm stuff
authormiker <miker@dcc99617-32d9-48b4-a31d-7c20da2025e4>
Wed, 5 Jul 2006 21:22:44 +0000 (21:22 +0000)
committermiker <miker@dcc99617-32d9-48b4-a31d-7c20da2025e4>
Wed, 5 Jul 2006 21:22:44 +0000 (21:22 +0000)
git-svn-id: svn://svn.open-ils.org/ILS/trunk@4894 dcc99617-32d9-48b4-a31d-7c20da2025e4

Open-ILS/src/perlmods/OpenILS/Application/Ingest.pm [new file with mode: 0644]

diff --git a/Open-ILS/src/perlmods/OpenILS/Application/Ingest.pm b/Open-ILS/src/perlmods/OpenILS/Application/Ingest.pm
new file mode 100644 (file)
index 0000000..a94e81c
--- /dev/null
@@ -0,0 +1,2124 @@
+package OpenILS::Application::Ingest;
+use base qw/OpenSRF::Application/;
+
+use Unicode::Normalize;
+use OpenSRF::EX qw/:try/;
+
+use OpenSRF::Utils::SettingsClient;
+use OpenSRF::Utils::Logger qw/:level/;
+
+use OpenILS::Utils::FlatXML;
+use OpenILS::Utils::Fieldmapper;
+use JSON;
+
+use OpenILS::Utils::Fieldmapper;
+
+use XML::LibXML;
+use XML::LibXSLT;
+use Time::HiRes qw(time);
+
+our %supported_formats = (
+       mods3   => {ns => 'http://www.loc.gov/mods/v3'},
+       mods    => {ns => 'http://www.loc.gov/mods/'},
+       marcxml => {ns => 'http://www.loc.gov/MARC21/slim'},
+       srw_dc  => {ns => ''},
+       oai_dc  => {ns => ''},
+       rdf_dc  => {ns => ''},
+);
+
+
+our $log = 'OpenSRF::Utils::Logger';
+
+our $parser = XML::LibXML->new();
+our $xslt = XML::LibXSLT->new();
+
+our $mods_sheet;
+our $mads_sheet;
+our $xpathset = {};
+sub initialize {}
+sub child_init {}
+
+sub post_init {
+
+       unless (keys %$xpathset) {
+               $log->debug("Running post_init", DEBUG);
+
+               my $xsldir = OpenSRF::Utils::SettingsClient->new->config_value(dirs => 'xsl');
+
+               unless ($supported_formats{mods}{xslt}) {
+                       $log->debug("Loading MODS XSLT", DEBUG);
+                       my $xslt_doc = $parser->parse_file( $xsldir . "/MARC21slim2MODS.xsl");
+                       $supported_formats{mods}{xslt} = $xslt->parse_stylesheet( $xslt_doc );
+               }
+
+               unless ($supported_formats{mods3}{xslt}) {
+                       $log->debug("Loading MODS v3 XSLT", DEBUG);
+                       my $xslt_doc = $parser->parse_file( $xsldir . "/MARC21slim2MODS3.xsl");
+                       $supported_formats{mods3}{xslt} = $xslt->parse_stylesheet( $xslt_doc );
+               }
+
+
+               my $req = __PACKAGE__->storage_req('open-ils.cstore.direct.config.metabib_field.search.atomic', { id => { '!=' => undef } });
+               for my $f (@$req) {
+                       $xpathset->{ $f->field_class }->{ $f->name }->{xpath} = $f->xpath;
+                       $xpathset->{ $f->field_class }->{ $f->name }->{id} = $f->id;
+                       $xpathset->{ $f->field_class }->{ $f->name }->{format} = $f->format;
+                       $log->debug("Loaded XPath from DB: ".$f->field_class." => ".$f->name." : ".$f->xpath, DEBUG);
+               }
+       }
+}
+
+sub entityize {
+       my $stuff = shift;
+       my $form = shift;
+
+       if ($form eq 'D') {
+               $stuff = NFD($stuff);
+       } else {
+               $stuff = NFC($stuff);
+       }
+
+       $stuff =~ s/([\x{0080}-\x{fffd}])/sprintf('&#x%X;',ord($1))/sgoe;
+       return $stuff;
+}
+
+# --------------------------------------------------------------------------------
+# MARC index extraction
+
+package OpenILS::Application::Ingest::XPATH;
+use base qw/OpenILS::Application::Ingest/;
+use Unicode::Normalize;
+
+# give this a MODS documentElement and an XPATH expression
+sub xpath_to_string {
+       my $xml = shift;
+       my $xpath = shift;
+       my $ns_uri = shift;
+       my $ns_prefix = shift;
+       my $unique = shift;
+
+       $xml->setNamespace( $ns_uri, $ns_prefix, 1 ) if ($ns_uri && $ns_prefix);
+
+       my $string = "";
+
+       # grab the set of matching nodes
+       my @nodes = $xml->findnodes( $xpath );
+       for my $value (@nodes) {
+
+               # grab all children of the node
+               my @children = $value->childNodes();
+               for my $child (@children) {
+
+                       # add the childs content to the growing buffer
+                       my $content = quotemeta($child->textContent);
+                       next if ($unique && $string =~ /$content/);  # uniquify the values
+                       $string .= $child->textContent . " ";
+               }
+               if( ! @children ) {
+                       $string .= $value->textContent . " ";
+               }
+       }
+       return NFD($string);
+}
+
+sub class_index_string_xml {
+       my $self = shift;
+       my $client = shift;
+       my $xml = shift;
+       my @classes = @_;
+
+       OpenILS::Application::Ingest->post_init();
+       $xml = $parser->parse_string($xml) unless (ref $xml);
+       
+       for my $class (@classes) {
+               my $class_constructor = "Fieldmapper::metabib::${class}_field_entry";
+               for my $type ( keys %{ $xpathset->{$class} } ) {
+
+                       my $def = $xpathset->{$class}->{$type};
+                       my $value =  xpath_to_string(
+                                       $mods_sheet->transform($xml)->documentElement,
+                                       $def->{xpath},
+                                       $supported_formats{$def->{format}}{ns},
+                                       $def->{format},
+                                       1
+                       );
+
+                       next unless $value;
+
+                       $value =~ s/\pM+//sgo;
+                       $value =~ s/\pC+//sgo;
+                       #$value =~ s/[\x{0080}-\x{fffd}]//sgoe;
+
+                       $value =~ s/(\w)\./$1/sgo;
+                       $value = lc($value);
+
+                       my $fm = $class_constructor->new;
+                       $fm->value( $value );
+                       $fm->field( $xpathset->{$class}->{$type}->{id} );
+                       $client->respond($fm);
+               }
+       }
+       return undef;
+}
+__PACKAGE__->register_method(  
+       api_name        => "open-ils.ingest.field_entry.class.xml",
+       method          => "class_index_string_xml",
+       api_level       => 1,
+       argc            => 2,
+       stream          => 1,
+);                      
+
+sub class_index_string_record {
+       my $self = shift;
+       my $client = shift;
+       my $rec = shift;
+       my @classes = shift;
+
+       OpenILS::Application::Ingest->post_init();
+       my $r = OpenSRF::AppSession->create('open-ils.cstore')->request( 'open-ils.cstore.direct.biblio.record_entry.retrieve' => $rec )->gather(1);
+
+       for my $fm ($self->method_lookup("open-ils.ingest.field_entry.class.xml")->run($r->marc, @classes)) {
+               $fm->source($rec);
+               $client->respond($fm);
+       }
+       return undef;
+}
+__PACKAGE__->register_method(  
+       api_name        => "open-ils.worm.field_entry.class.record",
+       method          => "class_index_string_record",
+       api_level       => 1,
+       argc            => 2,
+       stream          => 1,
+);                      
+
+
+1;
+
+__END__
+
+sub in_transaction {
+       OpenILS::Application::Ingest->post_init();
+       return __PACKAGE__->storage_req( 'open-ils.storage.transaction.current' );
+}
+
+sub begin_transaction {
+       my $self = shift;
+       my $client = shift;
+       
+       OpenILS::Application::Ingest->post_init();
+       my $outer_xact = __PACKAGE__->storage_req( 'open-ils.storage.transaction.current' );
+       
+       try {
+               if (!$outer_xact) {
+                       $log->debug("Ingest isn't inside a transaction, starting one now.", INFO);
+                       #__PACKAGE__->st_sess->connect;
+                       my $r = __PACKAGE__->storage_req( 'open-ils.storage.transaction.begin', $client );
+                       unless (defined $r and $r) {
+                               __PACKAGE__->storage_req( 'open-ils.storage.transaction.rollback' );
+                               #__PACKAGE__->st_sess->disconnect;
+                               throw OpenSRF::EX::PANIC ("Couldn't BEGIN transaction!")
+                       }
+               }
+       } otherwise {
+               $log->debug("Ingest Couldn't BEGIN transaction!", ERROR)
+       };
+
+       return __PACKAGE__->storage_req( 'open-ils.storage.transaction.current' );
+}
+
+sub rollback_transaction {
+       my $self = shift;
+       my $client = shift;
+
+       OpenILS::Application::Ingest->post_init();
+       my $outer_xact = __PACKAGE__->storage_req( 'open-ils.storage.transaction.current' );
+
+       try {
+               if ($outer_xact) {
+                       __PACKAGE__->storage_req( 'open-ils.storage.transaction.rollback' );
+               } else {
+                       $log->debug("Ingest isn't inside a transaction.", INFO);
+               }
+       } catch Error with {
+               throw OpenSRF::EX::PANIC ("Ingest Couldn't ROLLBACK transaction!")
+       };
+
+       return 1;
+}
+
+sub commit_transaction {
+       my $self = shift;
+       my $client = shift;
+
+       OpenILS::Application::Ingest->post_init();
+       my $outer_xact = __PACKAGE__->storage_req( 'open-ils.storage.transaction.current' );
+
+       try {
+               #if (__PACKAGE__->st_sess->connected && $outer_xact) {
+               if ($outer_xact) {
+                       my $r = __PACKAGE__->storage_req( 'open-ils.storage.transaction.commit' );
+                       unless (defined $r and $r) {
+                               __PACKAGE__->storage_req( 'open-ils.storage.transaction.rollback' );
+                               throw OpenSRF::EX::PANIC ("Couldn't COMMIT transaction!")
+                       }
+                       #__PACKAGE__->st_sess->disconnect;
+               } else {
+                       $log->debug("Ingest isn't inside a transaction.", INFO);
+               }
+       } catch Error with {
+               throw OpenSRF::EX::PANIC ("Ingest Couldn't COMMIT transaction!")
+       };
+
+       return 1;
+}
+
+sub storage_req {
+       my $self = shift;
+       my $method = shift;
+       my @res = __PACKAGE__->method_lookup( $method )->run( @_ );
+       return shift( @res );
+}
+
+sub scrub_authority_record {
+       my $self = shift;
+       my $client = shift;
+       my $rec = shift;
+
+       my $commit = 0;
+       if (!OpenILS::Application::Ingest->in_transaction) {
+               OpenILS::Application::Ingest->begin_transaction($client) || throw OpenSRF::EX::PANIC ("Couldn't BEGIN transaction!");
+               $commit = 1;
+       }
+
+       my $success = 1;
+       try {
+               OpenILS::Application::Ingest->storage_req( 'open-ils.storage.savepoint.set', 'scrub_authority_record' );
+
+               OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.authority.full_rec.mass_delete', { record => $rec } );
+               OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.authority.record_descriptor.mass_delete', { record => $rec } );
+
+               OpenILS::Application::Ingest->storage_req( 'open-ils.storage.savepoint.release', 'scrub_authority_record' );
+       } otherwise {
+               $log->debug('Scrubbing failed : '.shift(), ERROR);
+               OpenILS::Application::Ingest->storage_req( 'open-ils.storage.savepoint.rollback', 'scrub_authority_record' );
+               $success = 0;
+       };
+
+       OpenILS::Application::Ingest->commit_transaction if ($commit && $success);
+       OpenILS::Application::Ingest->rollback_transaction if ($commit && !$success);
+       return $success;
+}
+__PACKAGE__->register_method(  
+       api_name        => "open-ils.worm.scrub.authority",
+       method          => "scrub_authority_record",
+       api_level       => 1,
+       argc            => 1,
+);                      
+
+
+sub scrub_metabib_record {
+       my $self = shift;
+       my $client = shift;
+       my $rec = shift;
+
+       if ( ref($rec) && ref($rec) =~ /HASH/o ) {
+               $rec = OpenILS::Application::Ingest->storage_req(
+                       'open-ils.storage.id_list.biblio.record_entry.search_where', $rec
+               );
+       }
+
+       my $commit = 0;
+       if (!OpenILS::Application::Ingest->in_transaction) {
+               OpenILS::Application::Ingest->begin_transaction($client) || throw OpenSRF::EX::PANIC ("Couldn't BEGIN transaction!");
+               $commit = 1;
+       }
+
+       my $success = 1;
+       try {
+               OpenILS::Application::Ingest->storage_req( 'open-ils.storage.savepoint.set', 'scrub_metabib_record' );
+               
+               OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.metabib.full_rec.mass_delete', { record => $rec } );
+               OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.metabib.metarecord_source_map.mass_delete', { source => $rec } );
+               OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.metabib.record_descriptor.mass_delete', { record => $rec } );
+               OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.metabib.title_field_entry.mass_delete', { source => $rec } );
+               OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.metabib.author_field_entry.mass_delete', { source => $rec } );
+               OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.metabib.subject_field_entry.mass_delete', { source => $rec } );
+               OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.metabib.keyword_field_entry.mass_delete', { source => $rec } );
+               OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.metabib.series_field_entry.mass_delete', { source => $rec } );
+
+               $log->debug( "Looking for metarecords whose master is $rec", DEBUG);
+               my $masters = OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.metabib.metarecord.search.master_record.atomic', $rec );
+
+               for my $mr (@$masters) {
+                       $log->debug( "Found metarecord whose master is $rec", DEBUG);
+                       my $others = OpenILS::Application::Ingest->storage_req(
+                                       'open-ils.storage.direct.metabib.metarecord_source_map.search.metarecord.atomic', $mr->id );
+
+                       if (@$others) {
+                               $log->debug("Metarecord ".$mr->id." had master of $rec, setting to ".$others->[0]->source, DEBUG);
+                               $mr->master_record($others->[0]->source);
+                               OpenILS::Application::Ingest->storage_req(
+                                       'open-ils.storage.direct.metabib.metarecord.remote_update',
+                                       { id => $mr->id },
+                                       { master_record => $others->[0]->source, mods => undef }
+                               );
+                       } else {
+                               warn "Removing metarecord whose master is $rec";
+                               $log->debug( "Removing metarecord whose master is $rec", DEBUG);
+                               OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.metabib.metarecord.delete', $mr->id );
+                               warn "Metarecord removed";
+                               $log->debug( "Metarecord removed", DEBUG);
+                       }
+               }
+
+               OpenILS::Application::Ingest->storage_req( 'open-ils.storage.savepoint.release', 'scrub_metabib_record' );
+
+       } otherwise {
+               $log->debug('Scrubbing failed : '.shift(), ERROR);
+               OpenILS::Application::Ingest->storage_req( 'open-ils.storage.savepoint.rollback', 'scrub_metabib_record' );
+               $success = 0;
+       };
+
+       OpenILS::Application::Ingest->commit_transaction if ($commit && $success);
+       OpenILS::Application::Ingest->rollback_transaction if ($commit && !$success);
+       return $success;
+}
+__PACKAGE__->register_method(  
+       api_name        => "open-ils.worm.scrub.biblio",
+       method          => "scrub_metabib_record",
+       api_level       => 1,
+       argc            => 1,
+);                      
+
+sub wormize_biblio_metarecord {
+       my $self = shift;
+       my $client = shift;
+       my $mrec = shift;
+
+       my $recs = OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.metabib.metarecord_source_map.search.metarecord.atomic' => $mrec );
+
+       my $count = 0;
+       for my $r (@$recs) {
+               my $success = 0;
+               try {
+                       $success = wormize_biblio_record($self => $client => $r->source);
+                       $client->respond(
+                               { record  => $r->source,
+                                 metarecord => $rec->metarecord,
+                                 success => $success,
+                               }
+                       );
+               } catch Error with {
+                       my $e = shift;
+                       $client->respond(
+                               { record  => $r->source,
+                                 metarecord => $rec->metarecord,
+                                 success => $success,
+                                 error   => $e,
+                               }
+                       );
+               };
+       }
+       return undef;
+}
+__PACKAGE__->register_method(
+       api_name        => "open-ils.worm.wormize.metarecord",
+       method          => "wormize_biblio_metarecord",
+       api_level       => 1,
+       argc            => 1,
+       stream          => 1,
+);
+__PACKAGE__->register_method(
+       api_name        => "open-ils.worm.wormize.metarecord.nomap",
+       method          => "wormize_biblio_metarecord",
+       api_level       => 1,
+       argc            => 1,
+       stream          => 1,
+);
+__PACKAGE__->register_method(
+       api_name        => "open-ils.worm.wormize.metarecord.noscrub",
+       method          => "wormize_biblio_metarecord",
+       api_level       => 1,
+       argc            => 1,
+       stream          => 1,
+);
+__PACKAGE__->register_method(
+       api_name        => "open-ils.worm.wormize.metarecord.nomap.noscrub",
+       method          => "wormize_biblio_metarecord",
+       api_level       => 1,
+       argc            => 1,
+       stream          => 1,
+);
+
+
+sub wormize_biblio_record {
+       my $self = shift;
+       my $client = shift;
+       my $rec = shift;
+
+       if ( ref($rec) && ref($rec) =~ /HASH/o ) {
+               $rec = OpenILS::Application::Ingest->storage_req(
+                       'open-ils.storage.id_list.biblio.record_entry.search_where', $rec
+               );
+       }
+
+
+       my $commit = 0;
+       if (!OpenILS::Application::Ingest->in_transaction) {
+               OpenILS::Application::Ingest->begin_transaction($client) || throw OpenSRF::EX::PANIC ("Couldn't BEGIN transaction!");
+               $commit = 1;
+       }
+
+       my $success = 1;
+       try {
+               # clean up the cruft
+               unless ($self->api_name =~ /noscrub/o) {
+                       $self->method_lookup( 'open-ils.worm.scrub.biblio' )->run( $rec ) || throw OpenSRF::EX::PANIC ("Couldn't scrub record $rec!");
+               }
+
+               # now redo 'em
+               my $bibs = OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.biblio.record_entry.search.id.atomic', $rec );
+
+               my @full_rec = ();
+               my @rec_descriptor = ();
+               my %field_entry = (
+                       title   => [],
+                       author  => [],
+                       subject => [],
+                       keyword => [],
+                       series  => [],
+               );
+               my %metarecord = ();
+               my @source_map = ();
+               for my $r (@$bibs) {
+                       try {
+                               OpenILS::Application::Ingest->storage_req( 'open-ils.storage.savepoint.set', 'extract_data'.$r->id );
+
+                               my $xml = $parser->parse_string($r->marc);
+
+                               #update the fingerprint
+                               my ($fp) = $self->method_lookup( 'open-ils.worm.fingerprint.marc' )->run( $xml );
+                               OpenILS::Application::Ingest->storage_req(
+                                       'open-ils.storage.direct.biblio.record_entry.remote_update',
+                                       { id => $r->id },
+                                       { fingerprint => $fp->{fingerprint},
+                                         quality     => int($fp->{quality}) }
+                               ) if ($fp->{fingerprint} ne $r->fingerprint || int($fp->{quality}) ne $r->quality);
+
+                               # the full_rec stuff
+                               for my $fr ( $self->method_lookup( 'open-ils.worm.flat_marc.biblio.xml' )->run( $xml ) ) {
+                                       $fr->record( $r->id );
+                                       push @full_rec, $fr;
+                               }
+
+                               # the rec_descriptor stuff
+                               my ($rd) = $self->method_lookup( 'open-ils.worm.biblio_leader.xml' )->run( $xml );
+                               $rd->record( $r->id );
+                               push @rec_descriptor, $rd;
+                       
+                               # the indexing field entry stuff
+                               for my $class ( qw/title author subject keyword series/ ) {
+                                       for my $fe ( $self->method_lookup( 'open-ils.worm.field_entry.class.xml' )->run( $xml, $class ) ) {
+                                               $fe->source( $r->id );
+                                               push @{$field_entry{$class}}, $fe;
+                                       }
+                               }
+
+                               unless ($self->api_name =~ /nomap/o) {
+                                       my $mr = OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.metabib.metarecord.search.fingerprint.atomic', $fp->{fingerprint}  )->[0];
+                               
+                                       unless ($mr) {
+                                               $mr = Fieldmapper::metabib::metarecord->new;
+                                               $mr->fingerprint( $fp->{fingerprint} );
+                                               $mr->master_record( $r->id );
+                                               $mr->id( OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.metabib.metarecord.create', $mr) );
+                                       }
+
+                                       my $mr_map = Fieldmapper::metabib::metarecord_source_map->new;
+                                       $mr_map->metarecord( $mr->id );
+                                       $mr_map->source( $r->id );
+                                       push @source_map, $mr_map;
+
+                                       $metarecord{$mr->id} = $mr;
+                               }
+                               OpenILS::Application::Ingest->storage_req( 'open-ils.storage.savepoint.release', 'extract_data'.$r->id );
+                       } otherwise {
+                               $log->debug('Data extraction failed for record '.$r->id.': '.shift(), ERROR);
+                               OpenILS::Application::Ingest->storage_req( 'open-ils.storage.savepoint.rollback', 'extract_data'.$r->id );
+                       };
+               }
+               
+
+               if (@rec_descriptor) {
+                       OpenILS::Application::Ingest->storage_req( 'open-ils.storage.savepoint.set', 'wormize_record' );
+
+                       OpenILS::Application::Ingest->storage_req(
+                               'open-ils.storage.direct.metabib.metarecord_source_map.batch.create',
+                               @source_map
+                       ) if (@source_map);
+
+                       for my $mr ( values %metarecord ) {
+                               my $sources = OpenILS::Application::Ingest->storage_req(
+                                       'open-ils.storage.direct.metabib.metarecord_source_map.search.metarecord.atomic',
+                                       $mr->id
+                               );
+
+                               my $bibs = OpenILS::Application::Ingest->storage_req(
+                                       'open-ils.storage.direct.biblio.record_entry.search.id.atomic',
+                                       [ map { $_->source } @$sources ]
+                               );
+
+                               my $master = ( sort { $b->quality <=> $a->quality } @$bibs )[0];
+
+                               OpenILS::Application::Ingest->storage_req(
+                                       'open-ils.storage.direct.metabib.metarecord.remote_update',
+                                       { id => $mr->id },
+                                       { master_record => $master->id, mods => undef }
+                               );
+                       }
+
+                       OpenILS::Application::Ingest->storage_req(
+                               'open-ils.storage.direct.metabib.record_descriptor.batch.create',
+                               @rec_descriptor
+                       ) if (@rec_descriptor);
+
+                       OpenILS::Application::Ingest->storage_req(
+                               'open-ils.storage.direct.metabib.full_rec.batch.create',
+                               @full_rec
+                       ) if (@full_rec);
+
+                       OpenILS::Application::Ingest->storage_req(
+                               'open-ils.storage.direct.metabib.title_field_entry.batch.create',
+                               @{ $field_entry{title} }
+                       ) if (@{ $field_entry{title} });
+
+                       OpenILS::Application::Ingest->storage_req(
+                               'open-ils.storage.direct.metabib.author_field_entry.batch.create',
+                               @{ $field_entry{author} }
+                       ) if (@{ $field_entry{author} });
+                       
+                       OpenILS::Application::Ingest->storage_req(
+                               'open-ils.storage.direct.metabib.subject_field_entry.batch.create',
+                               @{ $field_entry{subject} }
+                       ) if (@{ $field_entry{subject} });
+
+                       OpenILS::Application::Ingest->storage_req(
+                               'open-ils.storage.direct.metabib.keyword_field_entry.batch.create',
+                               @{ $field_entry{keyword} }
+                       ) if (@{ $field_entry{keyword} });
+
+                       OpenILS::Application::Ingest->storage_req(
+                               'open-ils.storage.direct.metabib.series_field_entry.batch.create',
+                               @{ $field_entry{series} }
+                       ) if (@{ $field_entry{series} });
+
+                       OpenILS::Application::Ingest->storage_req( 'open-ils.storage.savepoint.release', 'wormize_record' );
+               } else {
+                       $success = 0;
+               }
+
+       } otherwise {
+               $log->debug('Wormization failed : '.shift(), ERROR);
+               OpenILS::Application::Ingest->storage_req( 'open-ils.storage.savepoint.rollback', 'wormize_record' );
+               $success = 0;
+       };
+
+       OpenILS::Application::Ingest->commit_transaction if ($commit && $success);
+       OpenILS::Application::Ingest->rollback_transaction if ($commit && !$success);
+       return $success;
+}
+__PACKAGE__->register_method(
+       api_name        => "open-ils.worm.wormize.biblio",
+       method          => "wormize_biblio_record",
+       api_level       => 1,
+       argc            => 1,
+);
+__PACKAGE__->register_method(
+       api_name        => "open-ils.worm.wormize.biblio.nomap",
+       method          => "wormize_biblio_record",
+       api_level       => 1,
+       argc            => 1,
+);
+__PACKAGE__->register_method(
+       api_name        => "open-ils.worm.wormize.biblio.noscrub",
+       method          => "wormize_biblio_record",
+       api_level       => 1,
+       argc            => 1,
+);
+__PACKAGE__->register_method(
+       api_name        => "open-ils.worm.wormize.biblio.nomap.noscrub",
+       method          => "wormize_biblio_record",
+       api_level       => 1,
+       argc            => 1,
+);
+
+sub wormize_authority_record {
+       my $self = shift;
+       my $client = shift;
+       my $rec = shift;
+
+       my $commit = 0;
+       if (!OpenILS::Application::Ingest->in_transaction) {
+               OpenILS::Application::Ingest->begin_transaction($client) || throw OpenSRF::EX::PANIC ("Couldn't BEGIN transaction!");
+               $commit = 1;
+       }
+
+       my $success = 1;
+       try {
+               # clean up the cruft
+               unless ($self->api_name =~ /noscrub/o) {
+                       $self->method_lookup( 'open-ils.worm.scrub.authority' )->run( $rec ) || throw OpenSRF::EX::PANIC ("Couldn't scrub record $rec!");
+               }
+
+               # now redo 'em
+               my $bibs = OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.authority.record_entry.search.id.atomic', $rec );
+
+               my @full_rec = ();
+               my @rec_descriptor = ();
+               for my $r (@$bibs) {
+                       my $xml = $parser->parse_string($r->marc);
+
+                       # the full_rec stuff
+                       for my $fr ( $self->method_lookup( 'open-ils.worm.flat_marc.authority.xml' )->run( $xml ) ) {
+                               $fr->record( $r->id );
+                               push @full_rec, $fr;
+                       }
+
+                       # the rec_descriptor stuff -- XXX What does this mean for authority records?
+                       #my ($rd) = $self->method_lookup( 'open-ils.worm.authority_leader.xml' )->run( $xml );
+                       #$rd->record( $r->id );
+                       #push @rec_descriptor, $rd;
+                       
+               }
+
+               OpenILS::Application::Ingest->storage_req( 'open-ils.storage.savepoint.set', 'wormize_authority_record' );
+
+               #OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.authority.record_descriptor.batch.create', @rec_descriptor ) if (@rec_descriptor);
+               OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.authority.full_rec.batch.create', @full_rec ) if (@full_rec);
+
+               OpenILS::Application::Ingest->storage_req( 'open-ils.storage.savepoint.release', 'wormize_authority_record' );
+
+       } otherwise {
+               $log->debug('Wormization failed : '.shift(), ERROR);
+               OpenILS::Application::Ingest->storage_req( 'open-ils.storage.savepoint.rollback', 'wormize_authority_record' );
+               $success = 0;
+       };
+
+       OpenILS::Application::Ingest->commit_transaction if ($commit && $success);
+       OpenILS::Application::Ingest->rollback_transaction if ($commit && !$success);
+       return $success;
+}
+__PACKAGE__->register_method(
+       api_name        => "open-ils.worm.wormize.authority",
+       method          => "wormize_authority_record",
+       api_level       => 1,
+       argc            => 1,
+);
+__PACKAGE__->register_method(
+       api_name        => "open-ils.worm.wormize.authority.noscrub",
+       method          => "wormize_authority_record",
+       api_level       => 1,
+       argc            => 1,
+);
+
+
+# --------------------------------------------------------------------------------
+# MARC index extraction
+
+package OpenILS::Application::Ingest::XPATH;
+use base qw/OpenILS::Application::Ingest/;
+use Unicode::Normalize;
+
+# give this a MODS documentElement and an XPATH expression
+sub _xpath_to_string {
+       my $xml = shift;
+       my $xpath = shift;
+       my $ns_uri = shift;
+       my $ns_prefix = shift;
+       my $unique = shift;
+
+       $xml->setNamespace( $ns_uri, $ns_prefix, 1 ) if ($ns_uri && $ns_prefix);
+
+       my $string = "";
+
+       # grab the set of matching nodes
+       my @nodes = $xml->findnodes( $xpath );
+       for my $value (@nodes) {
+
+               # grab all children of the node
+               my @children = $value->childNodes();
+               for my $child (@children) {
+
+                       # add the childs content to the growing buffer
+                       my $content = quotemeta($child->textContent);
+                       next if ($unique && $string =~ /$content/);  # uniquify the values
+                       $string .= $child->textContent . " ";
+               }
+               if( ! @children ) {
+                       $string .= $value->textContent . " ";
+               }
+       }
+       return NFD($string);
+}
+
+sub class_all_index_string_xml {
+       my $self = shift;
+       my $client = shift;
+       my $xml = shift;
+       my $class = shift;
+
+       OpenILS::Application::Ingest->post_init();
+       $xml = $parser->parse_string($xml) unless (ref $xml);
+       
+       my $class_constructor = "Fieldmapper::metabib::${class}_field_entry";
+       for my $type ( keys %{ $xpathset->{$class} } ) {
+               my $value =  _xpath_to_string(
+                               $mods_sheet->transform($xml)->documentElement,
+                               $xpathset->{$class}->{$type}->{xpath},
+                               "http://www.loc.gov/mods/",
+                               "mods",
+                               1
+               );
+
+               next unless $value;
+
+               $value =~ s/\pM+//sgo;
+               $value =~ s/\pC+//sgo;
+               #$value =~ s/[\x{0080}-\x{fffd}]//sgoe;
+
+               $value =~ s/(\w)\./$1/sgo;
+               $value = lc($value);
+
+               my $fm = $class_constructor->new;
+               $fm->value( $value );
+               $fm->field( $xpathset->{$class}->{$type}->{id} );
+               $client->respond($fm);
+       }
+       return undef;
+}
+__PACKAGE__->register_method(  
+       api_name        => "open-ils.worm.field_entry.class.xml",
+       method          => "class_all_index_string_xml",
+       api_level       => 1,
+       argc            => 1,
+       stream          => 1,
+);                      
+
+sub class_all_index_string_record {
+       my $self = shift;
+       my $client = shift;
+       my $rec = shift;
+       my $class = shift;
+
+       OpenILS::Application::Ingest->post_init();
+       my $r = OpenILS::Application::Ingest->storage_req( "open-ils.storage.direct.biblio.record_entry.retrieve" => $rec );
+
+       for my $fm ($self->method_lookup("open-ils.worm.field_entry.class.xml")->run($r->marc, $class)) {
+               $fm->source($rec);
+               $client->respond($fm);
+       }
+       return undef;
+}
+__PACKAGE__->register_method(  
+       api_name        => "open-ils.worm.field_entry.class.record",
+       method          => "class_all_index_string_record",
+       api_level       => 1,
+       argc            => 1,
+       stream          => 1,
+);                      
+
+
+sub class_index_string_xml {
+       my $self = shift;
+       my $client = shift;
+       my $xml = shift;
+       my $class = shift;
+       my $type = shift;
+
+       OpenILS::Application::Ingest->post_init();
+       $xml = $parser->parse_string($xml) unless (ref $xml);
+       return _xpath_to_string( $mods_sheet->transform($xml)->documentElement, $xpathset->{$class}->{$type}->{xpath}, "http://www.loc.gov/mods/", "mods", 1 );
+}
+__PACKAGE__->register_method(  
+       api_name        => "open-ils.worm.class.type.xml",
+       method          => "class_index_string_xml",
+       api_level       => 1,
+       argc            => 1,
+);                      
+
+sub class_index_string_record {
+       my $self = shift;
+       my $client = shift;
+       my $rec = shift;
+       my $class = shift;
+       my $type = shift;
+
+       OpenILS::Application::Ingest->post_init();
+       my $r = OpenILS::Application::Ingest->storage_req( "open-ils.storage.direct.biblio.record_entry.retrieve" => $rec );
+
+       my ($d) = $self->method_lookup("open-ils.worm.class.type.xml")->run($r->marc, $class => $type);
+       $log->debug("XPath $class->$type for bib rec $rec returns ($d)", DEBUG);
+       return $d;
+}
+__PACKAGE__->register_method(  
+       api_name        => "open-ils.worm.class.type.record",
+       method          => "class_index_string_record",
+       api_level       => 1,
+       argc            => 1,
+);                      
+
+sub xml_xpath {
+       my $self = shift;
+       my $client = shift;
+       my $xml = shift;
+       my $xpath = shift;
+       my $uri = shift;
+       my $prefix = shift;
+       my $unique = shift;
+
+       OpenILS::Application::Ingest->post_init();
+       $xml = $parser->parse_string($xml) unless (ref $xml);
+       return _xpath_to_string( $xml->documentElement, $xpath, $uri, $prefix, $unique );
+}
+__PACKAGE__->register_method(  
+       api_name        => "open-ils.worm.xpath.xml",
+       method          => "xml_xpath",
+       api_level       => 1,
+       argc            => 1,
+);                      
+
+sub record_xpath {
+       my $self = shift;
+       my $client = shift;
+       my $rec = shift;
+       my $xpath = shift;
+       my $uri = shift;
+       my $prefix = shift;
+       my $unique = shift;
+
+       OpenILS::Application::Ingest->post_init();
+       my $r = OpenILS::Application::Ingest->storage_req( "open-ils.storage.direct.biblio.record_entry.retrieve" => $rec );
+
+       my ($d) = $self->method_lookup("open-ils.worm.xpath.xml")->run($r->marc, $xpath, $uri, $prefix, $unique );
+       $log->debug("XPath [$xpath] bib rec $rec returns ($d)", DEBUG);
+       return $d;
+}
+__PACKAGE__->register_method(  
+       api_name        => "open-ils.worm.xpath.record",
+       method          => "record_xpath",
+       api_level       => 1,
+       argc            => 1,
+);                      
+
+
+# --------------------------------------------------------------------------------
+# MARC Descriptor
+
+package OpenILS::Application::Ingest::Biblio::Leader;
+use base qw/OpenILS::Application::Ingest/;
+use Unicode::Normalize;
+
+our %marc_type_groups = (
+       BKS => q/[at]{1}/,
+       SER => q/[a]{1}/,
+       VIS => q/[gkro]{1}/,
+       MIX => q/[p]{1}/,
+       MAP => q/[ef]{1}/,
+       SCO => q/[cd]{1}/,
+       REC => q/[ij]{1}/,
+       COM => q/[m]{1}/,
+);
+
+sub _type_re {
+       my $re = '^'. join('|', $marc_type_groups{@_}) .'$';
+       return qr/$re/;
+}
+
+our %biblio_descriptor_code = (
+       item_type => sub { substr($ldr,6,1); },
+       item_form =>
+               sub {
+                       if (substr($ldr,6,1) =~ _type_re( qw/MAP VIS/ )) {
+                               return substr($oo8,29,1);
+                       } elsif (substr($ldr,6,1) =~ _type_re( qw/BKS SER MIX SCO REC/ )) {
+                               return substr($oo8,23,1);
+                       }
+                       return ' ';
+               },
+       bib_level => sub { substr($ldr,7,1); },
+       control_type => sub { substr($ldr,8,1); },
+       char_encoding => sub { substr($ldr,9,1); },
+       enc_level => sub { substr($ldr,17,1); },
+       cat_form => sub { substr($ldr,18,1); },
+       pub_status => sub { substr($ldr,5,1); },
+       item_lang => sub { substr($oo8,35,3); },
+       lit_form => sub { (substr($ldr,6,1) =~ _type_re('BKS')) ? substr($oo8,33,1) : undef; },
+       type_mat => sub { (substr($ldr,6,1) =~ _type_re('VIS')) ? substr($oo8,33,1) : undef; },
+       audience => sub { substr($oo8,22,1); },
+);
+
+sub _extract_biblio_descriptors {
+       my $xml = shift;
+
+       local $ldr = $xml->findvalue('//*[local-name()="leader"]');
+       local $oo8 = $xml->findvalue('//*[local-name()="controlfield" and @tag="008"]');
+       local $oo7 = $xml->findvalue('//*[local-name()="controlfield" and @tag="007"]');
+
+       my $rd_obj = Fieldmapper::metabib::record_descriptor->new;
+       for my $rd_field ( keys %biblio_descriptor_code ) {
+               $rd_obj->$rd_field( $biblio_descriptor_code{$rd_field}->() );
+       }
+
+       return $rd_obj;
+}
+
+sub extract_biblio_desc_xml {
+       my $self = shift;
+       my $client = shift;
+       my $xml = shift;
+
+       $xml = $parser->parse_string($xml) unless (ref $xml);
+
+       return _extract_biblio_descriptors( $xml );
+}
+__PACKAGE__->register_method(  
+       api_name        => "open-ils.worm.biblio_leader.xml",
+       method          => "extract_biblio_desc_xml",
+       api_level       => 1,
+       argc            => 1,
+);                      
+
+sub extract_biblio_desc_record {
+       my $self = shift;
+       my $client = shift;
+       my $rec = shift;
+
+       OpenILS::Application::Ingest->post_init();
+       my $r = OpenILS::Application::Ingest->storage_req( "open-ils.storage.direct.biblio.record_entry.retrieve" => $rec );
+
+       my ($d) = $self->method_lookup("open-ils.worm.biblio_leader.xml")->run($r->marc);
+       $log->debug("Record descriptor for bib rec $rec is ".JSON->perl2JSON($d), DEBUG);
+       return $d;
+}
+__PACKAGE__->register_method(  
+       api_name        => "open-ils.worm.biblio_leader.record",
+       method          => "extract_biblio_desc_record",
+       api_level       => 1,
+       argc            => 1,
+);                      
+
+# --------------------------------------------------------------------------------
+# Flat MARC
+
+package OpenILS::Application::Ingest::FlatMARC;
+use base qw/OpenILS::Application::Ingest/;
+use Unicode::Normalize;
+
+
+sub _marcxml_to_full_rows {
+
+       my $marcxml = shift;
+       my $xmltype = shift || 'metabib';
+
+       my $type = "Fieldmapper::${xmltype}::full_rec";
+
+       my @ns_list;
+       
+       my ($root) = $marcxml->findnodes('//*[local-name()="record"]');
+
+       for my $tagline ( @{$root->getChildrenByTagName("leader")} ) {
+               next unless $tagline;
+
+               my $ns = $type->new;
+
+               $ns->tag( 'LDR' );
+               my $val = $tagline->textContent;
+               $val = NFD($val);
+               $val =~ s/(\pM+)//gso;
+               $ns->value( $val );
+
+               push @ns_list, $ns;
+       }
+
+       for my $tagline ( @{$root->getChildrenByTagName("controlfield")} ) {
+               next unless $tagline;
+
+               my $ns = $type->new;
+
+               $ns->tag( $tagline->getAttribute( "tag" ) );
+               my $val = $tagline->textContent;
+               $val = NFD($val);
+               $val =~ s/(\pM+)//gso;
+               $ns->value( $val );
+
+               push @ns_list, $ns;
+       }
+
+       for my $tagline ( @{$root->getChildrenByTagName("datafield")} ) {
+               next unless $tagline;
+
+               my $tag = $tagline->getAttribute( "tag" );
+               my $ind1 = $tagline->getAttribute( "ind1" );
+               my $ind2 = $tagline->getAttribute( "ind2" );
+
+               for my $data ( @{$tagline->getChildrenByTagName('subfield')} ) {
+                       next unless $data;
+
+                       my $ns = $type->new;
+
+                       $ns->tag( $tag );
+                       $ns->ind1( $ind1 );
+                       $ns->ind2( $ind2 );
+                       $ns->subfield( $data->getAttribute( "code" ) );
+                       my $val = $data->textContent;
+                       $val = NFD($val);
+                       $val =~ s/(\pM+)//gso;
+                       $ns->value( lc($val) );
+
+                       push @ns_list, $ns;
+               }
+       }
+
+       $log->debug("Returning ".scalar(@ns_list)." Fieldmapper nodes from $xmltype xml", DEBUG);
+       return @ns_list;
+}
+
+sub flat_marc_xml {
+       my $self = shift;
+       my $client = shift;
+       my $xml = shift;
+
+       $xml = $parser->parse_string($xml) unless (ref $xml);
+
+       my $type = 'metabib';
+       $type = 'authority' if ($self->api_name =~ /authority/o);
+
+       OpenILS::Application::Ingest->post_init();
+
+       $client->respond($_) for (_marcxml_to_full_rows($xml, $type));
+       return undef;
+}
+__PACKAGE__->register_method(  
+       api_name        => "open-ils.worm.flat_marc.authority.xml",
+       method          => "flat_marc_xml",
+       api_level       => 1,
+       argc            => 1,
+       stream          => 1,
+);                      
+__PACKAGE__->register_method(  
+       api_name        => "open-ils.worm.flat_marc.biblio.xml",
+       method          => "flat_marc_xml",
+       api_level       => 1,
+       argc            => 1,
+       stream          => 1,
+);                      
+
+sub flat_marc_record {
+       my $self = shift;
+       my $client = shift;
+       my $rec = shift;
+
+       my $type = 'biblio';
+       $type = 'authority' if ($self->api_name =~ /authority/o);
+
+       OpenILS::Application::Ingest->post_init();
+       my $r = OpenILS::Application::Ingest->storage_req( "open-ils.storage.direct.${type}.record_entry.retrieve" => $rec );
+
+       $client->respond($_) for ($self->method_lookup("open-ils.worm.flat_marc.$type.xml")->run($r->marc));
+       return undef;
+}
+__PACKAGE__->register_method(  
+       api_name        => "open-ils.worm.flat_marc.biblio.record_entry",
+       method          => "flat_marc_record",
+       api_level       => 1,
+       argc            => 1,
+       stream          => 1,
+);                      
+__PACKAGE__->register_method(  
+       api_name        => "open-ils.worm.flat_marc.authority.record_entry",
+       method          => "flat_marc_record",
+       api_level       => 1,
+       argc            => 1,
+       stream          => 1,
+);                      
+
+
+# --------------------------------------------------------------------------------
+# Fingerprinting
+
+package OpenILS::Application::Ingest::Biblio::Fingerprint;
+use base qw/OpenILS::Application::Ingest/;
+use Unicode::Normalize;
+use OpenSRF::EX qw/:try/;
+
+my @fp_mods_xpath = (
+       '//mods:mods/mods:typeOfResource[text()="text"]' => [
+                       title   => {
+                                       xpath   => [
+                                                       '//mods:mods/mods:titleInfo[mods:title and (@type="uniform")]',
+                                                       '//mods:mods/mods:titleInfo[mods:title and (@type="translated")]',
+                                                       '//mods:mods/mods:titleInfo[mods:title and (@type="alternative")]',
+                                                       '//mods:mods/mods:titleInfo[mods:title and not(@type)]',
+                                       ],
+                                       fixup   => sub {
+                                                       $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
+                                                       $text = NFD($text);
+                                                       $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
+                                                       $text =~ s/\pM+//gso;
+                                                       $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
+                                                       $text = lc($text);
+                                                       $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
+                                                       $text =~ s/\s+/ /sgo;
+                                                       $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
+                                                       $text =~ s/^\s*(.+)\s*$/$1/sgo;
+                                                       $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
+                                                       $text =~ s/\b(?:the|an?)\b//sgo;
+                                                       $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
+                                                       $text =~ s/\[.[^\]]+\]//sgo;
+                                                       $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
+                                                       $text =~ s/\s*[;\/\.]*$//sgo;
+                                                       $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
+                                               },
+                       },
+                       author  => {
+                                       xpath   => [
+                                                       '//mods:mods/mods:name[mods:role/mods:text/text()="creator" and @type="personal"]/mods:namePart',
+                                                       '//mods:mods/mods:name[mods:role/mods:text/text()="creator"]/mods:namePart',
+                                       ],
+                                       fixup   => sub {
+                                                       $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
+                                                       $text = NFD($text);
+                                                       $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
+                                                       $text =~ s/\pM+//gso;
+                                                       $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
+                                                       $text = lc($text);
+                                                       $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
+                                                       $text =~ s/\s+/ /sgo;
+                                                       $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
+                                                       $text =~ s/^\s*(.+)\s*$/$1/sgo;
+                                                       $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
+                                                       $text =~ s/,?\s+.*$//sgo;
+                                                       $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
+                                               },
+                       },
+       ],
+
+       '//mods:mods/mods:relatedItem[@type!="host" and @type!="series"]' => [
+                       title   => {
+                                       xpath   => [
+                                                       '//mods:mods/mods:relatedItem/mods:titleInfo[mods:title and (@type="uniform")]',
+                                                       '//mods:mods/mods:relatedItem/mods:titleInfo[mods:title and (@type="translated")]',
+                                                       '//mods:mods/mods:relatedItem/mods:titleInfo[mods:title and (@type="alternative")]',
+                                                       '//mods:mods/mods:relatedItem/mods:titleInfo[mods:title and not(@type)]',
+                                                       '//mods:mods/mods:titleInfo[mods:title and (@type="uniform")]',
+                                                       '//mods:mods/mods:titleInfo[mods:title and (@type="translated")]',
+                                                       '//mods:mods/mods:titleInfo[mods:title and (@type="alternative")]',
+                                                       '//mods:mods/mods:titleInfo[mods:title and not(@type)]',
+                                       ],
+                                       fixup   => sub {
+                                                       $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
+                                                       $text = NFD($text);
+                                                       $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
+                                                       $text =~ s/\pM+//gso;
+                                                       $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
+                                                       $text = lc($text);
+                                                       $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
+                                                       $text =~ s/\s+/ /sgo;
+                                                       $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
+                                                       $text =~ s/^\s*(.+)\s*$/$1/sgo;
+                                                       $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
+                                                       $text =~ s/\b(?:the|an?)\b//sgo;
+                                                       $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
+                                                       $text =~ s/\[.[^\]]+\]//sgo;
+                                                       $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
+                                                       $text =~ s/\s*[;\/\.]*$//sgo;
+                                                       $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
+                                               },
+                       },
+                       author  => {
+                                       xpath   => [
+                                                       '//mods:mods/mods:relatedItem/mods:name[mods:role/mods:text/text()="creator" and @type="personal"]/mods:namePart',
+                                                       '//mods:mods/mods:relatedItem/mods:name[mods:role/mods:text/text()="creator"]/mods:namePart',
+                                                       '//mods:mods/mods:name[mods:role/mods:text/text()="creator" and @type="personal"]/mods:namePart',
+                                                       '//mods:mods/mods:name[mods:role/mods:text/text()="creator"]/mods:namePart',
+                                       ],
+                                       fixup   => sub {
+                                                       $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
+                                                       $text = NFD($text);
+                                                       $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
+                                                       $text =~ s/\pM+//gso;
+                                                       $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
+                                                       $text = lc($text);
+                                                       $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
+                                                       $text =~ s/\s+/ /sgo;
+                                                       $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
+                                                       $text =~ s/^\s*(.+)\s*$/$1/sgo;
+                                                       $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
+                                                       $text =~ s/,?\s+.*$//sgo;
+                                                       $log->debug("Fingerprint text /durring/ fixup : [$text]", INTERNAL);
+                                               },
+                       },
+       ],
+
+);
+
+push @fp_mods_xpath, '//mods:mods/mods:titleInfo' => $fp_mods_xpath[1];
+
+sub _fp_mods {
+       my $mods = shift;
+       $mods->setNamespace( "http://www.loc.gov/mods/", "mods", 1 );
+
+       my $fp_string = '';
+
+       my $match_index = 0;
+       my $block_index = 1;
+       while ( my $match_xpath = $fp_mods_xpath[$match_index] ) {
+               if ( my @nodes = $mods->findnodes( $match_xpath ) ) {
+
+                       my $block_name_index = 0;
+                       my $block_value_index = 1;
+                       my $block = $fp_mods_xpath[$block_index];
+                       while ( my $part = $$block[$block_value_index] ) {
+                               local $text;
+                               for my $xpath ( @{ $part->{xpath} } ) {
+                                       $text = $mods->findvalue( $xpath );
+                                       last if ($text);
+                               }
+
+                               $log->debug("Found fingerprint text using $$block[$block_name_index] : [$text]", DEBUG);
+
+                               if ($text) {
+                                       $$part{fixup}->();
+                                       $log->debug("Fingerprint text after fixup : [$text]", DEBUG);
+                                       $fp_string .= $text;
+                               }
+
+                               $block_name_index += 2;
+                               $block_value_index += 2;
+                       }
+               }
+               if ($fp_string) {
+                       $fp_string =~ s/\W+//gso;
+                       $log->debug("Fingerprint is [$fp_string]", INFO);;
+                       return $fp_string;
+               }
+
+               $match_index += 2;
+               $block_index += 2;
+       }
+       return undef;
+}
+
+sub refingerprint_bibrec {
+       my $self = shift;
+       my $client = shift;
+       my $rec = shift;
+
+       my $commit = 0;
+       if (!OpenILS::Application::Ingest->in_transaction) {
+               OpenILS::Application::Ingest->begin_transaction($client) || throw OpenSRF::EX::PANIC ("Couldn't BEGIN transaction!");
+               $commit = 1;
+       }
+
+       my $success = 1;
+       try {
+               my $bibs = OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.biblio.record_entry.search.id.atomic', $rec );
+               for my $b (@$bibs) {
+                       my ($fp) = $self->method_lookup( 'open-ils.worm.fingerprint.marc' )->run( $b->marc );
+
+                       if ($b->fingerprint ne $fp->{fingerprint} || $b->quality != $fp->{quality}) {
+
+                               $log->debug("Updating ".$b->id." with fingerprint [$fp->{fingerprint}], quality [$fp->{quality}]", INFO);;
+
+                               OpenILS::Application::Ingest->storage_req(
+                                       'open-ils.storage.direct.biblio.record_entry.remote_update',
+                                       { id => $b->id },
+                                       { fingerprint => $fp->{fingerprint},
+                                         quality     => $fp->{quality} }
+                               );
+
+                               if ($self->api_name !~ /nomap/o) {
+                                       my $old_source_map = OpenILS::Application::Ingest->storage_req(
+                                               'open-ils.storage.direct.metabib.metarecord_source_map.search.source.atomic',
+                                               $b->id
+                                       );
+
+                                       my $old_mrid;
+                                       if (ref($old_source_map) and @$old_source_map) {
+                                               for my $m (@$old_source_map) {
+                                                       $old_mrid = $m->metarecord;
+                                                       OpenILS::Application::Ingest->storage_req(
+                                                               'open-ils.storage.direct.metabib.metarecord_source_map.delete',
+                                                               $m->id
+                                                       );
+                                               }
+                                       }
+
+                                       my $old_sm = OpenILS::Application::Ingest->storage_req(
+                                                       'open-ils.storage.direct.metabib.metarecord_source_map.search.atomic',
+                                                       { metarecord => $old_mrid }
+                                       ) if ($old_mrid);
+
+                                       if (ref($old_sm) and @$old_sm == 0) {
+                                               OpenILS::Application::Ingest->storage_req(
+                                                       'open-ils.storage.direct.metabib.metarecord.delete',
+                                                       $old_mrid
+                                               );
+                                       }
+
+                                       my $mr = OpenILS::Application::Ingest->storage_req(
+                                                       'open-ils.storage.direct.metabib.metarecord.search.fingerprint.atomic',
+                                                       { fingerprint => $fp->{fingerprint} }
+                                       )->[0];
+                               
+                                       unless ($mr) {
+                                               $mr = Fieldmapper::metabib::metarecord->new;
+                                               $mr->fingerprint( $fp->{fingerprint} );
+                                               $mr->master_record( $b->id );
+                                               $mr->id( OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.metabib.metarecord.create', $mr) );
+                                       }
+
+                                       my $mr_map = Fieldmapper::metabib::metarecord_source_map->new;
+                                       $mr_map->metarecord( $mr->id );
+                                       $mr_map->source( $b->id );
+                                       OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.metabib.metarecord_source_map.create', $mr_map );
+
+                               }
+                       }
+                       $client->respond($b->id);
+               }
+
+       } otherwise {
+               $log->debug('Fingerprinting failed : '.shift(), ERROR);
+               $success = 0;
+       };
+
+       OpenILS::Application::Ingest->commit_transaction if ($commit && $success);
+       OpenILS::Application::Ingest->rollback_transaction if ($commit && !$success);
+       return undef;
+}
+__PACKAGE__->register_method(  
+       api_name        => "open-ils.worm.fingerprint.record.update",
+       method          => "refingerprint_bibrec",
+       api_level       => 1,
+       argc            => 1,
+       stream          => 1,
+);                      
+
+__PACKAGE__->register_method(  
+       api_name        => "open-ils.worm.fingerprint.record.update.nomap",
+       method          => "refingerprint_bibrec",
+       api_level       => 1,
+       argc            => 1,
+);                      
+
+=comment
+
+sub fingerprint_bibrec {
+       my $self = shift;
+       my $client = shift;
+       my $rec = shift;
+
+       OpenILS::Application::Ingest->post_init();
+       my $r = OpenILS::Application::Ingest->storage_req( 'open-ils.storage.direct.biblio.record_entry.retrieve' => $rec );
+
+       my ($fp) = $self->method_lookup('open-ils.worm.fingerprint.marc')->run($r->marc);
+       $log->debug("Returning [$fp] as fingerprint for record $rec", INFO);
+       return $fp;
+
+}
+__PACKAGE__->register_method(  
+       api_name        => "open-ils.worm.fingerprint.record",
+       method          => "fingerprint_bibrec",
+       api_level       => 0,
+       argc            => 1,
+);                      
+
+
+sub fingerprint_mods {
+       my $self = shift;
+       my $client = shift;
+       my $xml = shift;
+
+       OpenILS::Application::Ingest->post_init();
+       my $mods = $parser->parse_string($xml)->documentElement;
+
+       return _fp_mods( $mods );
+}
+__PACKAGE__->register_method(  
+       api_name        => "open-ils.worm.fingerprint.mods",
+       method          => "fingerprint_mods",
+       api_level       => 1,
+       argc            => 1,
+);                      
+
+sub fingerprint_marc {
+       my $self = shift;
+       my $client = shift;
+       my $xml = shift;
+
+       $xml = $parser->parse_string($xml) unless (ref $xml);
+
+       OpenILS::Application::Ingest->post_init();
+       my $fp = _fp_mods( $mods_sheet->transform($xml)->documentElement );
+       $log->debug("Returning [$fp] as fingerprint", INFO);
+       return $fp;
+}
+__PACKAGE__->register_method(  
+       api_name        => "open-ils.worm.fingerprint.marc",
+       method          => "fingerprint_marc",
+       api_level       => 1,
+       argc            => 1,
+);                      
+
+
+=cut
+
+sub biblio_fingerprint_record {
+       my $self = shift;
+       my $client = shift;
+       my $rec = shift;
+
+       OpenILS::Application::Ingest->post_init();
+
+       my $marc = OpenILS::Application::Ingest
+                       ->storage_req( 'open-ils.storage.direct.biblio.record_entry.retrieve' => $rec )
+                       ->marc;
+
+       my ($fp) = $self->method_lookup('open-ils.worm.fingerprint.marc')->run($marc);
+       $log->debug("Returning [$fp] as fingerprint for record $rec", INFO);
+       return $fp;
+}
+__PACKAGE__->register_method(  
+       api_name        => "open-ils.worm.fingerprint.record",
+       method          => "biblio_fingerprint_record",
+       api_level       => 1,
+       argc            => 1,
+);                      
+
+our $fp_script;
+sub biblio_fingerprint {
+       my $self = shift;
+       my $client = shift;
+       my $marc = shift;
+
+       OpenILS::Application::Ingest->post_init();
+
+       $marc = $parser->parse_string($marc) unless (ref $marc);
+
+       my $mods = OpenILS::Application::Ingest::entityize(
+               $mods_sheet
+                       ->transform( $marc )
+                       ->documentElement
+                       ->toString,
+               'D'
+       );
+
+       $marc = OpenILS::Application::Ingest::entityize( $marc->documentElement->toString => 'D' );
+
+       warn $marc;
+       $log->internal("Got MARC [$marc]");
+       $log->internal("Created MODS [$mods]");
+
+       if(!$fp_script) {
+               my @pfx = ( "apps", "open-ils.storage","app_settings" );
+               my $conf = OpenSRF::Utils::SettingsClient->new;
+
+               my $libs        = $conf->config_value(@pfx, 'script_path');
+               my $script_file = $conf->config_value(@pfx, 'scripts', 'biblio_fingerprint');
+               my $script_libs = (ref($libs)) ? $libs : [$libs];
+
+               $log->debug("Loading script $script_file for biblio fingerprinting...");
+               
+               $fp_script = new OpenILS::Utils::ScriptRunner
+                       ( file          => $script_file,
+                         paths         => $script_libs,
+                         reset_count   => 1000 );
+       }
+
+       $log->debug("Applying environment for biblio fingerprinting...");
+
+       my $env = {marc => $marc, mods => $mods};
+       #my $res = {fingerprint => '', quality => '0'};
+
+       $fp_script->insert('environment' => $env);
+       #$fp_script->insert('result' => $res);
+
+       $log->debug("Running script for biblio fingerprinting...");
+
+       my $res = $fp_script->run || ($log->error( "Fingerprint script died!  $@" ) && return 0);
+
+       $log->debug("Script for biblio fingerprinting completed successfully...");
+
+       return $res;
+}
+__PACKAGE__->register_method(  
+       api_name        => "open-ils.worm.fingerprint.marc",
+       method          => "biblio_fingerprint",
+       api_level       => 1,
+       argc            => 1,
+);                      
+
+# --------------------------------------------------------------------------------
+
+1;
+
+__END__
+my $in_xact;
+my $begin;
+my $commit;
+my $rollback;
+my $lookup;
+my $update_entry;
+my $mr_lookup;
+my $mr_update;
+my $mr_create;
+my $create_source_map;
+my $sm_lookup;
+my $rm_old_rd;
+my $rm_old_sm;
+my $rm_old_fr;
+my $rm_old_tr;
+my $rm_old_ar;
+my $rm_old_sr;
+my $rm_old_kr;
+my $rm_old_ser;
+
+my $fr_create;
+my $rd_create;
+my $create = {};
+
+my %descriptor_code = (
+       item_type => 'substr($ldr,6,1)',
+       item_form => '(substr($ldr,6,1) =~ /^(?:f|g|i|m|o|p|r)$/) ? substr($oo8,29,1) : substr($oo8,23,1)',
+       bib_level => 'substr($ldr,7,1)',
+       control_type => 'substr($ldr,8,1)',
+       char_encoding => 'substr($ldr,9,1)',
+       enc_level => 'substr($ldr,17,1)',
+       cat_form => 'substr($ldr,18,1)',
+       pub_status => 'substr($ldr,5,1)',
+       item_lang => 'substr($oo8,35,3)',
+       #lit_form => '(substr($ldr,6,1) =~ /^(?:f|g|i|m|o|p|r)$/) ? substr($oo8,33,1) : "0"',
+       audience => 'substr($oo8,22,1)',
+);
+
+sub wormize {
+
+       my $self = shift;
+       my $client = shift;
+       my @docids = @_;
+
+       my $no_map = 0;
+       if ($self->api_name =~ /no_map/o) {
+               $no_map = 1;
+       }
+
+       $in_xact = $self->method_lookup( 'open-ils.storage.transaction.current')
+               unless ($in_xact);
+       $begin = $self->method_lookup( 'open-ils.storage.transaction.begin')
+               unless ($begin);
+       $commit = $self->method_lookup( 'open-ils.storage.transaction.commit')
+               unless ($commit);
+       $rollback = $self->method_lookup( 'open-ils.storage.transaction.rollback')
+               unless ($rollback);
+       $sm_lookup = $self->method_lookup('open-ils.storage.direct.metabib.metarecord_source_map.search.source')
+               unless ($sm_lookup);
+       $mr_lookup = $self->method_lookup('open-ils.storage.direct.metabib.metarecord.search.fingerprint')
+               unless ($mr_lookup);
+       $mr_update = $self->method_lookup('open-ils.storage.direct.metabib.metarecord.batch.update')
+               unless ($mr_update);
+       $lookup = $self->method_lookup('open-ils.storage.direct.biblio.record_entry.batch.retrieve')
+               unless ($lookup);
+       $update_entry = $self->method_lookup('open-ils.storage.direct.biblio.record_entry.batch.update')
+               unless ($update_entry);
+       $rm_old_sm = $self->method_lookup( 'open-ils.storage.direct.metabib.metarecord_source_map.mass_delete')
+               unless ($rm_old_sm);
+       $rm_old_rd = $self->method_lookup( 'open-ils.storage.direct.metabib.record_descriptor.mass_delete')
+               unless ($rm_old_rd);
+       $rm_old_fr = $self->method_lookup( 'open-ils.storage.direct.metabib.full_rec.mass_delete')
+               unless ($rm_old_fr);
+       $rm_old_tr = $self->method_lookup( 'open-ils.storage.direct.metabib.title_field_entry.mass_delete')
+               unless ($rm_old_tr);
+       $rm_old_ar = $self->method_lookup( 'open-ils.storage.direct.metabib.author_field_entry.mass_delete')
+               unless ($rm_old_ar);
+       $rm_old_sr = $self->method_lookup( 'open-ils.storage.direct.metabib.subject_field_entry.mass_delete')
+               unless ($rm_old_sr);
+       $rm_old_kr = $self->method_lookup( 'open-ils.storage.direct.metabib.keyword_field_entry.mass_delete')
+               unless ($rm_old_kr);
+       $rm_old_ser = $self->method_lookup( 'open-ils.storage.direct.metabib.series_field_entry.mass_delete')
+               unless ($rm_old_ser);
+       $mr_create = $self->method_lookup('open-ils.storage.direct.metabib.metarecord.create')
+               unless ($mr_create);
+       $create_source_map = $self->method_lookup('open-ils.storage.direct.metabib.metarecord_source_map.batch.create')
+               unless ($create_source_map);
+       $rd_create = $self->method_lookup( 'open-ils.storage.direct.metabib.record_descriptor.batch.create')
+               unless ($rd_create);
+       $fr_create = $self->method_lookup( 'open-ils.storage.direct.metabib.full_rec.batch.create')
+               unless ($fr_create);
+       $$create{title} = $self->method_lookup( 'open-ils.storage.direct.metabib.title_field_entry.batch.create')
+               unless ($$create{title});
+       $$create{author} = $self->method_lookup( 'open-ils.storage.direct.metabib.author_field_entry.batch.create')
+               unless ($$create{author});
+       $$create{subject} = $self->method_lookup( 'open-ils.storage.direct.metabib.subject_field_entry.batch.create')
+               unless ($$create{subject});
+       $$create{keyword} = $self->method_lookup( 'open-ils.storage.direct.metabib.keyword_field_entry.batch.create')
+               unless ($$create{keyword});
+       $$create{series} = $self->method_lookup( 'open-ils.storage.direct.metabib.series_field_entry.batch.create')
+               unless ($$create{series});
+
+
+       my ($outer_xact) = $in_xact->run;
+       try {
+               unless ($outer_xact) {
+                       $log->debug("Ingest isn't inside a transaction, starting one now.", INFO);
+                       my ($r) = $begin->run($client);
+                       unless (defined $r and $r) {
+                               $rollback->run;
+                               throw OpenSRF::EX::PANIC ("Couldn't BEGIN transaction!")
+                       }
+               }
+       } catch Error with {
+               throw OpenSRF::EX::PANIC ("Ingest Couldn't BEGIN transaction!")
+       };
+
+       my @source_maps;
+       my @entry_list;
+       my @mr_list;
+       my @rd_list;
+       my @ns_list;
+       my @mods_data;
+       my $ret = 0;
+       for my $entry ( $lookup->run(@docids) ) {
+               # step -1: grab the doc from storage
+               next unless ($entry);
+
+               if(!$mods_sheet) {
+                       my $xslt_doc = $parser->parse_file(
+                               OpenSRF::Utils::SettingsClient->new->config_value(dirs => 'xsl') .  "/MARC21slim2MODS.xsl");
+                       $mods_sheet = $xslt->parse_stylesheet( $xslt_doc );
+               }
+
+               my $xml = $entry->marc;
+               my $docid = $entry->id;
+               my $marcdoc = $parser->parse_string($xml);
+               my $modsdoc = $mods_sheet->transform($marcdoc);
+
+               my $mods = $modsdoc->documentElement;
+               $mods->setNamespace( "http://www.loc.gov/mods/", "mods", 1 );
+
+               $entry->fingerprint( fingerprint_mods( $mods ) );
+               push @entry_list, $entry;
+
+               $log->debug("Fingerprint for Record Entry ".$docid." is [".$entry->fingerprint."]", INFO);
+
+               unless ($no_map) {
+                       my ($mr) = $mr_lookup->run( $entry->fingerprint );
+                       if (!$mr || !@$mr) {
+                               $log->debug("No metarecord found for fingerprint [".$entry->fingerprint."]; Creating a new one", INFO);
+                               $mr = new Fieldmapper::metabib::metarecord;
+                               $mr->fingerprint( $entry->fingerprint );
+                               $mr->master_record( $entry->id );
+                               my ($new_mr) = $mr_create->run($mr);
+                               $mr->id($new_mr);
+                               unless (defined $mr) {
+                                       throw OpenSRF::EX::PANIC ("Couldn't run open-ils.storage.direct.metabib.metarecord.create!")
+                               }
+                       } else {
+                               $log->debug("Retrieved metarecord, id is ".$mr->id, INFO);
+                               $mr->mods('');
+                               push @mr_list, $mr;
+                       }
+
+                       my $sm = new Fieldmapper::metabib::metarecord_source_map;
+                       $sm->metarecord( $mr->id );
+                       $sm->source( $entry->id );
+                       push @source_maps, $sm;
+               }
+
+               my $ldr = $marcdoc->documentElement->getChildrenByTagName('leader')->pop->textContent;
+               my $oo8 = $marcdoc->documentElement->findvalue('//*[local-name()="controlfield" and @tag="008"]');
+
+               my $rd_obj = Fieldmapper::metabib::record_descriptor->new;
+               for my $rd_field ( keys %descriptor_code ) {
+                       $rd_obj->$rd_field( eval "$descriptor_code{$rd_field};" );
+               }
+               $rd_obj->record( $docid );
+               push @rd_list, $rd_obj;
+
+               push @mods_data, { $docid => $self->modsdoc_to_values( $mods ) };
+
+               # step 2: build the KOHA rows
+               my @tmp_list = _marcxml_to_full_rows( $marcdoc );
+               $_->record( $docid ) for (@tmp_list);
+               push @ns_list, @tmp_list;
+
+               $ret++;
+
+               last unless ($self->api_name =~ /batch$/o);
+       }
+
+       $rm_old_rd->run( { record => \@docids } );
+       $rm_old_fr->run( { record => \@docids } );
+       $rm_old_sm->run( { source => \@docids } ) unless ($no_map);
+       $rm_old_tr->run( { source => \@docids } );
+       $rm_old_ar->run( { source => \@docids } );
+       $rm_old_sr->run( { source => \@docids } );
+       $rm_old_kr->run( { source => \@docids } );
+       $rm_old_ser->run( { source => \@docids } );
+
+       unless ($no_map) {
+               my ($sm) = $create_source_map->run(@source_maps);
+               unless (defined $sm) {
+                       throw OpenSRF::EX::PANIC ("Couldn't run open-ils.storage.direct.metabib.metarecord_source_map.batch.create!")
+               }
+               my ($mr) = $mr_update->run(@mr_list);
+               unless (defined $mr) {
+                       throw OpenSRF::EX::PANIC ("Couldn't run open-ils.storage.direct.metabib.metarecord.batch.update!")
+               }
+       }
+
+       my ($re) = $update_entry->run(@entry_list);
+       unless (defined $re) {
+               throw OpenSRF::EX::PANIC ("Couldn't run open-ils.storage.direct.biblio.record_entry.batch.update!")
+       }
+
+       my ($rd) = $rd_create->run(@rd_list);
+       unless (defined $rd) {
+               throw OpenSRF::EX::PANIC ("Couldn't run open-ils.storage.direct.metabib.record_descriptor.batch.create!")
+       }
+
+       my ($fr) = $fr_create->run(@ns_list);
+       unless (defined $fr) {
+               throw OpenSRF::EX::PANIC ("Couldn't run open-ils.storage.direct.metabib.full_rec.batch.create!")
+       }
+
+       # step 5: insert the new metadata
+       for my $class ( qw/title author subject keyword series/ ) {
+               my @md_list = ();
+               for my $doc ( @mods_data ) {
+                       my ($did) = keys %$doc;
+                       my ($data) = values %$doc;
+
+                       my $fm_constructor = "Fieldmapper::metabib::${class}_field_entry";
+                       for my $row ( keys %{ $$data{$class} } ) {
+                               next unless (exists $$data{$class}{$row});
+                               next unless ($$data{$class}{$row}{value});
+                               my $fm_obj = $fm_constructor->new;
+                               $fm_obj->value( $$data{$class}{$row}{value} );
+                               $fm_obj->field( $$data{$class}{$row}{field_id} );
+                               $fm_obj->source( $did );
+                               $log->debug("$class entry: ".$fm_obj->source." => ".$fm_obj->field." : ".$fm_obj->value, DEBUG);
+
+                               push @md_list, $fm_obj;
+                       }
+               }
+                       
+               my ($cr) = $$create{$class}->run(@md_list);
+               unless (defined $cr) {
+                       throw OpenSRF::EX::PANIC ("Couldn't run open-ils.storage.direct.metabib.${class}_field_entry.batch.create!")
+               }
+       }
+
+       unless ($outer_xact) {
+               $log->debug("Commiting transaction started by the Ingest.", INFO);
+               my ($c) = $commit->run;
+               unless (defined $c and $c) {
+                       $rollback->run;
+                       throw OpenSRF::EX::PANIC ("Couldn't COMMIT changes!")
+               }
+       }
+
+       return $ret;
+}
+__PACKAGE__->register_method( 
+       api_name        => "open-ils.worm.wormize",
+       method          => "wormize",
+       api_level       => 1,
+       argc            => 1,
+);
+__PACKAGE__->register_method( 
+       api_name        => "open-ils.worm.wormize.no_map",
+       method          => "wormize",
+       api_level       => 1,
+       argc            => 1,
+);
+__PACKAGE__->register_method( 
+       api_name        => "open-ils.worm.wormize.batch",
+       method          => "wormize",
+       api_level       => 1,
+       argc            => 1,
+);
+__PACKAGE__->register_method( 
+       api_name        => "open-ils.worm.wormize.no_map.batch",
+       method          => "wormize",
+       api_level       => 1,
+       argc            => 1,
+);
+
+
+my $ain_xact;
+my $abegin;
+my $acommit;
+my $arollback;
+my $alookup;
+my $aupdate_entry;
+my $amr_lookup;
+my $amr_update;
+my $amr_create;
+my $acreate_source_map;
+my $asm_lookup;
+my $arm_old_rd;
+my $arm_old_sm;
+my $arm_old_fr;
+my $arm_old_tr;
+my $arm_old_ar;
+my $arm_old_sr;
+my $arm_old_kr;
+my $arm_old_ser;
+
+my $afr_create;
+my $ard_create;
+my $acreate = {};
+
+sub authority_wormize {
+
+       my $self = shift;
+       my $client = shift;
+       my @docids = @_;
+
+       my $no_map = 0;
+       if ($self->api_name =~ /no_map/o) {
+               $no_map = 1;
+       }
+
+       $in_xact = $self->method_lookup( 'open-ils.storage.transaction.current')
+               unless ($in_xact);
+       $begin = $self->method_lookup( 'open-ils.storage.transaction.begin')
+               unless ($begin);
+       $commit = $self->method_lookup( 'open-ils.storage.transaction.commit')
+               unless ($commit);
+       $rollback = $self->method_lookup( 'open-ils.storage.transaction.rollback')
+               unless ($rollback);
+       $alookup = $self->method_lookup('open-ils.storage.direct.authority.record_entry.batch.retrieve')
+               unless ($alookup);
+       $aupdate_entry = $self->method_lookup('open-ils.storage.direct.authority.record_entry.batch.update')
+               unless ($aupdate_entry);
+       $arm_old_rd = $self->method_lookup( 'open-ils.storage.direct.authority.record_descriptor.mass_delete')
+               unless ($arm_old_rd);
+       $arm_old_fr = $self->method_lookup( 'open-ils.storage.direct.authority.full_rec.mass_delete')
+               unless ($arm_old_fr);
+       $ard_create = $self->method_lookup( 'open-ils.storage.direct.authority.record_descriptor.batch.create')
+               unless ($ard_create);
+       $afr_create = $self->method_lookup( 'open-ils.storage.direct.authority.full_rec.batch.create')
+               unless ($afr_create);
+
+
+       my ($outer_xact) = $in_xact->run;
+       try {
+               unless ($outer_xact) {
+                       $log->debug("Ingest isn't inside a transaction, starting one now.", INFO);
+                       my ($r) = $begin->run($client);
+                       unless (defined $r and $r) {
+                               $rollback->run;
+                               throw OpenSRF::EX::PANIC ("Couldn't BEGIN transaction!")
+                       }
+               }
+       } catch Error with {
+               throw OpenSRF::EX::PANIC ("Ingest Couldn't BEGIN transaction!")
+       };
+
+       my @source_maps;
+       my @entry_list;
+       my @mr_list;
+       my @rd_list;
+       my @ns_list;
+       my @mads_data;
+       my $ret = 0;
+       for my $entry ( $lookup->run(@docids) ) {
+               # step -1: grab the doc from storage
+               next unless ($entry);
+
+               #if(!$mads_sheet) {
+               #       my $xslt_doc = $parser->parse_file(
+               #               OpenSRF::Utils::SettingsClient->new->config_value(dirs => 'xsl') .  "/MARC21slim2MODS.xsl");
+               #       $mads_sheet = $xslt->parse_stylesheet( $xslt_doc );
+               #}
+
+               my $xml = $entry->marc;
+               my $docid = $entry->id;
+               my $marcdoc = $parser->parse_string($xml);
+               #my $madsdoc = $mads_sheet->transform($marcdoc);
+
+               #my $mads = $madsdoc->documentElement;
+               #$mads->setNamespace( "http://www.loc.gov/mads/", "mads", 1 );
+
+               push @entry_list, $entry;
+
+               my $ldr = $marcdoc->documentElement->getChildrenByTagName('leader')->pop->textContent;
+               my $oo8 = $marcdoc->documentElement->findvalue('//*[local-name()="controlfield" and @tag="008"]');
+
+               my $rd_obj = Fieldmapper::authority::record_descriptor->new;
+               for my $rd_field ( keys %descriptor_code ) {
+                       $rd_obj->$rd_field( eval "$descriptor_code{$rd_field};" );
+               }
+               $rd_obj->record( $docid );
+               push @rd_list, $rd_obj;
+
+               # step 2: build the KOHA rows
+               my @tmp_list = _marcxml_to_full_rows( $marcdoc, 'Fieldmapper::authority::full_rec' );
+               $_->record( $docid ) for (@tmp_list);
+               push @ns_list, @tmp_list;
+
+               $ret++;
+
+               last unless ($self->api_name =~ /batch$/o);
+       }
+
+       $arm_old_rd->run( { record => \@docids } );
+       $arm_old_fr->run( { record => \@docids } );
+
+       my ($rd) = $ard_create->run(@rd_list);
+       unless (defined $rd) {
+               throw OpenSRF::EX::PANIC ("Couldn't run open-ils.storage.direct.authority.record_descriptor.batch.create!")
+       }
+
+       my ($fr) = $fr_create->run(@ns_list);
+       unless (defined $fr) {
+               throw OpenSRF::EX::PANIC ("Couldn't run open-ils.storage.direct.authority.full_rec.batch.create!")
+       }
+
+       unless ($outer_xact) {
+               $log->debug("Commiting transaction started by Ingest.", INFO);
+               my ($c) = $commit->run;
+               unless (defined $c and $c) {
+                       $rollback->run;
+                       throw OpenSRF::EX::PANIC ("Couldn't COMMIT changes!")
+               }
+       }
+
+       return $ret;
+}
+__PACKAGE__->register_method( 
+       api_name        => "open-ils.worm.authortiy.wormize",
+       method          => "wormize",
+       api_level       => 1,
+       argc            => 1,
+);
+__PACKAGE__->register_method( 
+       api_name        => "open-ils.worm.authority.wormize.batch",
+       method          => "wormize",
+       api_level       => 1,
+       argc            => 1,
+);
+
+
+# --------------------------------------------------------------------------------
+
+
+sub _marcxml_to_full_rows {
+
+       my $marcxml = shift;
+       my $type = shift || 'Fieldmapper::metabib::full_rec';
+
+       my @ns_list;
+       
+       my $root = $marcxml->documentElement;
+
+       for my $tagline ( @{$root->getChildrenByTagName("leader")} ) {
+               next unless $tagline;
+
+               my $ns = new Fieldmapper::metabib::full_rec;
+
+               $ns->tag( 'LDR' );
+               my $val = NFD($tagline->textContent);
+               $val =~ s/(\pM+)//gso;
+               $ns->value( $val );
+
+               push @ns_list, $ns;
+       }
+
+       for my $tagline ( @{$root->getChildrenByTagName("controlfield")} ) {
+               next unless $tagline;
+
+               my $ns = new Fieldmapper::metabib::full_rec;
+
+               $ns->tag( $tagline->getAttribute( "tag" ) );
+               my $val = NFD($tagline->textContent);
+               $val =~ s/(\pM+)//gso;
+               $ns->value( $val );
+
+               push @ns_list, $ns;
+       }
+
+       for my $tagline ( @{$root->getChildrenByTagName("datafield")} ) {
+               next unless $tagline;
+
+               my $tag = $tagline->getAttribute( "tag" );
+               my $ind1 = $tagline->getAttribute( "ind1" );
+               my $ind2 = $tagline->getAttribute( "ind2" );
+
+               for my $data ( $tagline->childNodes ) {
+                       next unless $data;
+
+                       my $ns = $type->new;
+
+                       $ns->tag( $tag );
+                       $ns->ind1( $ind1 );
+                       $ns->ind2( $ind2 );
+                       $ns->subfield( $data->getAttribute( "code" ) );
+                       my $val = NFD($data->textContent);
+                       $val =~ s/(\pM+)//gso;
+                       $ns->value( lc($val) );
+
+                       push @ns_list, $ns;
+               }
+       }
+       return @ns_list;
+}
+
+sub _get_field_value {
+
+       my( $root, $xpath ) = @_;
+
+       my $string = "";
+
+       # grab the set of matching nodes
+       my @nodes = $root->findnodes( $xpath );
+       for my $value (@nodes) {
+
+               # grab all children of the node
+               my @children = $value->childNodes();
+               for my $child (@children) {
+
+                       # add the childs content to the growing buffer
+                       my $content = quotemeta($child->textContent);
+                       next if ($string =~ /$content/);  # uniquify the values
+                       $string .= $child->textContent . " ";
+               }
+               if( ! @children ) {
+                       $string .= $value->textContent . " ";
+               }
+       }
+       $string = NFD($string);
+       $string =~ s/(\pM)//gso;
+       return lc($string);
+}
+
+
+sub modsdoc_to_values {
+       my( $self, $mods ) = @_;
+       my $data = {};
+       for my $class (keys %$xpathset) {
+               $data->{$class} = {};
+               for my $type (keys %{$xpathset->{$class}}) {
+                       $data->{$class}->{$type} = {};
+                       $data->{$class}->{$type}->{field_id} = $xpathset->{$class}->{$type}->{id};
+               }
+       }
+       return $data;
+}
+
+
+1;
+
+