X-Git-Url: http://git.equinoxoli.org/?p=migration-tools.git;a=blobdiff_plain;f=mig-bin%2Fmig-loadbibs;h=119a1ec3445e56fe05f05153a814b14438027412;hp=a6840dec8a8d76f8d89559d409c26ba0a6d461df;hb=4ec23f88c7f20557b13ec6f5be637e726904e114;hpb=8778d74ad0833c120f7db371376b2420c3edc6c4 diff --git a/mig-bin/mig-loadbibs b/mig-bin/mig-loadbibs index a6840de..119a1ec 100755 --- a/mig-bin/mig-loadbibs +++ b/mig-bin/mig-loadbibs @@ -39,6 +39,8 @@ use MARC::Record; use MARC::Batch; use MARC::File; use MARC::File::XML; +use MARC::Charset 'marc8_to_utf8'; +#binmode STDIN, ':bytes'; use Env qw( HOME PGHOST PGPORT PGUSER PGDATABASE MIGSCHEMA MIGBASEWORKDIR MIGBASEGITDIR MIGGITDIR MIGWORKDIR @@ -57,8 +59,10 @@ pod2usage(-verbose => 2) if defined $ARGV[0] && $ARGV[0] eq '--help'; pod2usage(-verbose => 1) if ! $ARGV[1]; my $next_arg_is_file = 0; -my $append_is_false = 1; +my $append = 0; my $next_arg_is_source = 0; +my $next_arg_is_stage = 0; +my $stage_table = 'biblio_record_entry_legacy'; my $source = 'default'; my $file_is_xml = 0; my $dbh = Mig::db_connect(); @@ -67,6 +71,9 @@ my $i = 0; my $batch; binmode STDIN, ':utf8'; +#MARC::Charset->assume_unicode(1); +MARC::Charset->ignore_errors(1); + foreach my $arg (@ARGV) { if ($arg eq '--stage_file') { $next_arg_is_file = 1; @@ -81,13 +88,22 @@ foreach my $arg (@ARGV) { $next_arg_is_source = 1; next; } - if ($next_arg_is_file) { + if ($next_arg_is_source) { $source = $arg; $next_arg_is_source = 0; next; } + if ($arg eq '--stage_table') { + $next_arg_is_stage = 1; + next; + } + if ($next_arg_is_stage) { + $stage_table = $arg; + $next_arg_is_stage = 0; + next; + } if ($arg eq '--append') { - $append_is_false = 0; + $append = 1; next; } if ($arg eq '--xml') { @@ -96,18 +112,13 @@ foreach my $arg (@ARGV) { } } -if ($append_is_false) { - $dbh->do(qq{ - DROP TABLE IF EXISTS $MIGSCHEMA.biblio_record_entry_stage; - CREATE UNLOGGED TABLE $MIGSCHEMA.biblio_record_entry_stage ( - l_bib_id TEXT, - x_source TEXT, - x_warnings TEXT, - x_migrate BOOLEAN DEFAULT TRUE - ) INHERITS ($MIGSCHEMA.biblio_record_entry); - }); -} +create_child_table($dbh); #and test to see if it exists +# normal stage table creation +if ($append == 0) { + drop_stage_table($dbh,$stage_table); + create_stage_table($dbh,$stage_table); + } if ($file_is_xml) { $batch = MARC::Batch->new('XML',$infile); } else { @@ -115,31 +126,75 @@ if ($file_is_xml) { } $batch->strict_off(); -while ( my $record = $batch->next() ) { - my $xml; - if ($file_is_xml) { $xml = $record; } - else { $xml = $record->as_xml_record(); } +my $record; +#while ( my $record = $batch->next() ) { +while ( eval {$record = $batch->next()} or do { if (!$record and !$@) { last; } else { next; }} ) { + my $xml = $record->as_xml_record(); + $xml = marc8_to_utf8($xml); $i++; $xml = clean_marc($xml); $xml = '$_$' . $xml . '$_$'; my @warnings = $batch->warnings(); my $warning_string; if (@warnings) { $warning_string = "'" . join(':',@warnings) . "'"; } else { $warning_string = "'none'"; } - my $sql = "INSERT INTO $MIGSCHEMA.biblio_record_entry_stage (marc,x_source,x_warnings) VALUES ($xml,$source,$warning_string);"; + my $sql = "INSERT INTO $MIGSCHEMA.$stage_table (marc,x_source,x_warnings) VALUES ($xml,'$source',$warning_string);"; my $sth = $dbh->prepare($sql); - $sth->execute(); + eval { $sth->execute() }; report_progress("Records staged", $i) if 0 != $i % 100; } $dbh->do(qq/ - CREATE INDEX ${MIGSCHEMA}_biblio_record_entry_stage_idx ON - $MIGSCHEMA.biblio_record_entry_stage (id); + CREATE INDEX ${MIGSCHEMA}_biblio_record_entry_legacy_idx ON + $MIGSCHEMA.biblio_record_entry_legacy (id); /); print "Finis.\n"; + +sub drop_stage_table { + my $dbh = shift; + my $stage_table = shift; + my $tablecheck = check_for_mig_table($dbh,$stage_table); + my $answer = 'null'; + if ($tablecheck == 1) { $answer = prompt('Do you want to drop $MIGSCHEMA.$stage_table? This will not remove any bibs loaded to production. y/n'); } + if ($tablecheck == 1 and $answer eq 'y') { $dbh->do("DROP TABLE IF EXISTS $MIGSCHEMA.$stage_table;"); } + if ($tablecheck == 1 and $answer ne 'y') { abort('Table not dropped, bib load aborted.'); } + return(); +} + +sub create_stage_table { + my $dbh = shift; + my $stage_table = shift; + + $dbh->do("CREATE UNLOGGED TABLE $MIGSCHEMA.$stage_table ( + l_bib_id TEXT, + x_source TEXT, + x_warnings TEXT, + x_migrate BOOLEAN DEFAULT TRUE + ) INHERITS ($MIGSCHEMA.biblio_record_entry);"); + + return(); +} + +sub create_child_table { + my $dbh = shift; + + $dbh->do("DO \$\$ + DECLARE + t BOOLEAN; + BEGIN + SELECT EXISTS(SELECT 1 FROM information_schema.tables WHERE table_schema = '$MIGSCHEMA' AND table_name = 'biblio_record_entry') INTO t; + IF t = FALSE THEN + PERFORM migration_tools.build_specific_base_staging_table ('$MIGSCHEMA','biblio.record_entry'); + END IF; + END \$\$;"); + + return (); +} + sub clean_marc { my $xml = shift; + $xml = marc8_to_utf8($xml); $xml =~ s/\n//sog; $xml =~ s/^<\?xml.+\?\s*>//go; $xml =~ s/>\s+prepare($sql); + $sth->execute(); + my @sqlresult = $sth->fetchrow_array; + my $r = pop @sqlresult; + if ($r) { return $r; } else { return 0; } +} + +sub prompt { + my ($query) = @_; + local $| = 1; + print $query; + chomp(my $answer = ); + return $answer; +} + +