3 ###############################################################################
6 =item B<stagebibs> --file foo.xml
8 Takes a load of bibs from a UTF-8 MARC XML file and loads them into mig staging
9 table of biblio_record_entry. This is done with no checking of file validity,
10 so records should be checked and cleaned beforehand.
12 Takes optional arguments:
16 Sets an x_source value on the staging table to the one supplied instead of the
23 ###############################################################################
29 #binmode STDIN, ':bytes';
31 HOME PGHOST PGPORT PGUSER PGDATABASE MIGSCHEMA
32 MIGBASEWORKDIR MIGBASEGITDIR MIGGITDIR MIGWORKDIR
40 my $mig_bin = "$FindBin::Bin/";
41 use lib "$FindBin::Bin/";
44 pod2usage(-verbose => 2) if defined $ARGV[0] && $ARGV[0] eq '--help';
45 pod2usage(-verbose => 1) if ! $ARGV[1];
47 my $next_arg_is_file = 0;
49 my $next_arg_is_source = 0;
50 my $next_arg_is_stage = 0;
51 my $next_arg_is_base_table = 0;
52 my $next_arg_is_stage_table = 0;
53 my $base_table = 'biblio_record_entry';
54 my $stage_table = 'biblio_record_entry_legacy';
55 my $source = 'default';
57 my $dbh = Mig::db_connect();
61 binmode STDIN, ':utf8';
63 foreach my $arg (@ARGV) {
64 if ($arg eq '--file') {
65 $next_arg_is_file = 1;
68 if ($next_arg_is_file) {
70 $next_arg_is_file = 0;
73 if ($arg eq '--source') {
74 $next_arg_is_source = 1;
77 if ($next_arg_is_source) {
79 $next_arg_is_source = 0;
82 if ($arg eq '--base-table') {
83 $next_arg_is_base_table = 1;
86 if ($next_arg_is_base_table) {
88 $next_arg_is_base_table = 0;
91 if ($arg eq '--stage-table') {
92 $next_arg_is_stage_table = 1;
95 if ($next_arg_is_stage_table) {
97 $next_arg_is_stage_table = 0;
102 my $bre_test = check_for_table($dbh,$base_table);
103 my $bre_legacy_test = check_for_table($dbh,$stage_table);
104 if ($bre_test == 0 and $bre_legacy_test == 0 ) { create_bre($dbh); create_child_bre($dbh); }
105 if ($bre_test == 1 and $bre_legacy_test == 0 ) { create_child_bre($dbh); }
107 my $xmig_test = check_for_column($dbh,$stage_table,'x_migrate');
108 if ($xmig_test == 0) { add_column($dbh,$stage_table,'x_migrate','BOOLEAN DEFAULT TRUE'); }
110 my $xsource_test = check_for_column($dbh,$stage_table,'x_source');
111 if ($xsource_test == 0) { add_column($dbh,$stage_table,'x_source','TEXT'); }
113 #flatten out MARC XML FILE
114 open my $xml, "<:encoding(utf8)", $infile or abort('could not open MARC XML file');
117 while(my $line = <$xml>) {
118 if ($line =~ /^<\/?collection/) { next; }
120 $record = $record . $line;
121 if ($line =~ /<\/record>$/) {
122 stage_record($dbh,$record,$source);
125 if (($i % 100) == 0) { report_progress('Records stage', $i); }
130 if ($i == 0) { print "No XML was processed, are you sure this is an XML file?\n"; }
133 # beyond here be functions
141 SELECT EXISTS(SELECT 1 FROM information_schema.tables WHERE table_schema = '$MIGSCHEMA' AND table_name = '$base_table') INTO t;
143 PERFORM migration_tools.build_specific_base_staging_table ('$MIGSCHEMA',REGEXP_REPLACE('$base_table','_','.'));
150 sub create_child_bre {
154 CREATE TABLE $MIGSCHEMA.$stage_table (x_migrate BOOLEAN DEFAULT TRUE, x_source TEXT) INHERITS ($MIGSCHEMA.$base_table);
162 print STDERR "$0: $msg", "\n";
166 sub report_progress {
167 my ($msg, $counter) = @_;
168 if (defined $counter) {
169 print STDERR "$msg: $counter\n";
171 print STDERR "$msg\n";
179 my $last_xact = "'$MIGSCHEMA'";
180 $record = '$_$' . $record . '$_$';
182 if ($source eq 'default') { $sql = "INSERT INTO $MIGSCHEMA.$stage_table (last_xact_id,marc) VALUES ($last_xact,$record);"; }
183 else { $sql = "INSERT INTO $MIGSCHEMA.$stage_table (last_xact_id,marc,x_source) VALUES ($last_xact,$record,'$source');"; }
184 my $sth = $dbh->prepare($sql);
189 sub check_for_table {
192 my $sql = "SELECT 1 FROM information_schema.tables WHERE table_schema = '$MIGSCHEMA' AND table_name = '$table';";
193 my $sth = $dbh->prepare($sql);
195 my @sqlresult = $sth->fetchrow_array;
196 my $r = pop @sqlresult;
197 if ($r) { return $r; } else { return 0; }
200 sub check_for_column {
204 my $sql = "SELECT 1 FROM information_schema.columns WHERE table_schema = '$MIGSCHEMA' AND table_name = '$table' AND column_name = '$column';";
205 my $sth = $dbh->prepare($sql);
207 my @sqlresult = $sth->fetchrow_array;
208 my $r = pop @sqlresult;
209 if ($r) { return $r; } else { return 0; }
216 my $column_type = shift;
217 my $sql = "ALTER TABLE $MIGSCHEMA.$table ADD COLUMN $column $column_type;";
218 my $sth = $dbh->prepare($sql);
220 my @sqlresult = $sth->fetchrow_array;
221 my $r = check_for_column($dbh,$table,$column);
222 if ($r == 0) { abort('failed to create column'); } else { return $r; }