3 ###############################################################################
6 =item B<stagebibs> --file foo.xml
8 Takes a load of bibs from a UTF-8 MARC XML file and loads them into the mig staging
9 table of biblio_record_entry. This is done with no checking of file validity,
10 so records should be checked beforehand and cleaned.
12 Takes one optional argument:
16 Sets an x_source value on the staging table to the one supplied instead of the
23 ###############################################################################
29 #binmode STDIN, ':bytes';
31 HOME PGHOST PGPORT PGUSER PGDATABASE MIGSCHEMA
32 MIGBASEWORKDIR MIGBASEGITDIR MIGGITDIR MIGWORKDIR
40 my $mig_bin = "$FindBin::Bin/";
41 use lib "$FindBin::Bin/";
44 pod2usage(-verbose => 2) if defined $ARGV[0] && $ARGV[0] eq '--help';
45 pod2usage(-verbose => 1) if ! $ARGV[1];
47 my $next_arg_is_file = 0;
49 my $next_arg_is_source = 0;
50 my $next_arg_is_stage = 0;
51 my $base_table = 'biblio_record_entry';
52 my $stage_table = 'biblio_record_entry_legacy';
53 my $source = 'default';
55 my $dbh = Mig::db_connect();
59 binmode STDIN, ':utf8';
61 foreach my $arg (@ARGV) {
62 if ($arg eq '--file') {
63 $next_arg_is_file = 1;
66 if ($next_arg_is_file) {
68 $next_arg_is_file = 0;
71 if ($arg eq '--source') {
72 $next_arg_is_source = 1;
75 if ($next_arg_is_source) {
77 $next_arg_is_source = 0;
82 my $bre_test = check_for_table($dbh,$base_table);
83 my $bre_legacy_test = check_for_table($dbh,$stage_table);
84 if ($bre_test == 0 and $bre_legacy_test == 0 ) { create_bre($dbh); create_child_bre($dbh); }
85 if ($bre_test == 1 and $bre_legacy_test == 0 ) { create_child_bre($dbh); }
87 my $xmig_test = check_for_column($dbh,$stage_table,'x_migrate');
88 if ($xmig_test == 0) { add_column($dbh,$stage_table,'x_migrate','BOOLEAN DEFAULT TRUE'); }
90 my $xsource_test = check_for_column($dbh,$stage_table,'x_source');
91 if ($xsource_test == 0) { add_column($dbh,$stage_table,'x_source','TEXT'); }
93 #flatten out MARC XML FILE
94 open my $xml, "<:encoding(utf8)", $infile or abort('could not open MARC XML file');
97 while(my $line = <$xml>) {
98 if ($line =~ /^<\/?collection/) { next; }
100 $record = $record . $line;
101 if ($line =~ /<\/record>$/) {
102 stage_record($dbh,$record,$source);
105 if (($i % 100) == 0) { report_progress('Records stage', $i); }
110 if ($i == 0) { print "No XML was processed, are you sure this is an XML file?\n"; }
113 # beyond here be functions
121 SELECT EXISTS(SELECT 1 FROM information_schema.tables WHERE table_schema = '$MIGSCHEMA' AND table_name = '$base_table') INTO t;
123 PERFORM migration_tools.build_specific_base_staging_table ('$MIGSCHEMA',REGEXP_REPLACE('$base_table','_','.'));
130 sub create_child_bre {
134 CREATE TABLE $MIGSCHEMA.$stage_table (x_migrate BOOLEAN DEFAULT TRUE, x_source TEXT) INHERITS ($MIGSCHEMA.$base_table);
142 print STDERR "$0: $msg", "\n";
146 sub report_progress {
147 my ($msg, $counter) = @_;
148 if (defined $counter) {
149 print STDERR "$msg: $counter\n";
151 print STDERR "$msg\n";
159 my $last_xact = "'$MIGSCHEMA'";
160 $record = '$_$' . $record . '$_$';
162 if ($source eq 'default') { $sql = "INSERT INTO $MIGSCHEMA.$stage_table (last_xact_id,marc) VALUES ($last_xact,$record);"; }
163 else { $sql = "INSERT INTO $MIGSCHEMA.$stage_table (last_xact_id,marc,x_source) VALUES ($last_xact,$record,'$source');"; }
164 my $sth = $dbh->prepare($sql);
169 sub check_for_table {
172 my $sql = "SELECT 1 FROM information_schema.tables WHERE table_schema = '$MIGSCHEMA' AND table_name = '$table';";
173 my $sth = $dbh->prepare($sql);
175 my @sqlresult = $sth->fetchrow_array;
176 my $r = pop @sqlresult;
177 if ($r) { return $r; } else { return 0; }
180 sub check_for_column {
184 my $sql = "SELECT 1 FROM information_schema.columns WHERE table_schema = '$MIGSCHEMA' AND table_name = '$table' AND column_name = '$column';";
185 my $sth = $dbh->prepare($sql);
187 my @sqlresult = $sth->fetchrow_array;
188 my $r = pop @sqlresult;
189 if ($r) { return $r; } else { return 0; }
196 my $column_type = shift;
197 my $sql = "ALTER TABLE $MIGSCHEMA.$table ADD COLUMN $column $column_type;";
198 my $sth = $dbh->prepare($sql);
200 my @sqlresult = $sth->fetchrow_array;
201 my $r = check_for_column($dbh,$table,$column);
202 if ($r == 0) { abort('failed to create column'); } else { return $r; }