=head1 VERSION
-Version 1.000
+Version 1.002
=cut
-our $VERSION = '1.000';
+our $VERSION = '1.002';
=head1 SYNOPSIS
my $self = bless { data => { recs => undef, # X::T record objects
rcnt => 0, # record counter
tcnt => 0, # tag counter
+ scnt => {}, # subfield/tag counters
samp => {}, # data samples
tags => {}, # all found tags
},
die "Argument 'marcfile' must be specified\n" unless ($args{marcfile});
if (-r $args{marcfile}) {
$self->{twig} = XML::Twig->new;
- $self->{twig}->parsefile($args{marcfile});
- my @records = $self->{twig}->root->children;
- $self->{data}{recs} = \@records;
+ $self->{conf}{marc} = $args{marcfile};
} else {
die "Can't open marc file: $!\n";
}
sub parse_records {
my ($self) = @_;
- for my $record ( @{$self->{data}{recs}} ) {
+ $self->{twig}->parsefile( $self->{conf}{marc} );
+ for my $record ( $self->{twig}->root->children ) {
my @fields = $record->children;
for my $f (@fields)
- { $self->process_field($f) }
+ { $self->process_field($f); $f->purge }
# cleanup memory and increment pointer
$record->purge;
if ($map and $map->has($tag)) {
my @subs = $field->children('subfield');
+ my $i= 0;
for my $sub (@subs)
- { $self->process_subs($tag, $sub) }
+ { $self->process_subs($tag, $sub); $sub->purge; $i++ }
+
+ # increment sub length counter
+ $self->{data}{scnt}{$tag}{$i}++;
}
}
# handle unmapped tag/subs
my $samp = $self->{data}{samp};
# set a value, total-seen count and records-seen-in count
- $samp->{$tag}{$code}{value} = $sub->text unless defined $samp->{$tag}{$code};
+ $samp->{$tag}{$code}{value} = $sub->text unless $samp->{$tag}{$code};
$samp->{$tag}{$code}{count}++;
$samp->{$tag}{$code}{tcnt}++ unless ( defined $samp->{$tag}{$code}{last} and
$samp->{$tag}{$code}{last} == $self->{data}{tcnt} );
$samp->{$tag}{$code}{last} = $self->{data}{tcnt};
- #FIXME tcnt not rcnt
}