=head1 VERSION
-Version 1.000
+Version 1.005
=cut
-our $VERSION = '1.000';
+our $VERSION = '1.005';
=head1 SYNOPSIS
that set.
use Equinox::Migration::SubfieldMapper;
-
- my $stl = Equinox::Migration::SubfieldMapper->new( file => ".txt" );
- my $tags = $stl->as_hashref;
+ ...
-or
-
- my $stl = Equinox::Migration::SubfieldMapper->new( file => ".txt" );
- if ( $stl->has($foo) ) {
- # if $foo is an element of $stl's parsed list
- # do stuff ...
- }
-
-
-=head1 ROUTINES
+=head1 METHODS
=head2 new
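Takes two optional arguments, C<file> and C<mods>. If C<file> is
specified, the tag list will be populated as per that file on
instantiation. If C<mods> is given it must be an arrayref of the
modifier names that mappings are allowed to use.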
-Returns a E::M::STL object.
+Returns an E::M::SM object.
=cut
sub new {
my ($class, %args) = @_;
- my $self = bless { conf => { mods => { multi => 1, bib => 1, req => 1, bibreq => 1 } },
+ my $self = bless { conf => { mods => undef },
fields => {},
tags => {} }, $class;
+ if ($args{mods}) {
+ die "Argument 'mods' is wrong type\n"
+ unless (ref $args{mods} eq "ARRAY");
+ for my $mod ( @{$args{mods}} )
+ { $self->{conf}{mods}{$mod} = 1 }
+ }
+
if ($args{file}) {
if (-r $args{file}) {
$self->{conf}{file} = $args{file};
=head2 has
-Ask it whether you mapping has various things, and it'll let you know.
+Ask it whether your mapping has various things, and it'll let you know.
$sm->has('fieldname') # is this fieldname mapped?
$sm->has(901) # are there any mappings for this tag?
}
}
+=head2 tags
+
+Returns an arrayref containing the tags defined in the map.
+
+ my $tags = $sfm->tags;
+ for my $tag ( @{$tags} ) {
+ my $subs = $sfm->subfields($tag);
+ ...
+ }
+
+=cut
+
+sub tags {
+    my $self = shift;
+    # The tags are the top-level keys of the tag => subfield => fieldname
+    # index; a fresh arrayref is handed back on every call.
+    my @mapped_tags = keys %{ $self->{tags} };
+    return \@mapped_tags;
+}
+
+=head2 subfields
+
+Given a tag, return an arrayref of the subfields mapped with that tag.
+
+ my $tags = $sfm->tags;
+ for my $tag ( @{$tags} ) {
+ my $subs = $sfm->subfields($tag);
+ ...
+ }
+
+Returns C<undef> if C<tag> is not mapped.
+
+=cut
+
+sub subfields {
+    my ($self, $tag) = @_;
+    return undef unless $self->has($tag);
+    # has() is documented to answer for fieldnames as well as tags.  Only
+    # dereference a tag that is really present in the index: keys() on a
+    # missing entry would autovivify an empty one, which tags() would then
+    # report as a mapped tag.
+    return undef unless exists $self->{tags}{$tag};
+    return [ keys %{ $self->{tags}{$tag} } ];
+}
+
+
=head2 field
Given a tag and subfield code,
return $self->{tags}{$tag}{$sub};
}
-=head2 mod
+=head2 mods
-Returns the modifier set on a mapping.
+With no argument, returns a hashref containing all modifiers for the entire map:
- if ($sm->mod('field) eq "bib")
+ {
+ modifier => {
+ tag => [ list_of subs ],
+ ...
+ },
+ ...
+ }
-If there is no modifier, C<0> will be returned. At the moment, the
-valid mappings are
+Given a fieldname, returns a hashref of the modifiers set on that mapping.
- * multi - This field is expected to be seen multiple times per
- datafield
+ $self->mods('fieldname')
- * bib - This is a bib-level field, and is expected to be seen only
- once per record (normal is once per datafield)
+Returns undef if nothing is defined.
- * req - This field is required to occur before output
+=cut
- * bibreq - Both 'bib' and 'req'
+sub mods {
+    my ($self, $field) = @_;
+    # No argument: hand back the map-wide modifier index built up by add().
+    return $self->{allmods} unless defined $field;
+    return undef unless $self->has($field);
+    # has() is documented to answer for tags too, so make sure there really
+    # is a fields entry before reaching into it; otherwise the lookup below
+    # would autovivify a bogus entry and dereference undef as a hash.
+    return undef unless exists $self->{fields}{$field};
+    my $mods = $self->{fields}{$field}{mods};
+    # an empty modifier hash counts as "nothing defined"
+    return undef unless (ref $mods eq 'HASH' and %{$mods});
+    return $mods;
+}
+
+=head2 filters
+
+Returns the content filters set on a mapping
+
+ $self->filters('fieldname')
+
+If there are no filters, C<undef> will be returned. Else a listref
+will be returned.
+
+=cut
+
+sub filters {
+    my ($self, $field) = @_;
+    return undef unless $self->has($field);
+    # has() is documented to answer for tags too; do not autovivify a
+    # fields entry for something that is not a mapped fieldname.
+    return undef unless exists $self->{fields}{$field};
+    my $filt = $self->{fields}{$field}{filt};
+    # add() always stores an arrayref, and an arrayref is true even when it
+    # is empty, so test the contents to honour "undef if there are no filters".
+    return undef unless (ref $filt eq 'ARRAY' and @{$filt});
+    return $filt;
+}
+
+=head2 sep
+
+Returns the separator string set on a mapping. Used only
+if concatenating.
=cut
-sub mod {
+sub sep {    # accessor: separator string recorded for the mapping named $field
my ($self, $field) = @_;
return undef unless $self->has($field);
- return $self->{fields}{$field}{mod};
+ return $self->{fields}{$field}{sep};    # the 'sep' value add() stored for this field
}
+=head1 MAP CONSTRUCTION METHODS
+
+These methods are not generally accessed from user code.
+
=head2 generate
Generate initial mapping from file.
chomp;
my @tokens = split /\s+/;
- if (defined $tokens[3]) {
- $self->add( field => $tokens[0], tag => $tokens[1],
- sub => $tokens[2], mod => $tokens[3] );
- } else {
- $self->add( field => $tokens[0], tag => $tokens[1], sub => $tokens[2] );
+ my $map = { mods => [], filt => [], sep => ' ' };
+ $map->{field} = shift @tokens;
+ $map->{tag} = shift @tokens;
+ while (defined (my $tok = shift @tokens)) {
+ last if ($tok =~ m/^#/);
+ if ($tok =~ m/^[a-z]:'/ and $tok !~ /^'$/) {
+ $tok .= ' ' . shift @tokens
+ until ($tokens[0] =~ m/'$/);
+ $tok .= ' ' . shift @tokens;
+ $tok =~ s/'//;
+ $tok =~ s/'$//;
+ }
+ if ($tok =~ m/^m:/)
+ { push @{$map->{mods}}, $tok }
+ elsif ($tok =~ m/^f:/)
+ { push @{$map->{filt}}, $tok }
+ elsif ($tok =~ m/^[a-z0-9]$/)
+ { $map->{sub} = $tok }
+ elsif ($tok =~ /^c:(.*)$/)
+ { $map->{sep} = $1 }
+ else
+ { die "Unknown chunk '$tok' at line $.\n" }
}
+ $self->add($map);
}
-
}
=head2 add
Add new item to mapping. Not usually called directly from user code.
- $sm->add( field => 'value', tag => num, sub => 'c' );
- $sm->add( field => 'value', tag => num,
- sub => 'c', mod => 'modifier' );
+ $sm->add( $map );
+
+Where C<$map> is a hashref that, at a minimum, looks like
+
+ { field => "value", tag => NNN, sub => X }
+
+and may also have the key/value pairs
+
+ mods => [ ITEMS ]
+ filt => [ ITEMS ]
=cut
sub add {
- my ($self, %toks) = @_;
+    my ($self, $map) = @_;
+
+    # Trim the mods and filters.  The "m:" / "f:" prefix is stripped BEFORE
+    # the duplicate check: the seen-sets are keyed by the stripped name, so
+    # testing the prefixed token could never detect a repeat.  Each token is
+    # copied first so the caller's arrays are not modified through the
+    # foreach alias.
+    my $mods = {};
+    my $filt = []; my %filt = ();
+    for my $raw (@{ $map->{mods} || [] }) {
+        (my $m = $raw) =~ s/^m://;
+        die "Modifier collision '$raw' at line $." if $mods->{$m};
+        $mods->{$m} = 1;
+    }
+    for my $raw (@{ $map->{filt} || [] }) {
+        (my $f = $raw) =~ s/^f://;
+        die "Filter collision '$raw' at line $." if $filt{$f};
+        push @{$filt}, $f; $filt{$f} = 1;
+    }
+    # validate() reads the modifiers as a hash, so swap the trimmed forms in
+    $map->{mods} = $mods;
+    $map->{filt} = $filt;
# check bits for validity
- $self->validate(\%toks);
-
- $toks{mod} = (defined $toks{mod} and $toks{mod} !~ /^#/) ? $toks{mod} : 0;
-
- $self->{fields}{$toks{field}} = { tag => $toks{tag}, sub => $toks{sub}, mod => $toks{mod}};
- $self->{tags}{$toks{tag}}{$toks{sub}} = $toks{field};
+    $self->validate($map);
+
+    # Only now that the entry is known to be valid, record its modifiers in
+    # the map-wide index (modifier => tag => [ subs ]) returned by mods().
+    for my $m (keys %{$mods}) {
+        push @{$self->{allmods}{$m}{ $map->{tag} }}, $map->{sub};
+    }
+
+    # add data to the fields hash
+    $self->{fields}{ $map->{field} } = { tag  => $map->{tag},
+                                         sub  => $map->{sub},
+                                         mods => $map->{mods},
+                                         filt => $map->{filt},
+                                         sep  => $map->{sep},
+                                       };
+    # and to the tags hash
+    $self->{tags}{ $map->{tag} }{ $map->{sub} } = $map->{field};
}
=head2 validate
* tag must be between 0 and 999
* subfield code must be a single alphanumeric character
* tag+subfield can only be mapped once
+ * if a list of allowable mod values was given in the call to
+ C<new>, any modifiers must be on that list
=cut
sub validate {
- my ($self, $toks) = @_;
+    # Checks one mapping (hashref with field/tag/sub and a 'mods' hash)
+    # against the rules listed in the POD above and dies on the first rule
+    # that is broken.  Most messages name the current input line ($.).
+    my ($self, $map) = @_;
$.= 1 unless defined $.;
die "Required field missing (line $.)\n"
- unless (defined $toks->{field} and defined $toks->{tag} and defined $toks->{sub});
+    unless (defined $map->{field} and defined $map->{tag} and defined $map->{sub});
die "Fieldnames must start with letter (line $.)\n"
- unless ($toks->{field} =~ /^[a-zA-z]/);
+    # the range has to be A-Z: "A-z" also spans [ \ ] ^ _ and the backtick
+    unless ($map->{field} =~ /^[a-zA-Z]/);
die "Invalid tag (line $.)\n"
- if ($toks->{tag} =~ /[^\d\-]/ or $toks->{tag} < 0 or $toks->{tag} > 999);
+    # digits only, so that strings such as "1-2" or "-" cannot slip through
+    # the numeric range test
+    if ($map->{tag} !~ /\A\d+\z/ or $map->{tag} > 999);
die "Invalid subfield code (line $.)\n"
- if (length $toks->{sub} != 1 or $toks->{sub} =~ /[^a-zA-Z0-9]/);
+    if (length $map->{sub} != 1 or $map->{sub} =~ /[^a-zA-Z0-9]/);
- # the next thing (if it exists), must be a comment or valid modifier
- if (defined $toks->{mod}) {
- die "Unknown chunk (line $.)\n"
- unless (defined $self->{conf}{mods}{$toks->{mod}} or $toks->{mod} =~ /^#/);
+    # test mod names if we have a set to check against
+    if (defined $self->{conf}{mods}) {
+        for my $mod ( keys %{$map->{mods}} ) {
+            die "Modifier '$mod' not allowed\n"
+                unless $self->{conf}{mods}{$mod};
+        }
}
die "Fieldnames must be unique (line $.)\n"
- if (defined $self->{fields}{$toks->{field}});
+    if (defined $self->{fields}{$map->{field}});
+
+    die "Subfields cannot be mapped twice (line $.)\n"
+        if (defined $self->{tags}{$map->{tag}}{$map->{sub}});
- die "Subfields cannot be multimapped (line $.)\n"
- if (defined $self->{tags}{$toks->{tag}}{$toks->{sub}});
}