# $Id: NSNormalise.pm,v 1.5 2002/10/11 02:01:43 grantm Exp $
package XML::Filter::NSNormalise;
use strict;
use warnings;
use Carp;
use XML::SAX::Base;
use vars qw($VERSION @ISA);
$VERSION = '0.04';
@ISA = qw(XML::SAX::Base);
##############################################################################
# Constructor: new()
#
# Validate mappings and delegate to base class constructor.
#
sub new {
my $class = shift;
my %args = @_;
if(!$args{Map} or !ref($args{Map}) or !%{$args{Map}}) {
croak "No 'Map' option in call to XML::Filter::NSNormalise->new()";
}
my %revmap;
while(my($uri, $prefix) = each %{$args{Map}} ) {
if($revmap{$prefix} and $revmap{$prefix} ne $uri) {
croak "Multiple URIs mapped to prefix '$prefix'"
}
$revmap{$prefix} = $uri;
}
$class->SUPER::new(@_, ReverseMap => \%revmap);
}
##############################################################################
# Method: start_prefix_mapping()
# Method: end_prefix_mapping()
#
# Intercept any namespace prefix events for which we have a mapping and
# normalise the 'Prefix'.
#
sub start_prefix_mapping {
my $self = shift;
my $event = shift;
if($self->{Map}->{$event->{NamespaceURI}}) {
$event = { %$event };
$event->{Prefix} = $self->{Map}->{$event->{NamespaceURI}};
}
$self->SUPER::start_prefix_mapping($event);
}
sub end_prefix_mapping {
my $self = shift;
my $event = shift;
if($self->{Map}->{$event->{NamespaceURI}}) {
$event = { %$event };
$event->{Prefix} = $self->{Map}->{$event->{NamespaceURI}};
}
$self->SUPER::end_prefix_mapping($event);
}
##############################################################################
# Method: start_element()
# Method: end_element()
#
# - Fix the 'Prefix' and 'Name' data for elements in a mapped namespace
# - Fix the 'LocalName' and 'Name' data for namespace declaration attributes
# - Fix the 'Prefix' and 'Name' data for attributes in a mapped namespace
#
sub start_element {
my $self = shift;
my $event = shift;
$event = { %$event }; # make a (shallow) copy of the event data
my %new_attr;
if($self->{Map}->{$event->{NamespaceURI}}) {
$event->{Prefix} = $self->{Map}->{$event->{NamespaceURI}};
$event->{Name} = "$event->{Prefix}:$event->{LocalName}";
}
foreach my $key (keys %{$event->{Attributes}}) {
my $attr = $event->{Attributes}->{$key};
if($attr->{Prefix} eq 'xmlns') {
if($self->{ReverseMap}->{$attr->{LocalName}}) {
if($attr->{Value} ne $self->{ReverseMap}->{$attr->{LocalName}}) {
die "Cannot map '$self->{ReverseMap}->{$attr->{LocalName}}' to " .
"'$attr->{LocalName}' - prefix already occurs in document";
}
}
if($self->{Map}->{$attr->{Value}}) {
$attr = { %$attr };
$attr->{LocalName} = $self->{Map}->{$attr->{Value}};
$attr->{Name} = "xmlns:$attr->{LocalName}";
$new_attr{"{http://www.w3.org/2000/xmlns/}$attr->{LocalName}"} = $attr;
}
else {
$new_attr{$key} = $attr;
}
}
elsif($self->{Map}->{$attr->{NamespaceURI}}) {
$attr = { %$attr };
$attr->{Prefix} = $self->{Map}->{$attr->{NamespaceURI}};
$attr->{Name} = "$attr->{Prefix}:$attr->{LocalName}";
my $new_key = "{$attr->{NamespaceURI}}$attr->{LocalName}";
$new_attr{$new_key} = $attr;
delete($event->{Attributes}->{$key});
}
else {
$new_attr{$key} = $attr;
}
}
$event->{Attributes} = \%new_attr;
$self->SUPER::start_element($event);
}
sub end_element {
my $self = shift;
my $event = shift;
if($self->{Map}->{$event->{NamespaceURI}}) {
$event = { %$event };
$event->{Prefix} = $self->{Map}->{$event->{NamespaceURI}};
$event->{Name} = "$event->{Prefix}:$event->{LocalName}";
}
$self->SUPER::end_element($event);
}
1;
__END__
=head1 NAME
XML::Filter::NSNormalise - SAX filter to normalise namespace prefixes
=head1 SYNOPSIS
use XML::SAX::Machines qw( :all );
use XML::Filter::NSNormalise;
my $p = Pipeline(
XML::Filter::NSNormalise->new(
Map => {
'http://purl.org/dc/elements/1.1/' => 'dc',
'http://purl.org/rss/1.0/modules/syndication/' => 'syn'
}
)
=> \*STDOUT
);
$p->parse_uri($filename);
=head1 DESCRIPTION
This SAX (version 2) filter can be used to transform documents to ensure the
prefixes associated with namespaces are used consistently.
For example, feeding this document...
2002-10-08
... through this filter ...
XML::Filter::NSNormalise->new(
Map => {
'http://purl.org/dc/elements/1.1/' => 'dc'
}
)
... would produce this output ...
2002-10-08
You can specify more than one namespace URI to prefix mapping, eg:
XML::Filter::NSNormalise->new(
Map => {
'http://purl.org/dc/elements/1.1/' => 'dc',
'http://www.w3.org/1999/02/22-rdf-syntax-ns#' => 'rdf',
'http://purl.org/rss/1.0/modules/syndication/' => 'syn'
}
)
=head1 METHODS
=head2 new()
The constructor expects a list of options as Key => Value pairs.
The 'Map' option must be specified and must be set to a hashref. Each key of
the hashref is a namespace URI and each value is the corresponding namespace
prefix you want in the output document. Any namespaces which occur in the
document but do not occur in the Map hash, will be passed through unaltered.
All other options are passed to the default constructor in L.
=head1 ERROR HANDLING
Attempting to map more than one URI to the same prefix will cause a fatal
exception, eg:
XML::Filter::NSNormalise->new(
Map => {
'http://x.com/ => 'z',
'http://y.com/ => 'z'
}
)
Attempting to map a URI to a prefix that is already mapped to a different URI
will cause a fatal exception (eg: you map a URI to the prefix 'foo' but the
document your are filtering already uses 'foo' for a different URI).
=head1 SEE ALSO
L, L, L.
=head1 COPYRIGHT
Copyright 2002 Grant McLean Egrantm@cpan.orgE
This library is free software; you can redistribute it and/or modify it
under the same terms as Perl itself.
=cut