package AnyEvent::XMPP::Parser;
# Warnings are disabled for the whole file; this is kept unchanged so that no
# new diagnostics are emitted to existing users.
no warnings;
use strict;

use AnyEvent::XMPP::Node;
# OMFG!!!111 THANK YOU FOR THIS MODULE TO HANDLE THE XMPP INSANITY:
use XML::Parser::Expat;

=head1 NAME

AnyEvent::XMPP::Parser - Parser for XML streams (helper for AnyEvent::XMPP)

=head1 SYNOPSIS

   use AnyEvent::XMPP::Parser;
   ...

=head1 DESCRIPTION

This is an XMPP XML parser helper class, which helps me to cope with the
XMPP XML.

See also L<AnyEvent::XMPP::Writer> for a discussion of the issues with XML
in XMPP.

=head1 METHODS

=over 4

=item B<new (%args)>

This creates a new AnyEvent::XMPP::Parser and calls C<init>.

Any key/value pairs passed in are stored in the object and override the
defaults for C<stanza_cb>, C<error_cb> and C<stream_cb>.

=cut

sub new {
    my $this  = shift;
    my $class = ref($this) || $this;

    # Defaults come first so that caller supplied pairs in @_ override them.
    my $self = {
        stanza_cb => sub { die "No stanza callback provided!" },
        error_cb  => sub { warn "No error callback provided: $_[0]: $_[1]!" },
        stream_cb => sub { },
        @_
    };
    bless $self, $class;

    $self->init;

    $self
}

=item B<set_stanza_cb ($cb)>

Sets the 'XML stanza' callback.

C<$cb> must be a code reference. The first argument to the callback
will be this AnyEvent::XMPP::Parser instance and the second will be the
stanza's root L<AnyEvent::XMPP::Node>.

If the second argument is undefined the end of the stream has been found.

=cut

sub set_stanza_cb {
    my ($self, $cb) = @_;
    $self->{stanza_cb} = $cb;
}

=item B<set_error_cb ($cb)>

This sets the error callback that will be called when the parser
encounters a syntax error, or when the stanza callback throws an exception.

The first argument is the exception and the second is the data which
caused the error (undefined for exceptions thrown by the stanza callback).
The third argument is the string C<'xml'> for parse errors and
C<'exception'> for exceptions thrown by the stanza callback.

=cut

sub set_error_cb {
    my ($self, $cb) = @_;
    $self->{error_cb} = $cb;
}

=item B<set_stream_cb ($cb)>

This method sets the stream tag callback. It is called when the
C<< <stream> >> tag from the server has been encountered, i.e. for the
first start tag seen while no other element is open.

The first argument to the callback is the L<AnyEvent::XMPP::Node> of the
opening stream tag.

=cut

sub set_stream_cb {
    my ($self, $cb) = @_;
    $self->{stream_cb} = $cb;
}

=item B<init>

This method (re)initializes the parser: a fresh non-blocking Expat parser
is created and the namespace cache and the stack of open nodes are reset.

=cut

sub init {
    my ($self) = @_;

    $self->{parser} = XML::Parser::ExpatNB->new (
        Namespaces       => 1,
        ProtocolEncoding => 'UTF-8'
    );

    # The handlers close over $self, so the parser refers back to this
    # object; see cleanup() for breaking that link.
    $self->{parser}->setHandlers (
        Start   => sub { $self->cb_start_tag (@_) },
        End     => sub { $self->cb_end_tag   (@_) },
        Char    => sub { $self->cb_char_data (@_) },
        Default => sub { $self->cb_default   (@_) },
    );

    $self->{nso}       = {};    # cache of generated namespace names, see nseq()
    $self->{nodestack} = [];    # currently open nodes, stream element first
}

=item B<cleanup>

This method removes all handlers and the parser from this object. Use it
to avoid circular references.

=cut

sub cleanup {
    my ($self) = @_;

    # NOTE(review): the parser is only dropped here, release() is not called
    # on it; DESTROY releases only a parser that is still stored in the object.
    for (qw(stanza_cb error_cb stream_cb parser)) {
        delete $self->{$_};
    }

    return;
}

=item B<nseq ($namespace, $tagname, $cmptag)>

This method checks whether the C<$cmptag> matches the C<$tagname>
in the C<$namespace>.

C<$cmptag> needs to come from the XML::Parser::Expat as it has
some magic attached that stores the namespace.

=cut

sub nseq {
    my ($self, $ns, $name, $tag) = @_;

    # Generate the namespace qualified name only once per ($ns, $name) pair.
    unless (exists $self->{nso}->{$ns}->{$name}) {
        $self->{nso}->{$ns}->{$name} =
            $self->{parser}->generate_ns_name ($name, $ns);
    }

    return $self->{parser}->eq_name ($self->{nso}->{$ns}->{$name}, $tag);
}

=item B<feed ($data)>

This method feeds a chunk of unparsed data to the parser.

If parsing throws an exception, the error callback is invoked with the
exception, C<$data> and the string C<'xml'>. Without an error callback a
warning is emitted instead.

=cut

sub feed {
    my ($self, $data) = @_;

    eval {
        $self->{parser}->parse_more ($data);
    };

    if ($@) {
        if ($self->{error_cb}) {
            $self->{error_cb}->($@, $data, 'xml');
        }
        else {
            warn "parser error: $@ on [$data]\n";
        }
    }
}

# Expat 'Start' handler: creates the node for the opened element, reports the
# very first element (the stream element) via stream_cb and pushes the node
# onto the stack of open nodes.
sub cb_start_tag {
    my ($self, $p, $el, %attrs) = @_;

    my $node = AnyEvent::XMPP::Node->new ($p->namespace ($el), $el, \%attrs, $self);
    $node->append_raw ($p->recognized_string);

    if (not @{$self->{nodestack}}) {
        $self->{stream_cb}->($node);
    }

    push @{$self->{nodestack}}, $node;
}

# Expat 'Char' handler: appends character data to the innermost open node.
sub cb_char_data {
    my ($self, $p, $str) = @_;

    unless (@{$self->{nodestack}}) {
        warn "characters outside of tag: [$str]!\n";
        return;
    }

    return if @{$self->{nodestack}} < 2;    # don't append anything to the stream element

    my $node = $self->{nodestack}->[-1];
    $node->add_text ($str);
    $node->append_raw ($p->recognized_string);
}

# Expat 'End' handler: closes the innermost open node. A node closed directly
# below the stream element is handed to stanza_cb; when the stream element
# itself is closed, stanza_cb is called with an undefined node.
sub cb_end_tag {
    my ($self, $p, $el) = @_;

    unless (@{$self->{nodestack}}) {
        warn "end tag read without any starting tag!\n";
        return;
    }

    # Report the name of the element that is actually open. The message used
    # to read a 'tags' field that is never set anywhere in this class.
    my $open_name = $self->{nodestack}->[-1]->name;
    if (!$p->eq_name ($open_name, $el)) {
        warn "end tag doesn't match start tags ($open_name)!\n";
        return;
    }

    my $node = pop @{$self->{nodestack}};
    $node->append_raw ($p->recognized_string);

    # > 1 because we don't want the stream tag to save all our children...
    if (@{$self->{nodestack}} > 1) {
        $self->{nodestack}->[-1]->add_node ($node);
    }

    eval {
        if (@{$self->{nodestack}} == 1) {
            $self->{stanza_cb}->($self, $node);
        }
        elsif (@{$self->{nodestack}} == 0) {
            $self->{stanza_cb}->($self, undef);
        }
    };

    if ($@) {
        # cleanup() may have removed the error callback in the meantime, so
        # fall back to a warning exactly like feed() does.
        if ($self->{error_cb}) {
            $self->{error_cb}->($@, undef, 'exception');
        }
        else {
            warn "stanza callback error: $@\n";
        }
    }
}

# Expat 'Default' handler: keeps the raw text of everything not covered by the
# other handlers on the innermost open node.
sub cb_default {
    my ($self, $p, $str) = @_;

    $self->{nodestack}->[-1]->append_raw ($str)
        if @{$self->{nodestack}} > 1;    # don't append to the stream element
}

=back

=head1 AUTHOR

Robin Redeker, C<< >>, JID: C<< >>

=head1 COPYRIGHT & LICENSE

Copyright 2007, 2008 Robin Redeker, all rights reserved.

This program is free software; you can redistribute it and/or modify it
under the same terms as Perl itself.

=cut

# Releases the Expat parser if this object still holds one.
sub DESTROY {
    my ($self) = @_;
    $self->{parser}->release if defined($self->{parser});
}

1; # End of AnyEvent::XMPP::Parser