package HTML::TrackerLink; # HTML::TrackerLink is a package for automatically finding tracker references # in the form of 'Keyword 12345' or '#12345', and converting them into links into # the external tracking system. # See POD below for more details use 5.006; use strict; use vars qw{$VERSION $errstr}; BEGIN { $VERSION = '1.03'; $errstr = ''; } ##################################################################### # Constructor and Accessors sub new { my $class = shift; # Create our object my $self = bless { keywords => {}, }, $class; return $self unless @_; # Handle arguments if ( @_ == 1 ) { # Should be a tracker URL for the default search my $url = shift; return undef unless $self->_check_url( $url ); # Set the default search $self->{default} = $url; } elsif ( @_ == 2 ) { # Should be a single keyword/url pair my ($keyword, $url) = @_; return undef unless $self->_check_keyword( $keyword ); return undef unless $self->_check_url( $url ); # Set the keyword $self->{keywords}->{lc $keyword} = $url; # Set the default search to be the same $self->{default_keyword} = $keyword; } elsif ( scalar(@_) % 2 == 0 ) { # Multiple keyword/url pairs my %keywords = @_; foreach my $keyword ( sort keys %keywords ) { my $url = $keywords{$keyword}; unless ( $self->_check_keyword( $keyword ) ) { return $self->_error( "Invalid keyword '$keyword': " . $self->errstr ); } unless ( $self->_check_url( $url ) ) { return $self->_error( "Bad URL for keyword '$keyword': " . $self->errstr ); } # Set the keyword $self->{keywords}->{$keyword} = $url; } } else { return $self->_error( 'Arguments must be in keyword/url pairs' ); } $self; } # Return the currently defined keywords sub keywords { if ( wantarray ) { return sort keys %{ $_[0]->{keywords} }; } else { return scalar keys %{ $_[0]->{keywords} }; } } ##################################################################### # Main Methods # Get or set a keyword search sub keyword { my $self = shift; my $keyword = $self->_check_keyword($_[0]) ? lc shift : return undef; return $self->{keywords}->{$keyword} unless @_; # Set the tracker URL my $url = $self->_check_url($_[0]) ? shift : return undef; $self->{keywords}->{$keyword} = $url; } # Get the current default search sub default { my $self = shift; return $self->{default_keyword} ? $self->{keywords}->{ $self->{default_keyword} } : $self->{default} unless @_; # Try to set the default search my $url = $self->_check_url($_[0]) ? shift : return undef; # In case they are using a keyword, remove it delete $self->{default_keyword}; $self->{default} = $url; } # Make the default search the same as a particular keyword sub default_keyword { my $self = shift; my $keyword = $self->_check_keyword($_[0]) ? lc shift : return undef; # Does the keyword exist? unless ( exists $self->{keywords}->{$keyword} ) { return $self->_error( "The keyword '$keyword' does not exist" ); } # In case they are using an explicit default search, remove it delete $self->{default}; $self->{default_keyword} = $keyword; } # Process and return a string sub process { my $self = shift; my $text = (@_ and defined $_[0]) ? shift : return $self->_error( 'You did not provide a string to process' ); # Prepare the transforms my @replace = (); if ( $self->keywords ) { my $any_keyword = '(?:' . join('|', $self->keywords) .')'; push @replace, [ qr/\b($any_keyword)\s+\#?(\d+)/is, sub { $self->_replace( $self->{keywords}->{lc $_[3]}, $_[2], $_[4], ) }, ]; } if ( $self->default ) { push @replace, [ qr/\#(\d+)/s, sub { $self->_replace( $self->default, $_[2], $_[3], ) }, ]; } # Hand off to the main substitution method return $self->_subst( $text, @replace ); } # Implement the parallel substitution sub _subst { my $self = shift; my $input = shift; # Map the match regex to capture everything BEFORE the match, # and the entire pattern provided. # (We'll provide them as the first params) my @try = map { [ qr/\G(.*?)($_->[0])/s => $_->[1] ] } @_; unless ( @try ) { # Handle the pathological no-replace case return $input; } # Start the main loop my $position = 0; my $len = length $input; my $output = ''; while ( $position < $len ) { my $found = undef; my @start = (); my @end = (); foreach my $r ( @try ) { # Skip if it is not in the string pos $input = $position; next unless $input =~ $r->[0]; # Skip if it DOESN'T match earlier if ( $found and $start[2] <= $-[2] ) { next; } # This is the best option. # Save the matching regex $found = $r->[1]; @start = @-; @end = @+; } # Break out if no more matches last unless $found; # Append the pre-match string to the output $output .= substr( $input, $start[1], $end[1] - $start[1] ); # Pass the rest to the transform function my $rv = $found->( map { substr( $input, $start[$_], $end[$_] - $start[$_] ) } 0 .. $#end ); unless ( defined $rv ) { # Transform is signaling an error return undef; } # Transform completed ok $output .= $rv; # Move the match position for the next iteration $position = $end[2]; } # Append the remainder of the string return $output . substr( $input, $position ); } # Return any error message sub errstr { $errstr } ##################################################################### # Support Methods sub _check_keyword { my $self = shift; my $kw = shift or return $self->_error( 'You did not provide a keyword' ); return $self->_error( 'Keyword contains non-word characters' ) if $kw =~ /\W/; return $self->_error( 'Keyword cannot start with a number' ) if $kw =~ /^\d/; return 1; } sub _check_url { my $self = shift; my $url = shift or return $self->_error( 'You did not provide a tracker URL' ); unless ( $url =~ m!^https?://[\w.]+/! ) { return $self->_error( 'The tracker URL format appears to be invalid' ); } unless ( $url =~ /\%n/ ) { return $self->_error( 'The tracker URL does not contain a %n placeholder' ); } return 1; } # Generates the link in the replacer sub _replace { my ($self, $url, $text, $id) = @_; # Create the link $url =~ s/\%n/$id/g; return "$text"; } sub _error { $errstr = $_[1]; undef } 1; __END__ =pod =head1 NAME HTML::TrackerLink - Autogenerates links to Bug/Tracker systems =head1 SYNOPSIS # Create a linker for only #12345 for a single tracker system my $linker = HTML::TrackerLink->new( 'http://host/path?id=%n' ); # Create a linker for a single named ( 'Bug #12345' ) system $linker = HTML::TrackerLink->new( 'bug', 'http://host/path?id=%n' ); # Create a linker for multiple named systems $linker = HTML::TrackerLink->new( 'bug' => 'http://host1/path?id=%n', 'tracker' => 'http://host2/path?id=%n', ); # For the multiple linker, make it default to an arbitrary system $linker->default( 'http://host/path?id=%n' ); # For the multiple linker, make it default to one of the keywords $linker->default_keyword( 'bug' ); # Process a string, and add links my $string = 'Fix for bug 1234, described in client request CT #1234'; $string = $linker->process( $string ); =head1 DESCRIPTION HTML::TrackerLink is a package for automatically generating links to one or more external systems from references found in ordinary text, such as CVS commit messages. It tries to do this as intelligently and as flexibly as possible. =head2 Tracker URL Format Most tracking systems ( bugs, client requests etc, henceforth known as a 'Tracker' ) use a numeric ID number as a key for the tracker item. Web interfaces to these systems will generally contain a URL like the following. Mozilla Bugzilla 100,000th Bug Example URL http://bugzilla.mozilla.org/show_bug.cgi?id=100000 HTML::TrackerLink takes as arguments a generic form of this URL, created by replacing the number of the tracker item, with the symbol '%n'. For the previous example. HTML::TrackerLink URL for Mozilla Bugzilla http://bugzilla.mozilla.org/show_bug.cgi?id=%n When HTML::TrackerLink find a valid reference while processing, it will replace the %n with the id it finds, and replace the reference in the source string with a resulting link. Any tracker URL arguments passed to HTML::TrackerLink will be checked to make sure that they actually contain the %n placeholder. =head2 Default Tracker and Keyworded Trackers HTML::TrackerLink does two types of searches in the source text, a 'default' search, and 'keyword' searches. A default search will look B for a number with a preceding hash, like '#12345'. Note that the default search will NOT match with naked numbers, such as '12345'. A keyword search is a little more flexible. For a 'bug' keyword search, the following would all be valid, and matched against. bug 12345 # Simplest form Bug 12345 # Case insensitive BuG 12345 # Case insensitive and allows multiple spaces bug #12345 # Normal hashed number form Bug #12345 # Again, case insensitive The keyword search would B match with the following bug12345 # Must be seperated by whitespace bug#12345 # Even in this case bigbug 12345 # 'bug' must be a seperate word All of these searches are performed condurrently, meaning that given both a default search, and a C<'bug'> keyword search, the following would match the way you would expect it to. Client issue #435 ( Bug #1532 ) fixed The C<'Bug #1532'> would link to your bug tracking system, and the C<'#435'> would link to your client feedback tracking system, which is the default. =head2 Keyword Format The keyword can be up to 32 characters long, containing only word characters, and cannot start with a number. Irrelevant of the case passed, the keywords are stored internally in lowercase. As such, you cannot have two seperate keyword searchs for C<'bug'>, and C<'BUG'>. =head1 METHODS =head2 new The C constructor takes a variety of arguments and returns a new HTML::TrackerLink processing object. Arguments to C are accepted in one of the following formats. =over 4 =item new A empty HTML::LinkTracker object is created without any trackers set =item new $tracker_url If a single argument is passed, the argument is assume be the tracker URL for a the default search. =item new $keyword => $tracker_url If two arguments are passed, they are assumed to be a single keyword search. In the case where the HTML::TrackerLink object is created with only one keyword, the default search will ALSO be set to the same tracker, so that in systems with only one possible place to link to, people that forget the keyword will still get their references linked to. It also catches a cases where there is a message like C<'This resolves Bug #12, #13, #14 and #15'>. =item new $keyword1 => $tracker_url1, $keyword2 => $tracker_url2 [, ...] If more than two arguments are passed, they are assumed to be a set of keyword searches. In this case, the default search will NOT be set, as we cannot be sure I case the default should go to. To assign the default in this case, you should use the C or C methods. =back In all cases, the C method will returns a new HTML::TrackerLink object on success, or C if an error has occured. ( Invalid keyword/URL formats etc ). =head2 keywords Returns a list containing all current defined keywords =head2 keyword $keyword [, $tracker_url ] If passed a single argument, returns the current URL for the keyword, or C if the keyword does not exist. If passed two arguments, it will add a new keyword search, or replace an existing one, returning true on success, or C if the keyword or tracker URL are invalid. =head2 default [ $tracker_url ] If passed, explicitly sets the tracker URL to be used for the default search. Returns the default search URL Returns C if attempting to set an invalid tracker_url =head2 default_keyword $tracker_url Sets the default search to be the same as an already existing keyword search. Returns true on success. Returns C if the keyword does not exist. =head2 process $string The C methods takes a string as argument, and applies the searches to it. Returns the processed string on success. Returns C on error. =head2 errstr When an error occurs, the C method allows you to get access to the error message. C can be called as either a static or object method. i.e. The following are equivalent # Calling errstr as a static method my $linker = HTML::TrackerLink->new( 'badurl' ); die HTML::TrackerLink->errstr; # Calling errstr as an object method my $linker = HTML::TrackerLink->new( 'badurl' ); die $linker->errstr; =head1 TO DO Although the code for this module was extracted from a known working application, this package itself has only basic tests. Please report any bugs encountered. =head1 SUPPORT Bugs should be reported via the CPAN bug tracker at L For other issues, or commercial enhancement or support, contact the author. =head1 AUTHORS Adam Kennedy Eadamk@cpan.orgE =head1 COPYRIGHT Copyright 2002 - 2008 Adam Kennedy. This program is free software; you can redistribute it and/or modify it under the same terms as Perl itself. The full text of the license can be found in the LICENSE file included with this module. =cut