package HTML::WikiConverter::Socialtext;

use warnings;
use strict;

use base 'HTML::WikiConverter';

our $VERSION = '0.03';

=head1 NAME

HTML::WikiConverter::Socialtext - Convert HTML to Socialtext markup

=head1 SYNOPSIS

  use HTML::WikiConverter;
  my $wc = HTML::WikiConverter->new( dialect => 'Socialtext' );
  print $wc->html2wiki( $html );

=head1 DESCRIPTION

This module contains rules for converting HTML into Socialtext
markup. See L<HTML::WikiConverter> for additional usage details.

=cut

# Returns a reference to the hash that maps HTML tag names to the
# conversion rules used for this dialect.  Tags whose rule is
# { alias => 'x' } are rendered exactly like tag 'x'.
sub rules {
    my %rules = (
        hr => { replace => "\n----\n" },
        br => { replace => "\n" },

        # Headings: one caret per heading level, followed by a space.
        h1 => { start => '^ ',      block => 1, trim => 'both', line_format => 'single' },
        h2 => { start => '^^ ',     block => 1, trim => 'both', line_format => 'single' },
        h3 => { start => '^^^ ',    block => 1, trim => 'both', line_format => 'single' },
        h4 => { start => '^^^^ ',   block => 1, trim => 'both', line_format => 'single' },
        h5 => { start => '^^^^^ ',  block => 1, trim => 'both', line_format => 'single' },
        h6 => { start => '^^^^^^ ', block => 1, trim => 'both', line_format => 'single' },

        p => { block => 1, line_format => 'multi' },

        # Inline phrase markup.  <u> is emitted with the same markers as <i>.
        b      => { start => '*', end => '*', line_format => 'single', trim => 'both' },
        strong => { alias => 'b' },
        i      => { start => '_', end => '_', line_format => 'single', trim => 'both' },
        em     => { alias => 'i' },
        u      => { start => '_', end => '_', line_format => 'single', trim => 'both' },
        strike => { start => '-', end => '-', line_format => 'single', trim => 'both' },
        s => { alias => 'strike' },

        tt   => { start => '`', end => '`', trim => 'both', line_format => 'single' },
        code => { alias => 'tt' },
        pre  => { start => "\n.pre\n", end => "\n.pre\n", line_prefix => '', line_format => 'blocks' },

        a   => { replace => \&_link },
        img => { replace => \&_image },

        # Tables: each cell opens with "| " and each row closes with " |".
        # postprocess_output() tidies the whitespace these rules leave behind.
        table => { block => 1, line_format => 'multi', trim => 'none' },
        tr => { end => " |\n" },
        td => { start => '| ', end => ' ' },
        th => { alias => 'td' },

        # Lists: the bullet for every item is computed by _li_start().
        ul => { line_format => 'multi', block => 1 },
        ol => { alias => 'ul' },
        li => { start => \&_li_start, trim => 'leading' },
        dl => { alias => 'ul' },
        dt => { alias => 'li' },
        dd => { alias => 'li' },
    );

    return \%rules;
}

# Builds the text that opens a list item: a newline, the bullet character
# repeated once per enclosing list, and a single space.
#
# The bullet is chosen from the item's immediate parent ('*' for <ul>,
# '#' for <ol>, '>' for <dl>); any other parent yields no bullet at all.
sub _li_start {
    my( $self, $node, $rules ) = @_;

    my %bullet_for = ( ul => '*', ol => '#', dl => '>' );

    # Anchor the pattern so that only real list containers are counted,
    # not every tag whose name merely contains "ul", "ol" or "dl".
    my @parent_lists = $node->look_up( _tag => qr/^(?:ul|ol|dl)$/ );
    my $depth        = @parent_lists;

    my $parent     = $node->parent;
    my $parent_tag = $parent ? $parent->tag : '';
    $parent_tag = '' unless defined $parent_tag;

    my $bullet = exists $bullet_for{$parent_tag} ? $bullet_for{$parent_tag} : '';

    return "\n" . ( $bullet x $depth ) . ' ';
}

# Converts an <a> element.
#
#   * Link text that contains "image:" is returned as is.
#   * An href of the form "index.cgi?Title" is emitted as [text] when the
#     text and the title are the same name after normalisation, and as
#     "text"[Title] otherwise.
#   * Any other href is emitted bare when it equals the link text, and as
#     "text"<url> otherwise.
sub _link {
    my( $self, $node, $rules ) = @_;

    # Use definedness rather than truthiness so that a literal "0" survives.
    my $url = $node->attr('href');
    $url = '' unless defined $url;

    my $text = $self->get_elem_contents($node);
    $text = '' unless defined $text;

    # Drop square brackets around the text; they would clash with link markup.
    $text =~ s/\[(.*)\]/$1/g;

    return $text if $text =~ /image:/;

    # Everything after "index.cgi?" is treated as the target page title.
    my $title = '';
    if( $url =~ /^index\.cgi\?/ ) {
        ( $title = $url ) =~ s/^index\.cgi\?//;
    }

    if( length $title ) {
        my $title_clean = $self->_get_clean_name($title);
        my $text_clean  = $self->_get_clean_name($text);

        return "[$text]" if $text_clean eq $title_clean;
        return "\"$text\"[$title]";
    }

    return $url if $text eq $url;
    return "\"$text\"<$url>";
}

# Normalises a page name for comparison: underscores, slashes, hyphens,
# apostrophes and "%20" all become spaces, and the result is lowercased.
sub _get_clean_name {
    my( $self, $text ) = @_;

    $text =~ tr{_/'\-}{ };
    $text =~ s/\%20/ /g;

    return lc $text;
}

# Converts an <img> element.
#
# A src that starts with http:// or https:// is returned unchanged.  Any
# other src is reduced to its file name (directory part and "?action=..."
# query removed) and wrapped as "{image: name} ".  An element with a
# missing or empty src produces no output.
sub _image {
    my( $self, $node, $rules ) = @_;

    my $image_file = $node->attr('src');
    return '' unless defined $image_file && length $image_file;

    # Test the scheme at the start of the string only, so that a local file
    # whose name happens to contain "http" is still treated as local.
    return $image_file if $image_file =~ m{^https?://}i;

    # Remove the query first so a slash inside it cannot be mistaken for
    # the last directory separator.
    $image_file =~ s/\?action=.*$//;
    $image_file =~ s{.*/([^/]+)$}{$1};

    return '{image: ' . $image_file . '} ';
}

# Per-node hook run before conversion: hands <a> elements to strip_aname()
# and <caption> elements to caption2para().  Nodes without a tag are
# left alone.
sub preprocess_node {
    my( $self, $node ) = @_;

    # Read the tag once, and check it before comparing it against anything.
    my $tag = $node->tag;
    return unless $tag;

    $self->strip_aname($node) if $tag eq 'a';
    $self->caption2para($node) if $tag eq 'caption';
}

# Cleans up the generated markup in place ($outref is a reference to the
# output string).  The table and list rules leave stray newlines and
# indentation around cell separators; these substitutions remove them.
sub postprocess_output {
    my( $self, $outref ) = @_;

    # A list item that opens a table cell belongs on the cell's own line.
    $$outref =~ s/\|\n([*#])/| $1/g;

    # Join indented cell separators back onto the preceding line.
    $$outref =~ s/\n +\| +/ | /g;
    $$outref =~ s/\n +\|\n/ |\n/g;
}

=head1 AUTHOR

Kirsten L. Jones

=head1 BUGS

Please report any bugs or feature requests to
C<bug-html-wikiconverter-socialtext at rt.cpan.org>, or through the web
interface at
L<http://rt.cpan.org/NoAuth/ReportBug.html?Queue=HTML-WikiConverter-Socialtext>.
I will be notified, and then you'll automatically be notified of progress on
your bug as I make changes.

=head1 SUPPORT

You can find documentation for this module with the perldoc command.

    perldoc HTML::WikiConverter::Socialtext

You can also look for information at:

=over 4

=item * AnnoCPAN: Annotated CPAN documentation

L<http://annocpan.org/dist/HTML-WikiConverter-Socialtext>

=item * CPAN Ratings

L<http://cpanratings.perl.org/d/HTML-WikiConverter-Socialtext>

=item * RT: CPAN's request tracker

L<http://rt.cpan.org/NoAuth/Bugs.html?Dist=HTML-WikiConverter-Socialtext>

=item * Search CPAN

L<http://search.cpan.org/dist/HTML-WikiConverter-Socialtext>

=back

=head1 COPYRIGHT & LICENSE

Copyright 2006 Kirsten L. Jones, all rights reserved.

This program is free software; you can redistribute it and/or modify it
under the same terms as Perl itself.

=cut

1;