package Compress::LeadingBlankSpaces; use 5.004; use strict; use vars qw($VERSION); $VERSION = '0.06'; sub new { # class/instance constructor, ready to sub-class my $proto = shift; my $class = ref($proto) || $proto; my $self = {}; bless ($self, $class); $self->{TAGS} = []; # a reference to the array of special tags $self->{TAGS}->[0]->{HEADER} = '
{TAGS}->[0]->{FOOTER} = '';
$self->{TAGS}->[1]->{HEADER} = '';
$self->{TAGS}->[2]->{HEADER} = '{TAGS}->[2]->{FOOTER} = '';
$self->{FORMATTED} = -1; # index of currently active special tag.
# we should never compress blank spaces within the FORMATTED content.
return $self;
}
# sub format_status takes one optional parameter.
# If called with an argument, it sets the FORMATTED field;
# otherwise it just returns the value held by that field,
#
sub format_status {
my $self = shift;
my $val = shift;
$self->{FORMATTED} = $val if defined ($val);
return $self->{FORMATTED};
}
sub squeeze_string {
my $self = shift;
my $buf = shift;
return '' unless $buf; # empty, zero or undefined input...
chomp $buf; # the problem of the file's last character that is not a 'new-string'
# was brought to my attention by Chris Clandingboel on 07/29/04. Thanks Chris!
if ( $self->{FORMATTED} >= 0 ){
# no compression:
my $end_tag = $self->{TAGS}->[$self->{FORMATTED}]->{FOOTER};
# note: full end-tag should appear within one string only!
$self->{FORMATTED} = -1 if $buf =~ /$end_tag/i; # resume the compression
# since the next input
} else { # try to compress
$buf =~ s/^\s+(\S.*)/$1/;
while ($buf =~ /^\s/o){
$buf =~ s/^\s+//o;
}
my $index = 0;
foreach ( @{ $self->{TAGS} } ){
my $beg_tag = $self->{TAGS}->[$index]->{HEADER};
if ($buf =~ /$beg_tag/i){ # it might be a special tag
if ($buf =~ /$beg_tag>/i # simple
or $buf =~ /$beg_tag\s/i # has in-line parameters
or $buf =~ /$beg_tag$/i # has next-line parameters
){ # this _is_ a special tag
$self->{FORMATTED} = $index; # hold on the compression
# since the next input
}
}
last if $self->{FORMATTED} >= 0;
$index += 1;
}
}
return '' unless length($buf) > 0;
return $buf."\n";
}
1;
__END__
=head1 NAME
Compress::LeadingBlankSpaces - Perl class to compress leading blank spaces in (HTML, JavaScript, etc.) web content.
=head1 SYNOPSIS
use Compress::LeadingBlankSpaces;
my $lco_r = Compress::LeadingBlankSpaces->new();
. . .
my $source_string = ' some content'."\n";
. . .
my $outgoing_string = $lco_r->squeeze_string ($source_string);
. . .
my $squeeze_status = $lco_r->format_status(); # to check later...
=head1 DESCRIPTION
This class provides the functionality for the most simple web content compression.
Basically, the outgoing web content (HTML, JavaScript, etc.) contains a lot of leading blank spaces,
because of being structured on development stage.
Usually, the browser ignores all leading blank spaces.
Indeed, the amount of those blank spaces is significant
and could be estimated as 10 to 20 percent of the length of regular web page.
We can reduce this part of the web traffic on busy servers
with no visible impact on transferred web content. This could be helpful
especially for old browsers incapable to understand modern content compression.
The main functionality of this class is concentrated within the C