package File::LocalizeNewlines; =pod =head1 NAME File::LocalizeNewlines - Localize the newlines for one or more files =head1 DESCRIPTION For people that routinely work with a mixture of different platforms that have conflicting newline formats (mainly *NIX and Win32) there are a number of different situations that can result in files having their newlines get corrupted. File::LocalizeNewlines provides a mechanism for one off or bulk detection and conversion of these files to the newline style for the local platform. The module implements the conversion using a standard "universal line seperator" regex, which ensures that files with any of the different newlines, plus a couple of common "broken" newlines, including multiple different types mixed in the same file, are all converted to the local platform's newline style. =head1 METHODS =cut use 5.005; use strict; use File::Spec 0.80 (); use File::Find::Rule 0.20 (); use File::Slurp 9999.04 (); use Class::Default 1.0 (); use FileHandle 0 (); use Params::Util 0.10 '_INSTANCE'; use vars qw{$VERSION @ISA}; BEGIN { $VERSION = '1.12'; @ISA = 'Class::Default'; } ##################################################################### # Constructor and Accessors =pod =head2 new param => value, ... The C constructor creates a new conversion object. By default, the conversion object will process all files and convert them to the local platform's newline format. Takes some optional parameters =over =item filter =E File::Find::Rule The C param allows you to provide an instantiate L object, that will used to determine the list of files to check or process. =item newline =E $newline The C option allows you to provide an alternative newline format to the local one. The newline format should be provided as a literal string. For example, to force Win32 newlines, you would use my $Object = File::LocalizeNewlines->new( newline => "\015\012" ); =item verbose =E 1 The C option will cause the C object to print status information to C as it runs. =back Returns a new C object. =cut sub new { my $class = ref $_[0] ? ref shift : shift; my %args = @_; # Create the basic object my $self = bless { }, $class; # Check the file filter if ( _INSTANCE($args{filter}, 'File::Find::Rule') ) { $self->{Find} = $args{filter}; $self->{Find}->file->relative; } # Allow for a custom platform $self->{newline} = $args{newline} if $args{newline}; # Check the verbose mode if ( _CAN($args{verbose}, 'print') ) { $self->{verbose} = $args{verbose}; } elsif ( $args{verbose} ) { $self->{verbose} = 1; } $self; } =pod =head2 Find The C accessor returns the L object that will be used for the file search. =cut sub Find { my $self = $_[0]->_self; $self->{Find} or File::Find::Rule->file->relative; } =pod =head2 newline The C accessor returns the newline format that will be used in the localisation process. =cut sub newline { $_[0]->_self->{newline} or "\n"; } ##################################################################### # Methods =pod =head2 localized $file The C method takes an argument of a single file name or file handle and tests it to see it is localized correctly. Returns true if localized correctly, false if not, or C on error. =cut sub localized { my $self = shift->_self; my $file = (defined $_[0] and ref $_[0]) ? shift : (defined $_[0] and -f $_[0]) ? shift : return undef; my $newline = $self->newline; my $content = File::Slurp::read_file( $file ); # Create the localized version of the file my $localized = $content; $localized =~ s/(?:\015{1,2}\012|\015|\012)/$newline/sg; $localized eq $content; } =pod =head2 find $dir The C method takes the path for a dir (or file) and returns a list of relative files names for all of the files that do B have their newlines correctly localized. Returns a list of file names, or the null list if there are no files, or if an incorrect path was provided. =cut sub find { my $self = shift->_self; my $path = _DIRECTORY(shift) or return (); # Find all the files to test my @files = $self->Find->in( $path ); @files = grep { ! $self->localized( File::Spec->catfile( $path, $_ ) ) } @files; @files; } =pod =head2 localize $file | $dir The C method takes a file, file handle or directory as argument and localizes the newlines of the file, or all files within the directory (that match the filter if one was provided). Returns the number of files that were localized, zero if no files needed to be localized, or C on error. =cut sub localize { my $self = shift->_self; my $path = (defined $_[0] and ref $_[0]) ? shift : (defined $_[0] and -e $_[0]) ? shift : return undef; # Switch on file or dir (-f $path or ref $_[0]) ? $self->_localize_file( $path ) : $self->_localize_dir( $path ); } sub _localize_dir { my $self = shift->_self; my $path = _DIRECTORY(shift) or return undef; # Find the files to localise my @files = $self->Find->in( $path ); # Localize the files my $count = 0; my $newline = $self->newline; foreach ( @files ) { my $file = File::Spec->catfile( $path, $_ ); my $content = File::Slurp::read_file( $file ); my $localized = $content; $localized =~ s/(?:\015{1,2}\012|\015|\012)/$newline/sg; next if $localized eq $content; File::Slurp::write_file( $file, $localized ) or return undef; $self->_message( "Localized $file\n" ); $count++; } $count; } sub _localize_file { my $self = shift->_self; my $file = (defined $_[0] and ref $_[0]) ? shift : (defined $_[0] and -f $_[0]) ? shift : return undef; # Does the file need to be localised my $newline = $self->newline; my $content = File::Slurp::read_file( $file ); my $localized = $content; $localized =~ s/(?:\015{1,2}\012|\015|\012)/$newline/sg; return 0 if $content eq $localized; # Save the localised version File::Slurp::write_file( $file, $localized ) or return undef; $self->_message( "Localized $file\n" ) unless ref $file; 1; } sub _message { my $self = shift; return 1 unless defined $self->{verbose}; my $message = shift; $message .= "\n" unless $message =~ /\n$/; if ( _CAN( $self->{verbose}, 'print' ) ) { $self->{verbose}->print( $message ); } else { print STDOUT $message; } } sub _CAN { (_INSTANCE($_[0], 'UNIVERSAL') and $_[0]->can($_[1])) ? shift : undef; } sub _DIRECTORY { (defined $_[0] and -d $_[0]) ? shift : undef; } 1; =pod =head1 SUPPORT Bugs should always be submitted via the CPAN bug tracker L For other issues, contact the maintainer. =head1 AUTHOR Adam Kennedy Eadamk@cpan.orgE =head1 ACKNOWLEDGEMENTS Thank you to Phase N (L) for permitting the open sourcing and release of this distribution. L support added by David Dick Eddick@cpan.orgE =head1 COPYRIGHT Copyright 2005 - 2009 Adam Kennedy. This program is free software; you can redistribute it and/or modify it under the same terms as Perl itself. The full text of the license can be found in the LICENSE file included with this module. =cut