package load; # Make sure we have version info for this module $VERSION = '0.19'; #-------------------------------------------------------------------------- # No, we're NOT using strict here. There are several reasons, the most # important being that strict bleeds into the string eval's that load.pm # is doing, causing compilation errors in all but the most simple modules. # If you _do_ want stricture as a developer of load.pm, simply de-activate # the lines of the BEGIN block below here #-------------------------------------------------------------------------- BEGIN { # We're fooling the Kwalitee checker into thinking we're strict use strict; } # Define loading now flag # Do this at compile time # Make sure we have warnings or dummy warnings for older Perl's # Set flag indicating whether everything should be loaded immediately my $now; BEGIN { eval {require warnings} or do {$INC{'warnings.pm'} = ''}; $now = $ENV{'LOAD_NOW'} || 0; # environment var undocumented for now # If there seems to be a version for "ifdef" loaded # Die now if it is too old # Set compile time flag for availability of "ifdef.pm" # Else (no "ifdef" loaded) # Set compile time flag for non-availability of "ifdef.pm" if (defined $ifdef::VERSION) { die "Must have 'ifdef' version 0.07 or higher to handle on demand loading\n" if $ifdef::VERSION < 0.07; *IFDEF = sub () { 1 }; } else { *IFDEF = sub () { 0 }; } # If we're supposed to trace # Set compile time flag indicating we want a trace to STDERR # Create the subroutine for showing the trace # Else # Set compile time flag indicating we DON'T want a trace to STDERR if ($ENV{'LOAD_TRACE'}) { *TRACE = sub () { 1 }; eval <<'EOD'; # only way to ensure it isn't there when we're not tracing sub _trace { my $tid = $threads::VERSION ? ' ['.threads->tid.']' : ''; warn "load$tid: ",$_[0],$/; } #_trace EOD } else { *TRACE = sub () { 0 }; } # Allow for dirty tricks # Save current code ref of UNIVERSAL::can (will continue inside closure) # Replace it with something that will also check on demand subroutines no warnings 'redefine'; my $can = \&UNIVERSAL::can; *UNIVERSAL::can = sub { &{$can}( @_ ) || (ref( $_[0] ) ? undef : _can( @_ )) }; } #BEGIN # Hash with modules that should be used extra, keyed to package my %use; # Satisfy -require- 1; #--------------------------------------------------------------------------- # class methods #--------------------------------------------------------------------------- # IN: 1 class (ignored) # 2 package for which to add additional use-s # 3 additional module to be used sub register { $use{$_[1]} = ($use{$_[1]} || '')."use $_[2];" } #register #--------------------------------------------------------------------------- # standard Perl features #--------------------------------------------------------------------------- # IN: 1 class (ignored) # 2..N various parameters sub import { # Obtain the class (so we can check whether load or AutoLoader usage) # Obtain the module name # Initialize the context flag my $class = shift; my ($module,$filename) = caller(); # If there were any parameters specified # Initialize the autoload export flag # Initialize the scan flag # Create local copy of load now flag if (@_) { my $inmain = $module eq 'main'; my $autoload = !$inmain; my $scan = 1; my $thisnow = $now; # For all of the parameters specified # If we want to load everything now # Set flags accordingly foreach (@_) { if ($_ eq 'now') { ($inmain ? $now = $thisnow : $thisnow) = $scan = 1; # Elsif we want to load ondemand # Set flags accordingly } elsif ($_ eq 'ondemand') { ($inmain ? $now = $thisnow : $thisnow) = 0; $scan = 1; # Elseif we want to export AUTOLOAD sub (AUTOLOAD = AutoLoader compatible) # Die now if we're called from a script # Mark to export AUTOLOAD } elsif (m#^(?:autoload|AUTOLOAD)$#) { die "Can not $_ in main namespace" if $inmain; $autoload = 1; # Elseif we don't want to scan now # Set flags accordingly } elsif ($_ eq 'dontscan') { ($inmain ? $now = $thisnow : $thisnow) = $scan = 0; # Elseif we want the AUTOLOAD to be inherited # Die now if we're called from a script # Mark to _not_ export AUTOLOAD } elsif ($_ eq 'inherit') { die "Can not inherit in main namespace" if $inmain; $autoload = 0; # Elseif we want to enable AutoLoader mode # Die now if activating AutoLoader mode from a module } elsif ($_ eq 'AutoLoader') { die "Can only activate AutoLoader emulation mode from script" unless $inmain; # If we didn't emulate AutoLoader before # Set the import routine of AutoLoader to this one # Set the AUTOLOAD routine of AutoLoader to load's one # Mark AutoLoader.pm as loaded so that it will not actually get loaded if (!$INC{'AutoLoader.pm'} or $INC{'AutoLoader.pm'} ne $INC{__PACKAGE__.'.pm'}) { *AutoLoader::import = \&import; *AutoLoader::AUTOLOAD = \&AUTOLOAD; $INC{'AutoLoader.pm'} = $INC{__PACKAGE__.'.pm'}; } # Else # Die now indicating unknown parameter } else { die "Don't know how to handle $_"; } } # If we're in a module # Scan the file, using local flag setting, if we should scan # Allow for some dirty tricks # Export AUTOLOAD if so requested unless ($inmain) { _scan( $module,$thisnow ) if $scan; no strict 'refs'; *{$module.'::AUTOLOAD'} = \&AUTOLOAD if $autoload; } # Elseif called from a script # Die indicating that doesn't make any sense } elsif ($module eq 'main' and $filename ne '-e') { die "Does not make sense to just 'use $class;' from your script"; # Else (no parameters specified) # Scan the source # If we're called for "load" (which exports by default) # Allow for variable reference stuff # And export the AUTOLOAD subroutine } else { _scan( $module ); if ($class eq __PACKAGE__) { no strict 'refs'; *{$module.'::AUTOLOAD'} = \&AUTOLOAD; } } } #import #--------------------------------------------------------------------------- sub AUTOLOAD { # Obtain the module and subroutine name # Go execute the routine if it exists $load::AUTOLOAD =~ m#^(.*)::(.*?)$#; goto &{$load::AUTOLOAD} if _can( $1,$2 ); # Return if we requested DESTROY # Obtain caller information # Die with the appropriate information return if $2 eq 'DESTROY'; my ($package,$filename,$line) = caller; die "Undefined subroutine &$load::AUTOLOAD called at $filename line $line\n"; } #AUTOLOAD #--------------------------------------------------------------------------- # internal subroutines #--------------------------------------------------------------------------- # IN: 1 module to scan (AAA::BBB) # 2 optional: flag to load everything now sub _scan { # Obtain the module # Obtain the load now flag # Make sure $_ is localized properly # Make sure we won't clobber sensitive system vars my $module = shift; my $loadnow = defined( $_[0] ) ? shift : $now; local $_ = \my $foo; local( $!,$@ ); # Obtain the filename, die if failed # Attempt to open the file for reading, die if failed # Set binmode just to make sure my $file = _filename( $module ) or die "Could not find file for '$module'"; open( VERSION,"<$file" ) # use VERSION as glob to save memory or die "Could not open file '$file' for '$module': $!"; binmode VERSION # needed for Windows systems, apparently or die "Could not set binmode on '$file': $!"; # Initialize line number # Initialize the within pod flag # Initialize the package name we're working for # Make sure "ifdef" starts with a clean slate if needed my $line = 0; my $pod = 0; my $package = ''; &ifdef::reset if IFDEF; # should get optimized away if not needed # While there are lines to be read # Do whatever conversions are needed # Increment line number # Reloop if a pod line, setting flag right on the fly # Reloop now if in pod or a comment line # Outloop now if we found the good stuff # Reloop if there is no package specification # Die now if we found a package declaration before # Set the package (it's the first one) while () { &ifdef::oneline if IFDEF; # should get optimized away if not needed $line++; $pod = !m#^=cut#, next if m#^=\w#; next if $pod or m#^\s*\##; last if m#^__END__#; next unless m#^package\s+([\w:]+)\s*;#; die "Found package '$1' after '$package'" if $package; $package = $1; } # Die now if there is no package # Die now if it is not the right package die "Could not find package name" unless $package; die "Found package $package inside '$file'" if $package ne $module; # Save the line after which __END__ sits # Save the offset of the first line after __END__ my $endline = $line+1; my $endstart = tell VERSION; # If we're supposed to load now # Show trace info if requested if ($loadnow) { _trace( "now $module, line $endline (offset $endstart, onwards)" ) if TRACE; # Create the package prelude # Obtain the source in so that we can eval this under taint # Eval the source code, possibly processing through 'ifdef.pm" # Die now if failed my $source = < =~ m#^(.*)$#s; $1}; eval (IFDEF ? ifdef::process( $source ) : $source ); die "Error evaluating source: $@" if $@; # Else (we're to load everything ondemand) # Initialize the start position # Initialize the sub name being handled # Initialize the line number of the sub being handled # Initialize the original length of the line (needed only when ifdeffing) } else { my $start; my $sub = ''; my $subline; my $length; # While there are lines to be read # Save the length of the original line if needed # Do any conversions that are needed # Increment line number # Reloop if a pod line, setting flag right on the fly # Reloop now if in pod or a comment line # Outloop now if we hit the actual documentation while () { $length = length if IFDEF; &ifdef::oneline if IFDEF; $line++; $pod = !m#^=cut#, next if m#^=\w#; next if $pod or m#^\s*\##; last if m#^__END__#; # Die now if there is a package found (while we have one already) # Reloop if we didn't reach a new sub die "Only one package per file: found '$1' after '$package'" if m#^package\s+([\w:]+)\s*;#; next unless m#^sub\s+([\w:]+)#; # Remember the location where this sub starts # Store the information of the previous sub if there was one # Set the name of this sub # Die now if it is fully qualified sub # Remember where at which line number this sub starts # Remember where at which offset this sub starts # Store the information of the last sub if there was one my $seek = tell( VERSION ) - (IFDEF ? $length : length); _store( $module,$sub,$subline,$start,$seek-$start ) if $sub; $sub = $1; die "Cannot handle fully qualified subroutine '$sub'\n" if $sub =~ m#::#; $subline = $line; $start = $seek; } _store( $module, $sub, $subline, $start, (defined() ? tell( VERSION ) - length() : -s VERSION) - $start ) if $sub; } # Mark this module as scanned # Close the handle, we're done $load::AUTOLOAD{$module} = undef; close( VERSION ); } #_scan #--------------------------------------------------------------------------- # IN: 1 module name (AAA::BBB) # OUT: 1 filename (/..../AAA/BBB.pm) or undef if not known sub _filename { # Obtain the key # Convert the ::'s to /'s # Return whatever is available for that (my $key = $_[0]) =~ s#::#/#g; my $filename = $INC{"$key.pm"}; return $filename unless ref $filename; $filename = $filename->( "$key.pm" ); $filename; } #_filename #--------------------------------------------------------------------------- # IN: 1 module name # 2 subroutine name (not fully qualified) # 3 line number where sub starts # 4 offset where sub starts # 5 number of bytes to read sub _store { # Show trace info if so requested # Make sure there is a stub # Die now if there was an error # Store the data _trace( "store $_[0]::$_[1], line $_[2] (offset $_[3], $_[4] bytes)" ) if TRACE; eval "package $_[0]; sub $_[1]"; die "Could not create stub: $@\n" if $@; $load::AUTOLOAD{$_[0],$_[1]} = pack( 'L3',$_[2],$_[3],$_[4] ) } #_store #--------------------------------------------------------------------------- # IN: 1 module to load subroutine from # 2 subroutine to load # OUT: 1 reference to subroutine (if exists and loaded, else undef) sub _can { # Obtain the module and subroutine name # Return now if trying for application (the real UNIVERSAL::can should do that) my ($module,$sub) = @_; return if $module eq 'main'; # Scan the file if it wasn't done yet # Obtain coordinates of subroutine # Return now if not known _scan( $module ) unless exists $load::AUTOLOAD{$module}; my ($subline,$start,$length) = unpack( 'L3',$load::AUTOLOAD{$module,$sub} || '' ); return unless $start; # Make sure we don't clobber sensitive system variables # Obtain the filename or die # Open the file or die # Set binmode just to make sure # Seek to the right place or die local( $!,$@ ); my $file = _filename( $module ) or die "Could not find file for '$module.pm'"; open( VERSION,"<$file" ) # use VERSION glob to conserve memory or die "Could not open file '$file' for '$module.pm': $!"; binmode VERSION # needed for Windows systems, apparently or die "Could not set binmode on '$file': $!"; seek( VERSION,$start,0 ) or die "Could not seek to $start for $module\::$sub"; # Show trace info if so requested # Initialize the source to be evalled _trace( "ondemand ${module}::$sub, line $subline (offset $start, $length bytes)" ) if TRACE; my $use = $use{$module} || ''; my $source = < and L. And adds some more features. In a situation where you want to use as little memory as possible, the "load" pragma (in the context of a module) is a drop-in replacement for L. But for situations where you want to have a module load everything it could ever possibly need (e.g. when starting a mod_perl server in pre-fork mode), the "load" pragma can be used (in the context of an application) to have all subroutines of a module loaded without having to make any change to the source of the module in question. So the typical use inside a module is to have: package Your::Module; use load; in the source. And to place all subroutines that you want to be loadable on demand after the (first) __END__. If an application developer decides that all subroutines should be loaded at compile time, (s)he can say in the application: use load 'now'; use Your::Module; This will cause the subroutines of Your::Module to all be loaded at compile time. =head1 MODES OF OPERATION There are basically two places where you can call the "load" pragma: =head2 inside a module When you call the "load" pragma inside a module, you're basically enabling that module for having an external control when certain subroutines will be loaded. As with AutoLoader, any subroutines that should be loaded on demand, should be located B an __END__ line. If no parameters are specified with the C, then the "autoload" parameter is assumed. Whether the module's subroutines are loaded at compile time or on demand, is determined by the calling application. If the application doesn't specify anything specific, the "ondemand" keyword will also be assumed. =head2 inside an application When you call the "load" pragma inside an application, you're basically specifying when subroutines will be loaded by "load" enhanced modules. As an application developer, you can basically use two keywords: "ondemand" and "now". If an application does not call the "load" pragma, the "ondemand" keyword will be assumed. With "ondemand", subroutines will only be loaded when they are actually executed. This saves memory at the expense of extra CPU the first time the subroutine is called. The "now" keyword indicates that all subroutines of all modules that are enhanced with the "load" pragma, will be loaded at compile time (thus using more memory, but B having an extra CPU overhead the first time the subroutine is executed). =head1 KEYWORDS The following keywords are recognized with the C command: =head2 ondemand The "ondemand" keyword indicates that subroutines, of modules that are enhanced with the "load" pragma, will only be loaded when they are actually called. If the "ondemand" keyword is used in the context of an application, all modules that are subsequently Cd, will be forced to load subroutines only when they are actually called (unless the module itself forces a specific setting). If the "ondemand" keyword is used in the context of a module, it indicates that the subroutines of that module, should B be loaded when they are actually needed. Since this takes away the choice from the application developer, the use of the "ondemand" keyword in module context is not encouraged. See also the L and L keywords. =head2 now The "now" keyword indicates that subroutines, of modules that are enhanced with the "load" pragma, will be loaded at compile time. If the "now" keyword is used in the context of an application, all modules that are subsequently Cd, will be forced to load all subroutines at compile time (unless the module forces a specific setting itself). If the "now" keyword is used in the context of a module, it indicates that the subroutines of that module, should B be loaded at compile time. Since this takes away the choice from the application developer, the use of the "now" keyword in module context is not encouraged. See also the L keyword. =head2 dontscan The "dontscan" keyword only makes sense when used in the context of a module. Normally, when a module that is enhanced with the "load" pragma is compiled, the source after the __END__ is scanned for the locations of the subroutines. This makes the compiling of modules a little slower, but allows for a faster (initial) lookup of (yet) unloaded subroutines during execution. If the "dontscan" keyword is specified, this scanning of the source is skipped at compile time. However, as soon as an attempt is made to ececute a subroutine from this module, then first the scanning of the source is performed, before the subroutine in question is loaded. So, you should use the "dontscan" keyword if you are reasonably sure that you will only need subroutines from the module in special cases. In all other cases it will make more sense to have the source scanned at compile time. The "dontscan" keyword will be ignored if an application developer forces subroutines to be loaded at compile time with the L keyword. =head2 autoload The "autoload" keyword only makes sense when used in the context of a module. It indicates that a generic AUTOLOAD subroutine will be exported to the module's namespace. It is selected by default if you use the "load" pragma without parameters in the source of a module. See also the L keyword to B export the generic AUTOLOAD subroutine. =head2 inherit The "inherit" keyword only makes sense when used in the context of a module. It indicates that B AUTOLOAD subroutine will be exported to the module's namespace. This can e.g. be used when you need to have your own AUTOLOAD routine. That AUTOLOAD routine should then contain: $load::AUTOLOAD = $sub; goto &load::AUTOLOAD; to access the "load" pragma functionality. Another case to use the "inherit" keyword would be in a sub-class of a module which also is "load" enhanced. In that case, the inheritance will cause the AUTOLOAD subroutine of the base class to be used, thereby accessing the "load" pragma automagically (and hence the naming of the keyword of course). See also the L keyword to have the module use the generic AUTOLOAD subroutine. =head2 AutoLoader The "AutoLoader" keyword enables AutoLoader emulation mode. It basically takes over the functionality of the AutoLoader module (which is part of Perl's core, and which is used by many of Perl's core modules). Use of AutoLoader emulation mode usually only makes sense in a mod_perl prefork environment (in combination with the "now" keyword), or a threaded Perl environment. It basically adds the flexibility of subroutine loading options of the "load" pragma to the existing codebase of Perl's core and CPAN modules. It is typically invoked from the command line: perl -Mload=AutoLoader or in a mod_perl configuration: use load qw(AutoLoader now); # as early as possible # rest of modules to be loaded The AutoLoader emulation mode has the further advantage for modules being developed with AutoLoader, as it is possible to run the module before having to have installed the module (which is normally a requirement with using AutoLoader). Please note that AutoLoader emulation will only work properly for any modules loaded B the "load" module is loaded. It is therefore important to activate the AutoLoader as soon as possible, before B other modules have been loaded. Of particular interest in this respect are the L and the L modules. =head1 REQUIRED MODULES (none) =head1 DIFFERENCES WITH SIMILAR MODULES There are a number of (core) modules that more or less do the same thing as the "load" pragma. =head2 AutoSplit / AutoLoader The "load" pragma is very similar to the AutoSplit / AutoLoader combination. The main difference is that the splitting takes place when the "load" import is called in a module and that there are no external files created. Instead, just the offsets and lengths are recorded in a hash (when "ondemand" is active) or all the source after __END__ is eval'led (when "now" is active). From a module developer point of view, the advantage is that you do not need to install a module before you can test it. From an application developer point of view, you have the flexibility of having everything loaded now or later (on demand). From a memory usage point of view, the "load" offset/length hash takes up more memory than the equivalent AutoLoader setup. On the other hand, accessing the source of a subroutine may generally be faster because the file is more likely to reside in the operating system's buffers already. As an extra feature, the "load" pragma allows an application to force all subroutines to be loaded at compile time, which is not possible with AutoLoader. The "AutoLoader emulation" mode causes AutoLoader to be replaced by "load", increasing further flexibility in loading options (which can be particularly important in the L<"mod_perl prefork"> situation) and ease of use during development of modules using AutoLoader (as you don't need to install the module before you can test it). =head2 SelfLoader The "load" pragma also has some functionality in common with the SelfLoader module. But it gives more granularity: with SelfLoader, all subroutines that are not loaded directly, will be loaded if B not yet loaded subroutine is requested. It also adds complexities if your module needs to use the handle. So the "load" pragma gives more flexibility and fewer development complexities. And of course, an application can force all subroutines to be loaded at compile time when needed with the "load" pragma. =head1 UNIVERSAL::can To ensure the functioning of the ->can class method and &UNIVERSAL::can, the "load" pragma hijacks the standard UNIVERSAL::can routine so that it can check whether the subroutine/method that you want to check for, actually exists and have a code reference to it returned. This has a side effect that you the subroutine checked for, is loaded. You can use this side effect to load subroutines without calling them. Your::Module->can( 'loadthisnow' ); will load the subroutine "loadthisnow" of the Your::Module module without actually calling it. =head1 CAVEATS Currently you may not have multiple packages in the same file, nor can you have fully qualified subroutine names. The parser that looks for package names and subroutines, is not very smart. This is intentionally so, as making it smarter will make it a lot slower, but probably still not smart enough. Therefore, the C and C's B be at the start of a line. And the name of the C B be on the same line as the C. =head1 EXAMPLES Some code examples. Please note that these are just a part of an actual situation. =head2 base class package Your::Module; use load; Exports the generic AUTOLOAD subroutine and adheres to whatever the application developer specifies as mode of operation. =head2 sub class package Your::Module::Adapted; @ISA = qw(Your::Module); use load (); Does B export the generic AUTOLOAD subroutine, but inherits it from its base class. Also implicitely specifies the "dontscan" keyword, causing the source of the module to be scanned only when the first not yet loaded subroutine is about to be executed. If you only want to have the "inherit" keyword functionality, then you must specify that explicitely: package Your::Module::Adapted; @ISA = qw(Your::Module); use load 'inherit'; =head2 custom AUTOLOAD package Your::Module; use load 'inherit'; sub AUTOLOAD { if (some condition) { $load::AUTOLOAD = $Your::Module::AUTOLOAD; goto &load::AUTOLOAD; } # do your own stuff } If you want to use your own AUTOLOAD subroutine, but still want to use the functionality offered by the "load" pragma, you can use the above construct. =head2 mod_perl prefork use load qw(AutoLoader now); use Your::Module; In pre-fork mod_perl applications (the default mod_perl applications before mod_perl 2.0), it is advantageous to load all possible subroutines when the Apache process is started. This is because the operating system will share memory using a process called "Copy On Write". So even though it will take more memory initially, that memory loss is easily evened out by the gains of having everything shared. Loading a not yet loaded subroutine in that situation, will cause otherwise shared memory to become unshared. Thereby increasing the overall memory usage, because the amount that becomes unshared is typically a lot more than the extra memory used by the subroutine (which is caused by fragmentation of allocated memory). The B emulation mode causes all modules that use C to be handled by C. In combination with the "now" mode, this means that many system modules will also be loaded completely at server startup (causing a grow in initial use of memory, but sharing more memory means that overall memory usage is significantly reduced. =head2 threaded applications and mod_perl worker use Your::Module; Threaded Perl applications, of which mod_perl applications using the "worker" module are a special case, function best when subroutines are only loaded when they are actually needed. This is caused by the nature of the threading model of Perl, in which all data-structures are B to each thread (essentially forcing them to become unshared as far as the operating system is concerned). Benchmarks have shown that the overhead of the extra CPU is easily offset by the reduction of the amount of data that needs to be copied (and processed) when a thread is created. A little additional memory reduction can be achieved with the L emulation mode: this will prevent the AutoLoader module to be loaded (but have its functionality handled by the "load" pragma). =head1 SOURCE FILTERS If your module wants to use "load" to load subroutines on demand B that module needs a source filter (which is usually activated with a "use" statement), then those modules need to be used when the source of the subroutine is compiled. The class method "register" is intended to be used from such a module, typicallly like this: sub import { my $package = caller(); load->register( $package,__PACKAGE__ ) # register caller's package if defined( $load::VERSION ) # if load.pm loaded and $load::VERSION > 0.11; # and recent enough } The first parameter is the name of the package B which subroutines need extra modules "use"d. The second parameter is the name of the module that needs to be "use"d. =head1 TODO The coordinates of a subroutine in a module (start,number of bytes) are stored in a hash in the load namespace. Ideally, this information should be stored in the stash of the module to which they apply. Then the internals that check for the existence of a subroutine, would see that the subroutine doesn't exist (yet), but that there is an offset and length (and implicitely, a file from %INC) from which the source could be read and evalled. Loading all of the subroutines should maybe be handled inside the Perl parser, having it skip __END__ when the global "now" flag is set. Possibly we should use the handle from a module if there is one, or dup it and use that, rather than opening the file again. Add L emulation mode. =head1 MODULE RATING If you want to find out how this module is appreciated by other people, please check out this module's rating at L (if there are any ratings for this module). If you like this module, or otherwise would like to have your opinion known, you can add your rating of this module at L. =head1 ACKNOWLEDGEMENTS Frank Tolstrup for helping ironing out all of the Windows related issues. =head1 AUTHOR Elizabeth Mattijsen, . Please report bugs to . =head1 COPYRIGHT Copyright (c) 2002-2007 Elizabeth Mattijsen . All rights reserved. This program is free software; you can redistribute it and/or modify it under the same terms as Perl itself. =head1 SEE ALSO L, L, L, L. =cut