package Catalyst::Plugin::Session::State::URI; use base qw/Catalyst::Plugin::Session::State Class::Accessor::Fast/; use strict; use warnings; use HTML::TokeParser::Simple; use MIME::Types; use MRO::Compat; use URI; use URI::Find; use URI::QueryParam; our $VERSION = '0.08'; __PACKAGE__->mk_accessors(qw/_sessionid_from_uri _sessionid_to_rewrite/); sub get_session_id { my ( $c, @args ) = @_; return $c->_sessionid_from_uri || $c->maybe::next::method(@args); } sub set_session_id { my ( $c, $sid, @args ) = @_; $c->_sessionid_to_rewrite($sid); $c->maybe::next::method($sid, @args); } sub delete_session_id { my ( $c, @args ) = @_; $c->_sessionid_from_uri(undef); $c->_sessionid_to_rewrite(undef); $c->maybe::next::method(@args); } sub setup_session { my $c = shift(); $c->maybe::next::method(@_); my %defaults = ( rewrite => 1, no_rewrite_if_cookie => 1, ); my $config = $c->config->{session} ||= {}; foreach my $key ( keys %defaults ) { $config->{$key} = $defaults{$key} unless exists $config->{$key}; } } sub finalize { my $c = shift; $c->session_rewrite_if_needed; return $c->maybe::next::method(@_); } sub session_rewrite_if_needed { my $c = shift; my $sid = $c->_sessionid_to_rewrite || $c->_sessionid_from_uri; if ( $sid and $c->session_should_rewrite ) { $c->log->debug("rewriting response elements to include session id") if $c->debug; if ( $c->session_should_rewrite_redirect ) { $c->rewrite_redirect_with_session_id($sid); } if ( $c->session_should_rewrite_body ) { $c->rewrite_body_with_session_id($sid); } } } sub rewrite_body_with_session_id { my ( $c, $sid ) = @_; if ( ($c->response->content_type || '') =~ /html/ # XML too? or (!$c->response->content_type and $c->response->body =~ /^\s*<[?!]?\s*\w+/ ), # if it looks like html ) { $c->rewrite_html_with_session_id($sid); } else { $c->rewrite_text_with_session_id($sid); } } sub _session_rewriting_html_tag_map { return { a => "href", form => "action", link => "href", img => "src", script => "src", }; } sub rewrite_html_with_session_id { my ( $c, $sid ) = @_; my $p = HTML::TokeParser::Simple->new( string => ($c->response->body || return) ); $c->log->debug("Rewriting HTML body with the token parser") if $c->debug; my $tag_map = $c->_session_rewriting_html_tag_map; my $body = ''; while ( my $token = $p->get_token ) { if ( my $tag = $token->get_tag ) { # rewrite tags according to the map if ( my $attr_name = $tag_map->{$tag} ) { if ( defined(my $attr_value = $token->get_attr($attr_name) ) ) { $attr_value = $c->uri_with_sessionid($attr_value, $sid) if $c->session_should_rewrite_uri($attr_value); $token->set_attr( $attr_name, $attr_value ); } } } $body .= $token->as_is; } $c->response->body($body); } sub rewrite_text_with_session_id { my ( $c, $sid ) = @_; my $body = $c->response->body || return; $c->log->debug("Rewriting plain body with URI::Find") if $c->debug; URI::Find->new(sub { my ( $uri, $orig_uri ) = @_; if ( $c->session_should_rewrite_uri($uri) ) { my $rewritten = $c->uri_with_sessionid($uri, $sid); if ( $orig_uri =~ s/\Q$uri/$rewritten/ ) { # try to keep formatting return $orig_uri; } elsif ( $orig_uri =~ /^(<(?:URI:)?).*(>)$/ ) { return "$1$rewritten$2"; } else { return $rewritten; } } else { return $orig_uri; } })->find( \$body ); $c->response->body( $body ); } sub rewrite_redirect_with_session_id { my ( $c, $sid ) = @_; my $location = $c->response->location || return; $c->log->debug("Rewriting location header") if $c->debug; $c->response->location( $c->uri_with_sessionid($location, $sid) ) if $c->session_should_rewrite_uri($location); } sub session_should_rewrite { my $c = shift; return unless $c->config->{session}{rewrite}; if ( $c->isa("Catalyst::Plugin::Session::State::Cookie") and $c->config->{session}{no_rewrite_if_cookie} ) { return if defined($c->get_session_cookie); } return 1; } sub session_should_rewrite_type { my $c = shift; if ( my $types = $c->config->{session}{rewrite_types} ) { my @req_type = $c->response->content_type; # split foreach my $type ( @$types ) { if ( ref($type) ) { return 1 if $type->( $c, @req_type ); } else { return 1 if lc($type) eq $req_type[0]; } } return; } else { return 1; } } sub session_should_rewrite_body { my $c = shift; return $c->session_should_rewrite_type; } sub session_should_rewrite_redirect { my $c = shift; ($c->response->status || 0) =~ /^\s*3\d\d\s*$/; } sub uri_for { my ( $c, $path, @args ) = @_; return $c->config->{session}{overload_uri_for} ? $c->uri_with_sessionid($c->maybe::next::method($path, @args)) : $c->maybe::next::method($path, @args); } sub uri_with_sessionid { my ( $c, $uri, $sid ) = @_; $sid ||= $c->sessionid; my $uri_obj = eval { URI->new($uri) } || return $uri; return $c->config->{session}{param} ? $c->uri_with_param_sessionid($uri_obj, $sid) : $c->uri_with_path_sessionid($uri_obj, $sid); } sub uri_with_param_sessionid { my ( $c, $uri_obj, $sid ) = @_; my $param_name = $c->config->{session}{param}; $uri_obj->query_param( $param_name => $sid ); return $uri_obj; } sub uri_with_path_sessionid { my ( $c, $uri_obj, $sid ) = @_; $uri_obj->path( join( "/-/", $uri_obj->path, $sid ) ); return $uri_obj; } sub session_should_rewrite_uri { my ( $c, $uri_text ) = @_; my $uri_obj = eval { URI->new($uri_text) } || return; # ignore the url outside my $rel = $uri_obj->abs( $c->request->base ); return unless index( $rel, $c->request->base ) == 0; return unless $c->session_should_rewrite_uri_mime_type($rel); if ( my $param = $c->config->{session}{param} ) { # use param style rewriting # if the URI query string doesn't contain $param return not defined $uri_obj->query_param($param); } else { # use path style rewriting # if the URI isn't already rewritten return $uri_obj->path !~ m#/-/#; } } sub session_should_rewrite_uri_mime_type { my ( $c, $uri ) = @_; # ignore media type such as gif, pdf and etc if ( $uri->path =~ m#\.(\w+)(?:\?|$)# ) { my $mt = new MIME::Types->mimeTypeOf($1); if ( ref $mt ) { return if $mt->isBinary; } } return 1; } sub prepare_action { my $c = shift; if ( my $param = $c->config->{session}{param} ) { # use param style rewriting if ( my $sid = $c->request->param($param) ) { $c->_sessionid_from_uri($sid); $c->log->debug(qq/Found sessionid "$sid" in query parameters/) if $c->debug; } } else { # use path style rewriting if ( my ( $path, $sid ) = ( $c->request->path =~ m{^ (?: (.*) / )? -/ (.+) $}x ) ) { $c->request->path( defined($path) ? $path : "" ); $c->log->debug(qq/Found sessionid "$sid" in uri path/) if $c->debug; $c->_sessionid_from_uri($sid); } } $c->maybe::next::method(@_); } __PACKAGE__ __END__ =pod =head1 NAME Catalyst::Plugin::Session::State::URI - Saves session IDs by rewriting URIs delivered to the client, and extracting the session ID from requested URIs. =head1 SYNOPSIS use Catalyst qw/Session Session::State::URI Session::Store::Foo/; # If you want the param style rewriting, set the parameter MyApp->config->{session} = { param => 'sessionid', # or whatever you like }; =head1 DESCRIPTION In order for L to work the session ID needs to be stored on the client, and the session data needs to be stored on the server. This plugin cheats and instead of storing the session id on the client, it simply embeds the session id into every URI sent to the user. =head1 METHODS =over 4 =item session_should_rewrite This method is consulted by C. The body will be rewritten only if it returns a true value. This method will B return true unless C<< $c->config->{session}{rewrite} >> is true (the default). To globally disable rewriting simply set this parameter to false. If C<< $c->config->{session}{no_rewrite_if_cookie} >> is true (the default), L is also in use, and the user agent sent a cookie for the sesion then this method will return false. =item session_should_rewrite_body This method just calls C. =item session_should_rewrite_type Whether or not the content type of the body should be rewritten. For compatibility this method will B test the response's content type without configuration. If you want to do that you must provide a list of valid content types in C<< $c->config->{session}{rewrite_types} >>, or subclass this method. =item session_should_rewrite_redirect Whether or not to rewrite the C header of the response. If the status code is a number in the 3xx range then this returns true. =item session_should_rewrite_uri $uri_text This method is to determine whether a URI should be rewritten. It will return true for URIs under C<$c-Ereq-Ebase>, and it will also use L to filter the links which point to png, pdf and etc with the file extension. You are encouraged to override this method if it's logic doesn't suit your setup. =item session_should_rewrite_uri_mime_type $uri_obj A sub test of session_should_rewrite_uri, that checks if the file name's guessed mime type is of a kind we should rewrite URIs to. Files which are typically static (images, etc) will thus not be rewritten in order to not get 404s or pass bogus parameters to the server. If C<$uri_obj>'s path causes L to return true for the C test then then the URI will not be rewritten. =item uri_with_sessionid $uri_text, [ $sid ] By path style rewriting, it will appends C to the uri path. http://myapp/link -> http://myapp/link/-/$sessionid By param style rewriting, it will add a parameter key/value pair after the uri path. http://myapp/link -> http://myapp/link?$param=$sessionid If $sid is not provided it will default to C<< $c->sessionid >>. =item session_rewrite_if_needed Rewrite the response if necessary. =item rewrite_body_with_session_id $sid Calls either C or C depending on the content type. =item rewrite_html_with_session_id $sid Rewrites the body using L. This method of rewriting also matches relative URIs, and is thus more robust. =item rewrite_text_with_session_id $sid Rewrites the body using L. This method is used when the content does not appear to be HTML. =item rewrite_redirect_with_session_id $sid Rewrites the C header. =item uri_with_param_sessionid =item uri_with_path_sessionid =back =head1 EXTENDED METHODS =over 4 =item prepare_action Will restore the session if the request URI is formatted accordingly, and rewrite the URI to remove the additional part. =item finalize If C returns a true value, L is used to traverse the body to replace all URLs which get true returned by C so that they contain the session ID. =item delete_session_id =item get_session_id =item set_session_id =item setup_session =item uri_for =back =head1 CAVEATS =head2 Session Hijacking URI sessions are very prone to session hijacking problems. Make sure your users know not to copy and paste URIs to prevent these problems, and always provide a way to safely link to public resources. Also make sure to never link to external sites without going through a gateway page that does not have session data in it's URI, so that the external site doesn't get any session IDs in the http referrer header. Due to these issues this plugin should be used as a last resort, as L is more appropriate 99% of the time. Take a look at the IP address limiting features in L to see make some of these problems less dangerous. =head3 Goodbye page recipe To exclude some sections of your application, like a goodbye page (see L) you should make extend the C method to return true if the URI does not point to the goodbye page, extend C to not rewrite URIs that match C (so that external URIs with that in their path as a parameter to the goodbye page will not be destroyed) and finally extend C to rewrite URIs with the following logic: =over 4 =item * URIs that match C are appended with session data ( C<< $c->maybe::next::method >>). =item * External URIs (everything else) should be prepended by the goodbye page. (e.g. C). =back But note that this behavior will be problematic when you are e.g. submitting POSTs to forms on external sites. =head1 SEE ALSO L, L,L C, C. =head1 AUTHORS This module is derived from L code, and has been heavily modified since. =over 4 =item Andrew Ford =item Andy Grundman =item Christian Hansen =item Yuval Kogman, C =item Marcus Ramberg =item Sebastian Riedel =item Hu Hailin =back =head1 COPYRIGHT This program is free software, you can redistribute it and/or modify it under the same terms as Perl itself. =cut 1;