# $Id: /mirror/gungho/lib/Gungho/Component/Throttle/Domain.pm 8775 2007-11-08T09:53:44.496906Z lestrrat $ # # Copyright (c) 2007 Daisuke Maki # All rights reserved. package Gungho::Component::Throttle::Domain; use strict; use warnings; use base qw(Gungho::Component::Throttle::Throttler); __PACKAGE__->mk_classdata($_) for qw(matcher); sub setup { my $self = shift; my $config = $self->config->{throttle}{domain}; $self->prepare_throttler( map { ($_ => $config->{$_}) } qw(max_items interval db_file throttler cache) ); my $domains = $config->{domains} || []; my $matcher; if (@$domains) { my $sub = <url; my \$host = \$url->host; EOSUB foreach my $d (@$domains) { if (my $re = $d->{match}) { # protect ourselves from "/" $re =~ s/\//\\\//g; $sub .= " (\$host =~ /$re/) and return 1;\n"; } } $sub .= "\nreturn 0;\n}"; $matcher = eval $sub or die; } $self->matcher($matcher); $self->next::method(@_); } sub throttle { my $c = shift; my $request = shift; my $do_throttle = 1; my $code = $c->matcher; if ($code) { $do_throttle = $code->($request); } if ($do_throttle) { my $t = $c->throttler; if (! $t->try_push(key => $request->notes('original_host') || $request->url->host)) { $c->log->debug( $request->url . " throttled by Throttle::Domain" ); return (); } } return $c->next::method($request); } 1; __END__ =head1 NAME Gungho::Component::Throttle::Domain - Throttle By Domain =head1 SYNOPSIS --- throttle: domain: max_items 1000 interval: 3600 domains: - match: 'A [Regular]+ Exp?ression' - match: \.cpan\.org$ components: - Throttle::Domain =head1 DESCRIPITION This component allows you to throttle requests by domain names. You can specify a regular expression, in which case only the domains that match the particular regular expression will be throttled. Otherwise, the hostname from each request will be used as the key to throttle. =head1 CONFIGURATION All configuration parameters are specified in throttle.domain hash: throttle: doamin: key1: value =head2 max_items Specifies the max number of items that can be fetched within the time specified in "interval" =head2 interval Specifies the interval to which to apply the max_items configuration. =head2 domains Specifies the domain to apply the throttling. If unspecified, the same throttling configuration will be applied to all domains =head1 METHODS =head2 setup =head2 throttle($request) Checks if a request can be executed succesfully. Returns 1 if it's ok to execute the request. =cut