#!/usr/bin/perl -sw

# parallel_wget [-np] [-n=XX] http://www.forbrug.dk/mad/

$parent= not $np;
$parallel_processes = $n || 10;
$url= shift;

if($url =~ /^[a-z0-9]+\.[a-z0-9.]+/i) {
    # www.forbrug.dk/mad/ -> http://www.forbrug.dk/mad/ -> 
    $url = "http://".$url;
}
debug("url: $url\n");

if($parent) {
    # http://www.forbrug.dk/mad/ -> http://www.forbrug.dk/
    $base = $url;
    $base =~ s{([a-z]+://[^/]+).*}{$1/}i;
} else {
    $base = $url;
}
debug("base: $base\n");

$accepted_url = $base;
debug("accepted_url: $accepted_url\n");
$accepted_url =~ s/(\W)/\\$1/g;
$accepted_url = "^".$accepted_url;
debug("accepted_url: $accepted_url\n");

open(CONF,">parallel_wget.log") || die;
print CONF '$accepted_url = ',$accepted_url,"\n";
print CONF '$unaccepted_url = \?',"\n";
print CONF "\n$url\n";
close CONF;

@do_it=("wget_worker.pl",$parallel_processes,"parallel_wget.log");
debug("@do_it\n");
system(@do_it);

sub debug {
    $debug and print STDERR @_;
}

$debug=$n=$np=1; # ignore perl -w
