|
@@ -0,0 +1,98 @@ |
|
|
|
|
|
#!/usr/bin/perl |
|
|
|
|
|
|
|
|
|
|
|
use strict; |
|
|
|
|
|
use warnings; |
|
|
|
|
|
|
|
|
|
|
|
use CGI qw(:cgi); |
|
|
|
|
|
use HTML::TreeBuilder; |
|
|
|
|
|
use LWP::UserAgent; |
|
|
|
|
|
use XML::Writer; |
|
|
|
|
|
|
|
|
|
|
|
# The master URLs for the North Hertfordshire planning search |
|
|
|
|
|
our $SearchURL = "http://www.north-herts.gov.uk/dcdataonline/Pages/acolnetcgi.gov?ACTION=UNWRAP&RIPNAME=Root.pgesearch"; |
|
|
|
|
|
|
|
|
|
|
|
# We're a CGI script... |
|
|
|
|
|
my $query = CGI->new(); |
|
|
|
|
|
|
|
|
|
|
|
# Get the date to fetch |
|
|
|
|
|
my $date = $query->param("day") . "/" . $query->param("month") . "/" . $query->param("year"); |
|
|
|
|
|
|
|
|
|
|
|
# Construct an LWP user agent |
|
|
|
|
|
our $UA = LWP::UserAgent->new(env_proxy => 1); |
|
|
|
|
|
|
|
|
|
|
|
# Fetch the search page |
|
|
|
|
|
my $page = do_get($SearchURL); |
|
|
|
|
|
|
|
|
|
|
|
# Find the form submission URL |
|
|
|
|
|
my $form = $page->look_down("_tag" => "form", name => "frmSearch"); |
|
|
|
|
|
my $url = URI->new_abs($form->attr("action"), $SearchURL); |
|
|
|
|
|
|
|
|
|
|
|
# Do the search |
|
|
|
|
|
$page = do_post($url, {"regdate1" => $date, "regdate2" => $date}); |
|
|
|
|
|
|
|
|
|
|
|
# Output an HTTP response header |
|
|
|
|
|
print $query->header(-type => "text/xml"); |
|
|
|
|
|
|
|
|
|
|
|
# Create an XML output stream |
|
|
|
|
|
my $Writer = XML::Writer->new(DATA_MODE => 1); |
|
|
|
|
|
|
|
|
|
|
|
# Output the XML header data |
|
|
|
|
|
$Writer->xmlDecl("UTF-8"); |
|
|
|
|
|
$Writer->startTag("planning"); |
|
|
|
|
|
$Writer->dataElement("authority_name", "North Hertfordshire District Council"); |
|
|
|
|
|
$Writer->dataElement("authority_short_name", "North Hertfordshire"); |
|
|
|
|
|
$Writer->startTag("applications"); |
|
|
|
|
|
|
|
|
|
|
|
# Process each table of the results |
|
|
|
|
|
foreach my $table ($page->look_down("_tag" => "table", "class" => "results-table")) |
|
|
|
|
|
{ |
|
|
|
|
|
my @rows = map { $_->look_down("_tag" => "td") } $table->look_down("_tag" => "tr"); |
|
|
|
|
|
my $reference = $rows[0]->as_trimmed_text; |
|
|
|
|
|
my $infourl = $rows[0]->look_down("_tag" => "a")->attr("href"); |
|
|
|
|
|
my $date = $rows[1]->as_trimmed_text; |
|
|
|
|
|
my $address = $rows[3]->as_trimmed_text; |
|
|
|
|
|
my $description = $rows[4]->as_trimmed_text; |
|
|
|
|
|
my $postcode; |
|
|
|
|
|
|
|
|
|
|
|
if ($address =~ /\s+([A-Z]+\d+\s+\d+[A-Z]+)$/) |
|
|
|
|
|
{ |
|
|
|
|
|
$postcode = $1; |
|
|
|
|
|
} |
|
|
|
|
|
|
|
|
|
|
|
$Writer->startTag("application"); |
|
|
|
|
|
$Writer->dataElement("council_reference", $reference); |
|
|
|
|
|
$Writer->dataElement("address", $address); |
|
|
|
|
|
$Writer->dataElement("postcode", $postcode); |
|
|
|
|
|
$Writer->dataElement("description", $description); |
|
|
|
|
|
$Writer->dataElement("info_url", $infourl); |
|
|
|
|
|
$Writer->dataElement("comment_url", "mailto:service\@north-herts.gov.uk?subject=Comment on Planning Application"); |
|
|
|
|
|
$Writer->dataElement("date_received", $date); |
|
|
|
|
|
$Writer->endTag("application"); |
|
|
|
|
|
} |
|
|
|
|
|
|
|
|
|
|
|
# Finish off XML output |
|
|
|
|
|
$Writer->endTag("applications"); |
|
|
|
|
|
$Writer->endTag("planning"); |
|
|
|
|
|
$Writer->end(); |
|
|
|
|
|
|
|
|
|
|
|
exit 0; |
|
|
|
|
|
|
|
|
|
|
|
# Make a GET request |
|
|
|
|
|
sub do_get |
|
|
|
|
|
{ |
|
|
|
|
|
my $response = $UA->get(@_); |
|
|
|
|
|
|
|
|
|
|
|
die $response->status_line unless $response->is_success; |
|
|
|
|
|
|
|
|
|
|
|
return HTML::TreeBuilder->new_from_content($response->content); |
|
|
|
|
|
} |
|
|
|
|
|
|
|
|
|
|
|
# Make a POST request |
|
|
|
|
|
sub do_post |
|
|
|
|
|
{ |
|
|
|
|
|
my $response = $UA->post(@_, Content_Type => "form-data"); |
|
|
|
|
|
|
|
|
|
|
|
die $response->status_line unless $response->is_success; |
|
|
|
|
|
|
|
|
|
|
|
return HTML::TreeBuilder->new_from_content($response->content); |
|
|
|
|
|
} |