| @@ -0,0 +1,122 @@ | |||||
| #!/usr/local/bin/perl | |||||
| use strict; | |||||
| use warnings; | |||||
| use CGI qw(:cgi); | |||||
| use HTML::TreeBuilder; | |||||
| use LWP::UserAgent; | |||||
| use XML::Writer; | |||||
# The master URLs for the East Herts planning search
our $SearchURL = "http://e-services.eastherts.gov.uk/swiftlg/apas/run/WPHAPPCRITERIA";
our $InfoURL = "http://e-services.eastherts.gov.uk/swiftlg/apas/run/WPHAPPDETAIL.DisplayUrl?theApnID=";
our $CommentURL = "http://e-services.eastherts.gov.uk/swiftlg/apas/run/wphmakerep.displayURL?ApnID=";

# We're a CGI script...
my $query = CGI->new();

# Get the date to fetch - each part is read in scalar context and must
# be a plain number, otherwise the request is rejected up front rather
# than posting a malformed date to the search page
my ($day, $month, $year) = map { scalar($query->param($_)) } qw(day month year);

if (grep { !defined $_ || $_ !~ /\A\d+\z/ } $day, $month, $year)
{
    print $query->header(-status => "400 Bad Request", -type => "text/plain");
    print "The day, month and year parameters must all be numbers\n";
    exit 0;
}

my $date = $day . "/" . $month . "/" . $year;

# Construct an LWP user agent
our $UA = LWP::UserAgent->new(env_proxy => 1);

# Do the search
my $page = do_post($SearchURL,
                   {"REGFROMDATE.MAINBODY.WPACIS.1." => $date,
                    "REGTODATE.MAINBODY.WPACIS.1." => $date,
                    "SEARCHBUTTON.MAINBODY.WPACIS.1." => "Search"});

# Fetch any additional results pages before producing any output, so
# that a failed request dies cleanly instead of leaving the client with
# a truncated XML document
# NOTE(review): URI is not loaded explicitly by this script - presumably
# it is pulled in by LWP::UserAgent; confirm
my @pages = ($page);

foreach my $link ($page->look_down("_tag" => "a", "href" => qr/^WPHAPPSEARCHRES\.displayResultsURL/))
{
    push @pages, do_get(URI->new_abs($link->attr("href"), $SearchURL));
}

# Output an HTTP response header
print $query->header(-type => "text/xml");

# Create an XML output stream
my $Writer = XML::Writer->new(DATA_MODE => 1);

# Output the XML header data
$Writer->xmlDecl("UTF-8");
$Writer->startTag("planning");
$Writer->dataElement("authority_name", "East Herts Council");
$Writer->dataElement("authority_short_name", "East Herts");
$Writer->startTag("applications");

# Output the applications from each results page in turn
foreach my $results (@pages)
{
    output_applications($results);
}

# Finish off XML output
$Writer->endTag("applications");
$Writer->endTag("planning");
$Writer->end();

exit 0;
# Fetch a URL with a GET request and hand back the parsed HTML tree.
# The arguments are passed straight through to the user agent's get
# method; an unsuccessful response is fatal and reports its status line.
sub do_get
{
    my $reply = $UA->get(@_);

    $reply->is_success or die $reply->status_line;

    my $tree = HTML::TreeBuilder->new_from_content($reply->content);

    return $tree;
}
# Submit a POST request and hand back the parsed HTML tree.
# The arguments are passed straight through to the user agent's post
# method; an unsuccessful response is fatal and reports its status line.
sub do_post
{
    my $reply = $UA->post(@_);

    $reply->is_success or die $reply->status_line;

    my $tree = HTML::TreeBuilder->new_from_content($reply->content);

    return $tree;
}
# Output applications from a results page
#
# Takes the parsed HTML tree of a results page and writes one
# application element to $Writer for every row of the results table
# that has at least three cells, which are read as the reference, the
# description and the address in that order. Returns nothing.
sub output_applications
{
    my $page = shift;

    # Find the result table
    my $table = $page->look_down("_tag" => "table", "cellspacing" => "2", "cellpadding" => "2");

    # A page without a results table has nothing to output - return
    # quietly instead of dying on an undefined value part way through
    # the XML document
    return unless $table;

    # Process each row of the results
    foreach my $row ($table->look_down("_tag" => "tr"))
    {
        my @cells = $row->look_down("_tag" => "td");

        # Rows with fewer than three cells are not application rows
        next if @cells < 3;

        my $reference = $cells[0]->as_trimmed_text;
        my $description = $cells[1]->as_trimmed_text;
        my $address = $cells[2]->as_trimmed_text;

        # Pull a trailing postcode off the address, falling back to an
        # empty string so that the postcode element is still written
        # but never from an undefined value
        my $postcode = "";

        if ($address =~ /\s+([A-Z]+\d+\s+\d+[A-Z]+)$/)
        {
            $postcode = $1;
        }

        $Writer->startTag("application");
        $Writer->dataElement("council_reference", $reference);
        $Writer->dataElement("address", $address);
        $Writer->dataElement("postcode", $postcode);
        $Writer->dataElement("description", $description);
        $Writer->dataElement("info_url", $InfoURL . $reference);
        $Writer->dataElement("comment_url", $CommentURL . $reference);
        $Writer->dataElement("date_received", $date);
        $Writer->endTag("application");
    }

    return;
}
| @@ -0,0 +1,98 @@ | |||||
| #!/usr/bin/perl | |||||
| use strict; | |||||
| use warnings; | |||||
| use CGI qw(:cgi); | |||||
| use HTML::TreeBuilder; | |||||
| use LWP::UserAgent; | |||||
| use XML::Writer; | |||||
# The master URLs for the North Hertfordshire planning search
our $SearchURL = "http://www.north-herts.gov.uk/dcdataonline/Pages/acolnetcgi.gov?ACTION=UNWRAP&RIPNAME=Root.pgesearch";

# We're a CGI script...
my $query = CGI->new();

# Get the date to fetch - each part is read in scalar context and must
# be a plain number, otherwise the request is rejected up front rather
# than posting a malformed date to the search form
my ($day, $month, $year) = map { scalar($query->param($_)) } qw(day month year);

if (grep { !defined $_ || $_ !~ /\A\d+\z/ } $day, $month, $year)
{
    print $query->header(-status => "400 Bad Request", -type => "text/plain");
    print "The day, month and year parameters must all be numbers\n";
    exit 0;
}

my $date = $day . "/" . $month . "/" . $year;

# Construct an LWP user agent
our $UA = LWP::UserAgent->new(env_proxy => 1);

# Fetch the search page
my $page = do_get($SearchURL);

# Find the form submission URL, failing with a clear message if the
# search form is not where we expect it
my $form = $page->look_down("_tag" => "form", name => "frmSearch");

die "Unable to find the search form on $SearchURL\n" unless $form;

my $url = URI->new_abs($form->attr("action"), $SearchURL);

# Do the search
$page = do_post($url, {"regdate1" => $date, "regdate2" => $date});

# Output an HTTP response header
print $query->header(-type => "text/xml");

# Create an XML output stream
my $Writer = XML::Writer->new(DATA_MODE => 1);

# Output the XML header data
$Writer->xmlDecl("UTF-8");
$Writer->startTag("planning");
$Writer->dataElement("authority_name", "North Hertfordshire District Council");
$Writer->dataElement("authority_short_name", "North Hertfordshire");
$Writer->startTag("applications");

# Process each table of the results - every table describes a single
# application, with its cells flattened into one list in row order
foreach my $table ($page->look_down("_tag" => "table", "class" => "results-table"))
{
    my @cells = map { $_->look_down("_tag" => "td") } $table->look_down("_tag" => "tr");
    my $link = @cells ? $cells[0]->look_down("_tag" => "a") : undef;

    # Skip any table that is not laid out as expected instead of dying
    # on an undefined value part way through the XML document
    if (@cells < 5 || !$link || !defined $link->attr("href"))
    {
        warn "Skipping a results table that is not in the expected layout\n";
        next;
    }

    my $reference = $cells[0]->as_trimmed_text;
    my $received = $cells[1]->as_trimmed_text;
    my $address = $cells[3]->as_trimmed_text;
    my $description = $cells[4]->as_trimmed_text;

    # Resolve the details link against the URL the search was posted to
    # so that a relative link still produces a usable absolute URL
    my $infourl = URI->new_abs($link->attr("href"), $url)->as_string;

    # Pull a trailing postcode off the address, falling back to an
    # empty string so that the postcode element is still written but
    # never from an undefined value
    my $postcode = "";

    if ($address =~ /\s+([A-Z]+\d+\s+\d+[A-Z]+)$/)
    {
        $postcode = $1;
    }

    $Writer->startTag("application");
    $Writer->dataElement("council_reference", $reference);
    $Writer->dataElement("address", $address);
    $Writer->dataElement("postcode", $postcode);
    $Writer->dataElement("description", $description);
    $Writer->dataElement("info_url", $infourl);
    $Writer->dataElement("comment_url", "mailto:service\@north-herts.gov.uk?subject=Comment on Planning Application");
    $Writer->dataElement("date_received", $received);
    $Writer->endTag("application");
}

# Finish off XML output
$Writer->endTag("applications");
$Writer->endTag("planning");
$Writer->end();

exit 0;
# Fetch a URL with a GET request and hand back the parsed HTML tree.
# The arguments are passed straight through to the user agent's get
# method; an unsuccessful response is fatal and reports its status line.
sub do_get
{
    my $reply = $UA->get(@_);

    $reply->is_success or die $reply->status_line;

    my $tree = HTML::TreeBuilder->new_from_content($reply->content);

    return $tree;
}
# Submit a POST request and hand back the parsed HTML tree.
# The caller's arguments are passed through to the user agent's post
# method followed by a Content_Type of "form-data"; an unsuccessful
# response is fatal and reports its status line.
sub do_post
{
    my @request = (@_, Content_Type => "form-data");
    my $reply = $UA->post(@request);

    $reply->is_success or die $reply->status_line;

    my $tree = HTML::TreeBuilder->new_from_content($reply->content);

    return $tree;
}
| @@ -7,3 +7,6 @@ | |||||
| "AcolnetParser.py", "420" | "AcolnetParser.py", "420" | ||||
| "MultipartPostHandler.py", "420" | "MultipartPostHandler.py", "420" | ||||
| "FastWeb.py", "420" | "FastWeb.py", "420" | ||||
| "broxbourne.cgi", "493" | |||||
| "EastHerts.cgi", "493" | |||||
| "NorthHerts.cgi", "493" | |||||
| @@ -0,0 +1,162 @@ | |||||
| #!/usr/bin/perl | |||||
| use strict; | |||||
| use warnings; | |||||
| use CGI qw(:cgi); | |||||
| use DateTime; | |||||
| use HTML::TreeBuilder; | |||||
| use LWP::UserAgent; | |||||
| use XML::Writer; | |||||
# The master URL for the Broxbourne planning search
our $SearchURL = "http://www2.broxbourne.gov.uk/planningsearch/webform1.aspx";

# We're a CGI script...
my $query = CGI->new();

# Read each date parameter in scalar context - calling param directly
# inside the DateTime argument list would put it in list context, where
# a missing or repeated parameter shifts the named arguments around
my ($day, $month, $year) = map { scalar($query->param($_)) } qw(day month year);

# Build the query date, rejecting anything that is not a real date
my $querydate;

unless (grep { !defined $_ || $_ !~ /\A\d+\z/ } $day, $month, $year)
{
    $querydate = eval { DateTime->new(year => $year, month => $month, day => $day) };
}

unless ($querydate)
{
    print $query->header(-status => "400 Bad Request", -type => "text/plain");
    print "The day, month and year parameters must form a valid date\n";
    exit 0;
}

# Get the date as an offset in days from 2000-01-01
my $epoch = DateTime->new(year => 2000, month => 1, day => 1);
my $dayoffset = $querydate->delta_days($epoch)->delta_days;

# Construct an LWP user agent
our $UA = LWP::UserAgent->new(env_proxy => 1);

# Post the URL to get an initial blank form
my $state = get_state(do_post());

# Post each date in turn to build up the state - you can thank
# Microsoft and ASP.NET for the horrible way we have to do this
# by posting each argument in turn to build up the state
$state = get_state(do_post_back($state, 'DateSelector1$Calendar1', $dayoffset));
$state = get_state(do_post_back($state, 'DateSelector2$Calendar1', $dayoffset));

# Output an HTTP response header
print $query->header(-type => "text/xml");

# Create an XML output stream
my $Writer = XML::Writer->new(DATA_MODE => 1);

# Output the XML header data
$Writer->xmlDecl("UTF-8");
$Writer->startTag("planning");
$Writer->dataElement("authority_name", "Borough of Broxbourne");
$Writer->dataElement("authority_short_name", "Broxbourne");
$Writer->startTag("applications");

# Get the arguments for the search...
my $args = {
    "Srch" => "rb1",
    "__VIEWSTATE" => $state,
    "btnSearch" => "Search",
    "tbReference" => "",
    "tbRef2" => ""
};

# ...and then (at last) we can do the search!
my $page = do_post($args);

# Loop processing pages of results
while ($page)
{
    my $table = $page->look_down("_tag" => "table", "id" => "DataGrid1");

    # Remember the state
    $state = get_state($page);

    # Clear the page for now - this will be reinitialised if we
    # find another page of results to make us go round the loop
    # all over again
    undef $page;

    # Check that we found a table - searches that find no results
    # produce a page with no table in it
    if ($table)
    {
        # Process each row of the results
        foreach my $row ($table->look_down("_tag" => "tr"))
        {
            my @cells = $row->look_down("_tag" => "td");

            # A row with no cells at all has nothing for us to look at
            next unless @cells;

            if (@cells >= 5 && $cells[0]->look_down("_tag" => "input"))
            {
                my $reference = $cells[1]->as_trimmed_text;
                my $date = $cells[2]->as_trimmed_text;
                my $address = $cells[3]->as_trimmed_text;
                my $description = $cells[4]->as_trimmed_text;

                # Pull a trailing postcode off the address, falling
                # back to an empty string so that the postcode element
                # is still written but never from an undefined value
                my $postcode = "";

                if ($address =~ /\s+([A-Z]+\d+\s+\d+[A-Z]+)$/)
                {
                    $postcode = $1;
                }

                # NOTE(review): no info_url or comment_url element is
                # written for these applications - confirm that whatever
                # consumes this XML copes without them
                $Writer->startTag("application");
                $Writer->dataElement("council_reference", $reference);
                $Writer->dataElement("address", $address);
                $Writer->dataElement("postcode", $postcode);
                $Writer->dataElement("description", $description);
                $Writer->dataElement("date_received", $date);
                $Writer->endTag("application");
            }
            elsif ($cells[0]->attr("colspan") && $cells[0]->attr("colspan") eq "5")
            {
                foreach my $link ($cells[0]->look_down("_tag" => "a"))
                {
                    my $href = $link->attr("href");

                    # Follow the first "next page" link only - once the
                    # next page has been fetched any further matching
                    # link would just request it all over again
                    if (!$page &&
                        defined $href &&
                        $link->as_trimmed_text eq ">" &&
                        $href =~ /^javascript:__doPostBack\('([^\']*)','([^\']*)'\)$/)
                    {
                        $page = do_post_back($state, $1, $2);
                    }
                }
            }
        }
    }
}

# Finish off XML output
$Writer->endTag("applications");
$Writer->endTag("planning");
$Writer->end();

exit 0;
# Extract the state from a page so we can repost it
#
# Takes a parsed HTML tree and returns the value attribute of its input
# element named __VIEWSTATE. Dies with an explicit message if the page
# has no such element, as there is then no state to carry forward.
sub get_state
{
    my $page = shift;
    my $viewstate = $page->look_down("_tag" => "input", "name" => "__VIEWSTATE");

    die "Unable to find the __VIEWSTATE field in the page\n" unless $viewstate;

    return $viewstate->attr("value");
}
# Stand in for the page's doPostBack javascript function: post the
# given event target and argument back to the search page along with
# the saved view state, and return whatever do_post returns.
sub do_post_back
{
    my ($state, $target, $argument) = @_;

    # Every dollar sign in the target name is posted as a colon
    $target =~ tr/$/:/;

    my %fields = (
        "__EVENTTARGET" => $target,
        "__EVENTARGUMENT" => $argument,
        "__VIEWSTATE" => $state
    );

    return do_post(\%fields);
}
# Post to the planning search page and hand back the parsed HTML tree.
# Any arguments are passed to the user agent's post method after the
# search URL; an unsuccessful response is fatal and reports its status
# line.
sub do_post
{
    my $reply = $UA->post($SearchURL, @_);

    $reply->is_success or die $reply->status_line;

    my $tree = HTML::TreeBuilder->new_from_content($reply->content);

    return $tree;
}