Use the postcode from the address when no postcode is available in the PublicAccess parser.

Add the currently failing Surrey Heath parser.
17 years ago · cef4ccbcf6
--- a/cgi-bin/AcolnetParser.py
+++ b/cgi-bin/AcolnetParser.py
@@ -159,8 +159,8 @@ class AcolnetParser(HTMLParser.HTMLParser):
        search_form_response = urllib2.urlopen(self.base_url)
        search_form_contents = search_form_response.read()

        #outfile = open("tmpfile", "w")
        #outfile.write(search_form_contents)
        outfile = open("tmpfile", "w")
        outfile.write(search_form_contents)

        # This sometimes causes a problem in HTMLParser, so let's just get the link
        # out with a regex...
@@ -410,6 +410,14 @@ class SuffolkCoastalParser(AcolnetParser):
    proposal_tr = 5

    comments_email_address = "d.c.admin@suffolkcoastal.gov.uk"

 class SurreyHeathParser(AcolnetParser):
    # Per-authority settings for the Surrey Heath Acolnet site; this class
    # only overrides class attributes and adds no behaviour of its own.
    # NOTE(review): the *_tr values look like the positions of the rows
    # holding each field in the results table -- confirm against
    # AcolnetParser, which is not visible in this hunk.
    case_number_tr = 1 # this one can be got by the td class attribute
    reg_date_tr = 2
    location_tr = 4
    proposal_tr = 5

    # Presumably the address that comments on applications are sent to;
    # verify against how the base class uses this attribute.
    comments_email_address = "development-control@surreyheath.gov.uk"
    
 if __name__ == '__main__':
    day = 15
@@ -425,7 +433,7 @@ if __name__ == '__main__':
    # canterbury
    # results as columns of one table

    parser = OldhamParser("Oldham", "Oldham", "http://planning.oldham.gov.uk/planning//acolnetcgi.gov?ACTION=UNWRAP&RIPNAME=Root.pgesearch")
    parser = SurreyHeathParser("Surrey Heath", "Surrey Heath", "https://www.public.surreyheath-online.gov.uk/whalecom60b1ef305f59f921/whalecom0/Scripts/PlanningPagesOnline/acolnetcgi.gov?ACTION=UNWRAP&RIPNAME=Root.pgesearch")
    
    print parser.getResults(day, month, year)
    
--- a/cgi-bin/Allerdale.cgi
+++ b/cgi-bin/Allerdale.cgi
--- a/cgi-bin/Alnwick.cgi
+++ b/cgi-bin/Alnwick.cgi
--- a/cgi-bin/Angus.cgi
+++ b/cgi-bin/Angus.cgi
--- a/cgi-bin/Aylesbury
+++ b/cgi-bin/Aylesbury
--- a/cgi-bin/Babergh.cgi
+++ b/cgi-bin/Babergh.cgi
--- a/cgi-bin/Barrow.cgi
+++ b/cgi-bin/Barrow.cgi
--- a/cgi-bin/Basildon.cgi
+++ b/cgi-bin/Basildon.cgi
--- a/cgi-bin/Basingstoke
+++ b/cgi-bin/Basingstoke
--- a/cgi-bin/Bassetlaw.cgi
+++ b/cgi-bin/Bassetlaw.cgi
--- a/cgi-bin/Bath.cgi
+++ b/cgi-bin/Bath.cgi
--- a/cgi-bin/Bexley.cgi
+++ b/cgi-bin/Bexley.cgi
--- a/cgi-bin/Blaby.cgi
+++ b/cgi-bin/Blaby.cgi
--- a/cgi-bin/Bolsover.cgi
+++ b/cgi-bin/Bolsover.cgi
--- a/cgi-bin/Bridgnorth.cgi
+++ b/cgi-bin/Bridgnorth.cgi
--- a/cgi-bin/Bristol.cgi
+++ b/cgi-bin/Bristol.cgi
--- a/cgi-bin/Buckinghamshire.cgi
+++ b/cgi-bin/Buckinghamshire.cgi
--- a/cgi-bin/Bury.cgi
+++ b/cgi-bin/Bury.cgi
--- a/cgi-bin/Carlisle.cgi
+++ b/cgi-bin/Carlisle.cgi
--- a/cgi-bin/Chelmsford.cgi
+++ b/cgi-bin/Chelmsford.cgi
--- a/cgi-bin/Cherwell.cgi
+++ b/cgi-bin/Cherwell.cgi
--- a/cgi-bin/Chorley.cgi
+++ b/cgi-bin/Chorley.cgi
--- a/cgi-bin/City
+++ b/cgi-bin/City
--- a/cgi-bin/Cornwall.cgi
+++ b/cgi-bin/Cornwall.cgi
--- a/cgi-bin/Coventry.cgi
+++ b/cgi-bin/Coventry.cgi
--- a/cgi-bin/Croydon.cgi
+++ b/cgi-bin/Croydon.cgi
--- a/cgi-bin/Denbighshire.cgi
+++ b/cgi-bin/Denbighshire.cgi
--- a/cgi-bin/Derby.cgi
+++ b/cgi-bin/Derby.cgi
--- a/cgi-bin/Doncaster.cgi
+++ b/cgi-bin/Doncaster.cgi
--- a/cgi-bin/Dundee.cgi
+++ b/cgi-bin/Dundee.cgi
--- a/cgi-bin/Durham.cgi
+++ b/cgi-bin/Durham.cgi
--- a/cgi-bin/Ealing.cgi
+++ b/cgi-bin/Ealing.cgi
--- a/cgi-bin/Easington.cgi
+++ b/cgi-bin/Easington.cgi
--- a/cgi-bin/East
+++ b/cgi-bin/East
--- a/cgi-bin/East
+++ b/cgi-bin/East
--- a/cgi-bin/East
+++ b/cgi-bin/East
--- a/cgi-bin/Edinburgh.cgi
+++ b/cgi-bin/Edinburgh.cgi
--- a/cgi-bin/Epsom
+++ b/cgi-bin/Epsom
--- a/cgi-bin/Fenland.cgi
+++ b/cgi-bin/Fenland.cgi
--- a/cgi-bin/Fylde.cgi
+++ b/cgi-bin/Fylde.cgi
--- a/cgi-bin/Gateshead.cgi
+++ b/cgi-bin/Gateshead.cgi
--- a/cgi-bin/Gedling.cgi
+++ b/cgi-bin/Gedling.cgi
--- a/cgi-bin/Gloucestershire.cgi
+++ b/cgi-bin/Gloucestershire.cgi
--- a/cgi-bin/Gravesham.cgi
+++ b/cgi-bin/Gravesham.cgi
--- a/cgi-bin/Hammersmith
+++ b/cgi-bin/Hammersmith
--- a/cgi-bin/Haringey.cgi
+++ b/cgi-bin/Haringey.cgi
--- a/cgi-bin/Harlow.cgi
+++ b/cgi-bin/Harlow.cgi
--- a/cgi-bin/Harrogate.cgi
+++ b/cgi-bin/Harrogate.cgi
--- a/cgi-bin/Hart.cgi
+++ b/cgi-bin/Hart.cgi
--- a/cgi-bin/Hartlepool.cgi
+++ b/cgi-bin/Hartlepool.cgi
--- a/cgi-bin/Hertsmere.cgi
+++ b/cgi-bin/Hertsmere.cgi
--- a/cgi-bin/High
+++ b/cgi-bin/High
--- a/cgi-bin/Huntingdonshire.cgi
+++ b/cgi-bin/Huntingdonshire.cgi
--- a/cgi-bin/Kerrier.cgi
+++ b/cgi-bin/Kerrier.cgi
--- a/cgi-bin/Knowsley.cgi
+++ b/cgi-bin/Knowsley.cgi
--- a/cgi-bin/Lancaster.cgi
+++ b/cgi-bin/Lancaster.cgi
--- a/cgi-bin/Lewisham.cgi
+++ b/cgi-bin/Lewisham.cgi
--- a/cgi-bin/Luton.cgi
+++ b/cgi-bin/Luton.cgi
--- a/cgi-bin/Malvern
+++ b/cgi-bin/Malvern
--- a/cgi-bin/Manchester.cgi
+++ b/cgi-bin/Manchester.cgi
--- a/cgi-bin/Mid
+++ b/cgi-bin/Mid
--- a/cgi-bin/Milton
+++ b/cgi-bin/Milton
--- a/Leicestershire.cgi
+++ b/Leicestershire.cgi
--- a/cgi-bin/New
+++ b/cgi-bin/New
--- a/cgi-bin/Newcastle-under-Lyme.cgi
+++ b/cgi-bin/Newcastle-under-Lyme.cgi
--- a/cgi-bin/Newcastle.cgi
+++ b/cgi-bin/Newcastle.cgi
--- a/cgi-bin/Newham.cgi
+++ b/cgi-bin/Newham.cgi
--- a/Hertfordshire.cgi
+++ b/Hertfordshire.cgi
--- a/cgi-bin/North
+++ b/cgi-bin/North
--- a/Warwickshire.cgi
+++ b/Warwickshire.cgi
--- a/Wiltshire.cgi
+++ b/Wiltshire.cgi
--- a/cgi-bin/Northumberland.cgi
+++ b/cgi-bin/Northumberland.cgi
--- a/cgi-bin/Oadby
+++ b/cgi-bin/Oadby
--- a/cgi-bin/Oldham.cgi
+++ b/cgi-bin/Oldham.cgi
--- a/cgi-bin/Oswestry.cgi
+++ b/cgi-bin/Oswestry.cgi
--- a/cgi-bin/Peterborough.cgi
+++ b/cgi-bin/Peterborough.cgi
--- a/cgi-bin/Portsmouth.cgi
+++ b/cgi-bin/Portsmouth.cgi
--- a/cgi-bin/PublicAccess.py
+++ b/cgi-bin/PublicAccess.py
@@ -10,7 +10,7 @@ import cookielib
 cookie_jar = cookielib.CookieJar()


 from PlanningUtils import fixNewlines, PlanningAuthorityResults, PlanningApplication
 from PlanningUtils import fixNewlines, getPostcodeFromText, PlanningAuthorityResults, PlanningApplication


 search_form_url_end = "DcApplication/application_searchform.aspx"
@@ -167,6 +167,9 @@ class PublicAccessParser(HTMLParser.HTMLParser):
                # one found on the property page
                if property_file_parser.postcode is not None:
                    self._current_application.postcode = property_file_parser.postcode
                else:
                    # If there is no postcode in here, then we'll have to make do with regexing one out of the address.
                    self._current_application.postcode = getPostcodeFromText(self._current_application.address)

                # There is no need for us to look at any more attributes.
 		break
--- a/cgi-bin/Redditch.cgi
+++ b/cgi-bin/Redditch.cgi
--- a/cgi-bin/Renfrewshire.cgi
+++ b/cgi-bin/Renfrewshire.cgi
--- a/cgi-bin/Rushmoor.cgi
+++ b/cgi-bin/Rushmoor.cgi
--- a/cgi-bin/Scarborough.cgi
+++ b/cgi-bin/Scarborough.cgi
--- a/cgi-bin/Selby.cgi
+++ b/cgi-bin/Selby.cgi
--- a/cgi-bin/Sevenoaks.cgi
+++ b/cgi-bin/Sevenoaks.cgi
--- a/Bedfordshire.cgi
+++ b/Bedfordshire.cgi
--- a/cgi-bin/South
+++ b/cgi-bin/South
--- a/cgi-bin/South
+++ b/cgi-bin/South
--- a/Staffordshire.cgi
+++ b/Staffordshire.cgi
--- a/cgi-bin/SouthOxfordshire.cgi
+++ b/cgi-bin/SouthOxfordshire.cgi
--- a/cgi-bin/Southampton.cgi
+++ b/cgi-bin/Southampton.cgi
--- a/cgi-bin/Spelthorne.cgi
+++ b/cgi-bin/Spelthorne.cgi
--- a/Helens.cgi
+++ b/Helens.cgi
--- a/cgi-bin/Stevenage.cgi
+++ b/cgi-bin/Stevenage.cgi
--- a/cgi-bin/Stirling.cgi
+++ b/cgi-bin/Stirling.cgi
--- a/cgi-bin/Stockton-On-Tees.cgi
+++ b/cgi-bin/Stockton-On-Tees.cgi
--- a/cgi-bin/Stratford.cgi
+++ b/cgi-bin/Stratford.cgi
--- a/cgi-bin/Suffolk
+++ b/cgi-bin/Suffolk
--- a/cgi-bin/Sunderland.cgi
+++ b/cgi-bin/Sunderland.cgi
--- a/cgi-bin/Surrey
+++ b/cgi-bin/Surrey
@@ -0,0 +1,29 @@
 #!/usr/local/bin/python

 # This is the CGI entry point for the Surrey Heath Borough Council parser.
 # It is generated from the file CGITemplate.
 #
 # It reads 'day', 'month' and 'year' from the request, asks
 # AcolnetParser.SurreyHeathParser for the results for that date, and
 # writes them back to the client as XML.

 import cgi
 import cgitb
 # Traceback handling is currently switched off. Uncomment the next line to
 # have cgitb log tracebacks under /tmp instead of displaying them.
 #cgitb.enable(display=0, logdir="/tmp")


 # Request parameters are passed to the parser exactly as received; nothing
 # here validates them or converts them to integers.
 form = cgi.FieldStorage()
 day = form.getfirst('day')
 month = form.getfirst('month')
 year = form.getfirst('year')


 # Authority-specific values handed to the parser constructor.
 authority_name = "Surrey Heath Borough Council"
 authority_short_name = "Surrey Heath"
 base_url = "https://www.public.surreyheath-online.gov.uk/whalecom60b1ef305f59f921/whalecom0/Scripts/PlanningPagesOnline/acolnetcgi.gov?ACTION=UNWRAP&RIPNAME=Root.pgesearch"

 # Project-local module that provides the SurreyHeathParser class.
 import AcolnetParser

 parser = AcolnetParser.SurreyHeathParser(authority_name, authority_short_name, base_url)

 # NOTE(review): getResults is assumed to return the XML document as a
 # string, since its result is printed directly below -- confirm in
 # AcolnetParser.
 xml = parser.getResults(day, month, year)

 # CGI response: header line, then a blank line to end the headers, then
 # the body.
 print "Content-Type: text/xml"     # XML is following
 print
 print xml                          # print the xml
--- a/cgi-bin/Teignbridge.cgi
+++ b/cgi-bin/Teignbridge.cgi