Explorar el Código

Set up planet scraper. This gets us 5 new councils (though one, Tewkesbury, has no postcodes)

import/raw
duncan.parkes hace 16 años
padre
commit
9018285d28
Se han modificado 3 ficheros con 15 adiciones y 2 borrados
  1. +1
    -0
      trunk/python_scrapers/OtherFilesToCopy.csv
  2. +8
    -1
      trunk/python_scrapers/Planet.py
  3. +6
    -1
      trunk/python_scrapers/SitesToGenerate.csv

+ 1
- 0
trunk/python_scrapers/OtherFilesToCopy.csv Ver fichero

@@ -19,3 +19,4 @@
"WestDorset.cgi", "493"
"Christchurch.cgi", "493"
"WAM.py", "420"
"Planet.py", "420"

+ 8
- 1
trunk/python_scrapers/Planet.py Ver fichero

@@ -147,9 +147,16 @@ class PlanetParser:


if __name__ == '__main__':
# parser = PlanetParser("Worcester City Council", "Worcester", "http://www.worcester.gov.uk:8080/planet/ispforms.asp?serviceKey=SysDoc-PlanetApplicationEnquiry", debug=True)
# parser = PlanetParser("Elmbridge Borough Council", "Elmbridge", "http://www2.elmbridge.gov.uk/Planet/ispforms.asp?serviceKey=SysDoc-PlanetApplicationEnquiry")
# parser = PlanetParser("North Lincolnshire Council", "North Lincolnshire", "http://www.planning.northlincs.gov.uk/planet/ispforms.asp?ServiceKey=SysDoc-PlanetApplicationEnquiry")
# parser = PlanetParser("Ryedale District Council", "Ryedale", "http://www.ryedale.gov.uk/ispforms.asp?serviceKey=SysDoc-PlanetApplicationEnquiry")
parser = PlanetParser("Tewkesbury Borough Council", "Tewkesbury", "http://planning.tewkesbury.gov.uk/Planet/ispforms.asp?serviceKey=07WCC04163103430")
print parser.getResults(21,5,2008)
# parser = PlanetParser("Worcester City Council", "Worcester", "http://www.worcester.gov.uk:8080/planet/ispforms.asp?serviceKey=SysDoc-PlanetApplicationEnquiry", debug=True)

# TODO

# 1) Pagination
# 2) Work OK with no results.

# 3) Use OSGB for Tewkesbury?

+ 6
- 1
trunk/python_scrapers/SitesToGenerate.csv Ver fichero

@@ -201,4 +201,9 @@
"Rother District Council", "Rother", "http://www.planning.rother.gov.uk/WAM/pas/searchApplications.do", "WAM", "WAMParser"
"South Gloucestershire Council", "South Gloucestershire", "http://planning.southglos.gov.uk/WAM/pas/WeeklyApplications.do", "WAM", "BraintreeParser"
"London Borough of Tower Hamlets", "Tower Hamlets", "http://194.201.98.213/WAM/weeklyApplications.do", "WAM", "BraintreeParser"
"Sheffield City Council", "Sheffield", "http://planning.sheffield.gov.uk/publicaccess/tdc/", "PublicAccess", "PublicAccessParser"
"Sheffield City Council", "Sheffield", "http://planning.sheffield.gov.uk/publicaccess/tdc/", "PublicAccess", "PublicAccessParser"
"Elmbridge Borough Council", "Elmbridge", "http://www2.elmbridge.gov.uk/Planet/ispforms.asp?serviceKey=SysDoc-PlanetApplicationEnquiry", "Planet", "PlanetParser"
"North Lincolnshire Council", "North Lincolnshire", "http://www.planning.northlincs.gov.uk/planet/ispforms.asp?serviceKey=SysDoc-PlanetApplicationEnquiry", "Planet", "PlanetParser"
"Ryedale District Council", "Ryedale", "http://www.ryedale.gov.uk/ispforms.asp?serviceKey=SysDoc-PlanetApplicationEnquiry", "Planet", "PlanetParser"
"Tewkesbury Borough Council", "Tewkesbury", "http://planning.tewkesbury.gov.uk/Planet/ispforms.asp?serviceKey=07WCC04163103430", "Planet", "PlanetParser"
"Worcester City Council", "Worcester", "http://www.worcester.gov.uk:8080/planet/ispforms.asp?serviceKey=SysDoc-PlanetApplicationEnquiry", "Planet", "PlanetParser"

Cargando…
Cancelar
Guardar