Explorar el Código

Some Documents tabs don't have the number in them

tags/v0.4.5
Adrian Short hace 6 años
padre
commit
f70d4f2598
Se ha modificado 1 fichero con 15 adiciones y 7 borrados
  1. +15
    -7
      lib/uk_planning_scraper.rb

+ 15
- 7
lib/uk_planning_scraper.rb Ver fichero

@@ -103,14 +103,22 @@ module UKPlanningScraper
app[:scraped_at] = Time.now

# The Documents tab doesn't show if there are no documents (we get li.nodocuments instead)
if documents_link = res.at('#tab_documents')
app[:documents_count] = documents_link.inner_text.match(/\d+/)[0].to_i
app[:documents_url] = @base_url + documents_link[:href]
else
app[:documents_count] = 0
app[:documents_url] = nil
# Bradford has #tab_documents but without the document count on it
app[:documents_count] = 0
app[:documents_url] = nil

if documents_link = res.at('.associateddocument a')
if documents_link.inner_text.match(/\d+/)
app[:documents_count] = documents_link.inner_text.match(/\d+/)[0].to_i
app[:documents_url] = @base_url + documents_link[:href]
end
elsif documents_link = res.at('#tab_documents')
if documents_link.inner_text.match(/\d+/)
app[:documents_count] = documents_link.inner_text.match(/\d+/)[0].to_i
app[:documents_url] = @base_url + documents_link[:href]
end
end

# We need to find values in the table by using the th labels.
# The row indexes/positions change from site to site (or even app to app) so we can't rely on them.



Cargando…
Cancelar
Guardar