|
|
@@ -228,13 +228,13 @@ def probe_common_docs(base_url:, key:, danum:, referer:)
|
|
|
saved = download_doc(pdf_url, referer: referer, council_reference: danum_raw, jar: SESSION_JAR)
|
|
|
local_rel = "/files/launceston/#{safe_name(danum_raw)}/#{File.basename(saved)}"
|
|
|
rescue StandardError => e
|
|
|
- warn "DOC download failed (probe) for #{danum_raw} #{File.basename(pdf_url)}: #{e.class} #{e.message}"
|
|
|
+ Log.warn "scraper", "DOC download failed (probe) for #{danum_raw} #{File.basename(pdf_url)}: #{e.class} #{e.message}"
|
|
|
end
|
|
|
end
|
|
|
found << { name: File.basename(pdf_url), url: pdf_url, local_url: local_rel }
|
|
|
end
|
|
|
rescue StandardError => e
|
|
|
- warn "[launcestoncity] probe failed for #{pdf_url}: #{e.class} #{e.message}"
|
|
|
+ Log.warn "scraper", "[launcestoncity] probe failed for #{pdf_url}: #{e.class} #{e.message}"
|
|
|
next
|
|
|
end
|
|
|
end
|
|
|
@@ -371,7 +371,7 @@ tables.each do |t|
|
|
|
saved = download_doc(href, referer: candidate_url, council_reference: council_reference, jar: SESSION_JAR)
|
|
|
local_rel = "/files/launceston/#{safe_name(council_reference)}/#{File.basename(saved)}"
|
|
|
rescue StandardError => e
|
|
|
- warn "DOC download failed for #{council_reference} #{name}: #{e.class} #{e.message}"
|
|
|
+ Log.warn "scraper", "DOC download failed for #{council_reference} #{name}: #{e.class} #{e.message}"
|
|
|
end
|
|
|
end
|
|
|
|
|
|
@@ -398,7 +398,7 @@ tables.each do |t|
|
|
|
anchors_added = probed.size if probed.any?
|
|
|
end
|
|
|
rescue StandardError => e
|
|
|
- warn "Probe fallback failed for #{council_reference}: #{e.class} #{e.message}"
|
|
|
+ Log.warn "scraper", "Probe fallback failed for #{council_reference}: #{e.class} #{e.message}"
|
|
|
end
|
|
|
end
|
|
|
|
|
|
@@ -413,23 +413,23 @@ tables.each do |t|
|
|
|
FileUtils.mkdir_p(dump_dir)
|
|
|
File.write(File.join(dump_dir, "#{safe_name(council_reference)}.html"), list_html[0, 5000])
|
|
|
rescue StandardError => e
|
|
|
- warn "Failed to write dump for #{council_reference}: #{e.class} #{e.message}"
|
|
|
+ Log.warn "scraper", "Failed to write dump for #{council_reference}: #{e.class} #{e.message}"
|
|
|
end
|
|
|
end
|
|
|
|
|
|
rescue StandardError => e
|
|
|
- warn "Doc list fetch failed for #{council_reference} at #{candidate_url} (referer: #{ref}): #{e.class} #{e.message}"
|
|
|
+ Log.warn "scraper", "Doc list fetch failed for #{council_reference} at #{candidate_url} (referer: #{ref}): #{e.class} #{e.message}"
|
|
|
end
|
|
|
end
|
|
|
end
|
|
|
|
|
|
if used_url.nil?
|
|
|
- warn "Docs page had no usable links for #{council_reference} after variants: #{variants_for_doc_list(doc_list_url).join(' | ')}"
|
|
|
+ Log.warn "scraper", "Docs page had no usable links for #{council_reference} after variants: #{variants_for_doc_list(doc_list_url).join(' | ')}"
|
|
|
end
|
|
|
|
|
|
|
|
|
rescue StandardError => e
|
|
|
- warn "Doc list fetch failed for #{council_reference}: #{e.class} #{e.message}"
|
|
|
+ Log.warn "scraper", "Doc list fetch failed for #{council_reference}: #{e.class} #{e.message}"
|
|
|
end
|
|
|
end
|
|
|
|
|
|
@@ -469,7 +469,7 @@ tables.each do |t|
|
|
|
})
|
|
|
|
|
|
rescue StandardError => e
|
|
|
- warn "Enrich failed for #{council_reference}: #{e.class} #{e.message}"
|
|
|
+ Log.warn "scraper", "Enrich failed for #{council_reference}: #{e.class} #{e.message}"
|
|
|
end
|
|
|
end
|
|
|
|