Skip to content

Commit

Permalink
Update scraper.rb
Browse files Browse the repository at this point in the history
  • Loading branch information
BfB-Schenefeld committed Apr 21, 2024
1 parent 8f4133e commit 89a0283
Showing 1 changed file with 13 additions and 9 deletions.
22 changes: 13 additions & 9 deletions scraper.rb
Original file line number Diff line number Diff line change
Expand Up @@ -34,15 +34,20 @@ def scrape_event_details(event_url)

event_data = []
document.css('tr').each do |row|
index_number = row.css('td.tonr a').text.strip
betreff = row.css('td.tobetreff div a').text.strip
vorlage_link = row.at_css('td.tovonr a')
vorlage_url = vorlage_link ? "https://www.sitzungsdienst-schenefeld.de/bi/#{vorlage_link['href']}" : "No Vorlage"
vorlage_text = vorlage_link ? vorlage_link.text.strip : "No Vorlage"
# Prüfe, ob sinnvolle Daten vorhanden sind
if row.css('td.tonr a').any? && row.css('td.tobetreff div a').any?
index_number = row.css('td.tonr a').text.strip
betreff = row.css('td.tobetreff div a').text.strip
vorlage_link = row.at_css('td.tovonr a')
vorlage_url = vorlage_link ? "https://www.sitzungsdienst-schenefeld.de/bi/#{vorlage_link['href']}" : "Keine Vorlage"
vorlage_text = vorlage_link ? vorlage_link.text.strip : "Keine Vorlage"

# Save data to an array
event_data << [index_number, betreff, vorlage_text, vorlage_url]
puts "Found: #{index_number}, Betreff: #{betreff}, Vorlage: #{vorlage_text}, Vorlage URL: #{vorlage_url}"
# Speichere Daten nur, wenn 'index_number' und 'betreff' nicht leer sind
if !index_number.empty? && !betreff.empty?
event_data << [index_number, betreff, vorlage_text, vorlage_url]
puts "Found: #{index_number}, Betreff: #{betreff}, Vorlage: #{vorlage_text}, Vorlage URL: #{vorlage_url}"
end
end
end
return event_data
end
Expand Down Expand Up @@ -71,4 +76,3 @@ def save_to_csv(data)

# Start scraping
scrape_calendar_data(2024, 3)

0 comments on commit 89a0283

Please sign in to comment.