Skip to content

Commit

Permalink
Update scraper.rb
Browse files Browse the repository at this point in the history
  • Loading branch information
BfB-Schenefeld committed Apr 21, 2024
1 parent 5b5852c commit e1d30ab
Showing 1 changed file with 4 additions and 7 deletions.
11 changes: 4 additions & 7 deletions scraper.rb
Original file line number Diff line number Diff line change
Expand Up @@ -35,21 +35,19 @@ def scrape_event_details(event_url)
event_data = []
document.css('tr').each do |row|
index_number = row.css('td.tonr a').text.strip
# Überprüfe, ob ein Hyperlink vorhanden ist und extrahiere entsprechend den Text
betreff_link = row.css('td.tobetreff div a').first
betreff_text = if betreff_link
betreff_link.text.strip
else
row.css('td.tobetreff div').text.strip
end
vorlage_link = row.at_css('td.tovonr a')
vorlage_url = vorlage_link ? "https://www.sitzungsdienst-schenefeld.de/bi/#{vorlage_link['href']}" : "Keine Vorlage"
vorlage_text = vorlage_link ? vorlage_link.text.strip : "Keine Vorlage"
vorlage_text = vorlage_link ? vorlage_link.text.strip : "-"

# Speichere Daten nur, wenn 'index_number' und 'betreff_text' nicht leer sind
if !index_number.empty? && !betreff_text.empty?
event_data << [index_number, betreff_text, vorlage_text, vorlage_url]
puts "Found: #{index_number}, Betreff: #{betreff_text}, Vorlage: #{vorlage_text}, Vorlage URL: #{vorlage_url}"
event_data << [index_number, betreff_text, vorlage_text]
puts "Found: #{index_number}, Betreff: #{betreff_text}, Vorlage: #{vorlage_text}"
end
end
return event_data
Expand All @@ -72,11 +70,10 @@ def scrape_calendar_data(year, month)
# Function to save data to CSV
def save_to_csv(data)
CSV.open("event_details.csv", "wb") do |csv|
csv << ["Index Number", "Betreff", "Vorlage Text", "Vorlage URL"]
csv << ["Index Number", "Betreff", "Vorlage"]
data.each { |row| csv << row }
end
end

# Start scraping
scrape_calendar_data(2024, 3)

0 comments on commit e1d30ab

Please sign in to comment.