för att man inte kan ladda upp fler filer
This commit is contained in:
99
crawler.py
Normal file
99
crawler.py
Normal file
@ -0,0 +1,99 @@
|
||||
import requests
|
||||
from bs4 import BeautifulSoup
|
||||
import json
|
||||
import os
|
||||
from selenium import webdriver
|
||||
from selenium.webdriver.chrome.options import Options
|
||||
|
||||
# CONFIGURATION
|
||||
NATIONER_URL = "https://www.nationsguiden.se/" # Example URL, replace with actual
|
||||
DISCORD_WEBHOOK_URL = "https://discord.com/api/webhooks/1437888900747104317/TI2RfDGC5dzoi5JGz6UO2aD23teYNwa6pLQOskhaDnsSVe3cr8_rly0L3K0VyIYARgeR"
|
||||
|
||||
|
||||
def fetch_nationer_open_times(url):
|
||||
import re
|
||||
print(f"DEBUG: Current working directory is {os.getcwd()}")
|
||||
# Use headless browser to get rendered DOM and extract event data
|
||||
chrome_options = Options()
|
||||
chrome_options.add_argument('--headless')
|
||||
chrome_options.add_argument('--disable-gpu')
|
||||
chrome_options.add_argument('--no-sandbox')
|
||||
driver = webdriver.Chrome(options=chrome_options)
|
||||
driver.get(url)
|
||||
import time
|
||||
time.sleep(5) # Wait for JS to load events
|
||||
|
||||
nationer_data = []
|
||||
# Find all event blocks (adjust selector as needed)
|
||||
event_blocks = driver.find_elements("css selector", "div.flex.flex-col.justify-evenly")
|
||||
print(f"DEBUG: Found {len(event_blocks)} event blocks in DOM.")
|
||||
for block in event_blocks:
|
||||
try:
|
||||
event_title = block.find_element("css selector", "h4 a").text.strip()
|
||||
except Exception:
|
||||
event_title = ""
|
||||
try:
|
||||
organiser = block.find_element("css selector", "a.text-primary, p.text-primary").text.strip()
|
||||
except Exception:
|
||||
organiser = ""
|
||||
try:
|
||||
open_time = block.find_element("css selector", "time").text.strip()
|
||||
except Exception:
|
||||
open_time = ""
|
||||
try:
|
||||
permalink = block.find_element("css selector", "h4 a").get_attribute("href")
|
||||
except Exception:
|
||||
permalink = ""
|
||||
if event_title:
|
||||
print(f"DEBUG: Event: {event_title}, Organiser: {organiser}, Time: {open_time}")
|
||||
nationer_data.append({
|
||||
"event": event_title,
|
||||
"nation": organiser,
|
||||
"open_time": open_time,
|
||||
"permalink": permalink
|
||||
})
|
||||
driver.quit()
|
||||
# Write debug file for extracted events
|
||||
debug_path = os.path.abspath("/mnt/serverdata/html/crawlernation/events_debug.json")
|
||||
try:
|
||||
with open(debug_path, "w", encoding="utf-8") as f:
|
||||
json.dump(nationer_data, f, ensure_ascii=False, indent=2)
|
||||
print(f"Wrote debug event data to {debug_path}")
|
||||
except Exception as e:
|
||||
print(f"Error writing debug file: {e}")
|
||||
return nationer_data
|
||||
|
||||
|
||||
def send_to_discord_webhook(data, webhook_url):
|
||||
if not webhook_url:
|
||||
raise ValueError("DISCORD_WEBHOOK_URL not set")
|
||||
content = "Nationer Öppna Idag:\n"
|
||||
for item in data:
|
||||
content += f"**{item['nation']}**\nEvent: {item['event']}\nTid: {item['open_time']}\n---\n"
|
||||
# Discord message limit is 2000 characters
|
||||
if len(content) > 1900:
|
||||
content = content[:1900] + "... (truncated)"
|
||||
payload = {"content": content}
|
||||
try:
|
||||
|
||||
response = requests.post(webhook_url, json=payload)
|
||||
response.raise_for_status()
|
||||
return response.status_code
|
||||
except requests.exceptions.HTTPError as e:
|
||||
print(f"Discord webhook error: {e}\nPayload: {payload}")
|
||||
return None
|
||||
|
||||
|
||||
def main():
|
||||
nationer_data = fetch_nationer_open_times(NATIONER_URL)
|
||||
if nationer_data:
|
||||
send_to_discord_webhook(nationer_data, DISCORD_WEBHOOK_URL)
|
||||
else:
|
||||
send_to_discord_webhook([
|
||||
{"nation": "Inga aktiviteter hittades.", "event": "", "open_time": ""}
|
||||
], DISCORD_WEBHOOK_URL)
|
||||
|
||||
|
||||
if __name__ == "__main__":
|
||||
main()
|
||||
|
||||
7
docker-compose.yml
Normal file
7
docker-compose.yml
Normal file
@ -0,0 +1,7 @@
|
||||
version: '3.8'
|
||||
services:
|
||||
crawler:
|
||||
build: .
|
||||
environment:
|
||||
- DISCORD_WEBHOOK_URL=https://discord.com/api/webhooks/1437888900747104317/TI2RfDGC5dzoi5JGz6UO2aD23teYNwa6pLQOskhaDnsSVe3cr8_rly0L3K0VyIYARgeR
|
||||
shm_size: '2gb' # For Chrome headless stability
|
||||
1287
event_blocks_debug.html
Normal file
1287
event_blocks_debug.html
Normal file
File diff suppressed because one or more lines are too long
344
events_debug.json
Normal file
344
events_debug.json
Normal file
@ -0,0 +1,344 @@
|
||||
[
|
||||
{
|
||||
"event": "Frukost på Stockholms nation",
|
||||
"nation": "Stockholms nation",
|
||||
"open_time": "Idag 07:30-10:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/frukost-pa-stockholms-nation/"
|
||||
},
|
||||
{
|
||||
"event": "Frukost i Majs Café",
|
||||
"nation": "Norrlands nation",
|
||||
"open_time": "Idag 08:00-10:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/frukost-i-majs-cafe/"
|
||||
},
|
||||
{
|
||||
"event": "Studieplatser – Södermanlands-Nerikes Nationsbibliotek",
|
||||
"nation": "Södermanlands-Nerikes nation",
|
||||
"open_time": "Idag 08:00-19:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/studieplatser-sodermanlands-nerikes-nationsbibliotek/"
|
||||
},
|
||||
{
|
||||
"event": "Studieplatser och bibliotek på Norrlands nation",
|
||||
"nation": "Norrlands nation",
|
||||
"open_time": "Idag 08:00-20:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/studieplatser-och-bibliotek-pa-norrlands-nation-2/"
|
||||
},
|
||||
{
|
||||
"event": "Studieplatser",
|
||||
"nation": "Smålands nation",
|
||||
"open_time": "Idag 10:00-17:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/studieplatser/"
|
||||
},
|
||||
{
|
||||
"event": "Gotlands Pluggfika",
|
||||
"nation": "Gotlands nation",
|
||||
"open_time": "Idag 10:00-16:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/pluggfika/"
|
||||
},
|
||||
{
|
||||
"event": "Studieplatser på Göteborgs Nation",
|
||||
"nation": "Göteborgs nation",
|
||||
"open_time": "Idag 10:00-17:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/studieplatser-pa-goteborgs-nation/"
|
||||
},
|
||||
{
|
||||
"event": "Studieplatser",
|
||||
"nation": "Östgöta nation",
|
||||
"open_time": "Idag 10:00-17:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/studieplatser-4/"
|
||||
},
|
||||
{
|
||||
"event": "Studieplatser",
|
||||
"nation": "Gästrike-Hälsinge nation",
|
||||
"open_time": "Idag 10:00-18:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/studieplatser-2/"
|
||||
},
|
||||
{
|
||||
"event": "Studieplatser på Västmanlands-Dala nation",
|
||||
"nation": "Västmanlands-Dala nation",
|
||||
"open_time": "Idag 10:00-18:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/studieplatser-pa-vastmanlands-dala-nation/"
|
||||
},
|
||||
{
|
||||
"event": "Library",
|
||||
"nation": "Uplands nation",
|
||||
"open_time": "Idag 12:00-14:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/library-4/"
|
||||
},
|
||||
{
|
||||
"event": "Utlåningstid — Smålands bibliotek",
|
||||
"nation": "Smålands nation",
|
||||
"open_time": "Idag 13:00-15:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/utlaningstid-smalands-bibliotek-2/"
|
||||
},
|
||||
{
|
||||
"event": "Bibliotekets öppettider",
|
||||
"nation": "Västmanlands-Dala nation",
|
||||
"open_time": "Idag 15:00-18:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/bibliotekets-oppettider/"
|
||||
},
|
||||
{
|
||||
"event": "Bibliotekets lånetider",
|
||||
"nation": "Västgöta nation",
|
||||
"open_time": "Idag 17:00-18:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/bibliotekets-lanetider/"
|
||||
},
|
||||
{
|
||||
"event": "Uplands nation – Office hours 1Q",
|
||||
"nation": "Uplands nation",
|
||||
"open_time": "Idag 10:00-12:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/uplands-nation-office-hours-1q-3/"
|
||||
},
|
||||
{
|
||||
"event": "Mottagningstid 1Q & 3Q",
|
||||
"nation": "Gästrike-Hälsinge nation",
|
||||
"open_time": "Idag 11:00-13:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/mottagningstid-1q-3q/"
|
||||
},
|
||||
{
|
||||
"event": "Mottagningstider på Göteborgs Nation",
|
||||
"nation": "Göteborgs nation",
|
||||
"open_time": "Idag 11:00-15:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/mottagningstider-pa-goteborgs-nation/"
|
||||
},
|
||||
{
|
||||
"event": "Kanslitider på Norrlands nation",
|
||||
"nation": "Norrlands nation",
|
||||
"open_time": "Idag 13:00-17:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/kanslitider-pa-norrlands-nation-4/"
|
||||
},
|
||||
{
|
||||
"event": "Mottagningstider på Stockholms nation",
|
||||
"nation": "Stockholms nation",
|
||||
"open_time": "Idag 14:00-16:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/mottagningstider-pa-stockholms-nation/"
|
||||
},
|
||||
{
|
||||
"event": "Kuratorsexpeditionens öppettider",
|
||||
"nation": "Västmanlands-Dala nation",
|
||||
"open_time": "Idag 14:00-16:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/kuratorsexpeditionens-oppettider-3/"
|
||||
},
|
||||
{
|
||||
"event": "BiblioteKarins mottagningstid",
|
||||
"nation": "Västmanlands-Dala nation",
|
||||
"open_time": "Idag 15:00-18:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/bibliotekarins-mottagningstid/"
|
||||
},
|
||||
{
|
||||
"event": "Gästkortsförsäljning hos Kuratorskonventet",
|
||||
"nation": "Startsida",
|
||||
"open_time": "Idag 17:00-19:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/gastkortsforsaljning-hos-kuratorskonventet/"
|
||||
},
|
||||
{
|
||||
"event": "Café Bakfickan",
|
||||
"nation": "Stockholms nation",
|
||||
"open_time": "Idag 10:00-17:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/cafe-bakfickan/"
|
||||
},
|
||||
{
|
||||
"event": "Hattstugan",
|
||||
"nation": "Östgöta nation",
|
||||
"open_time": "Idag 11:00-14:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/hattstugan/"
|
||||
},
|
||||
{
|
||||
"event": "Lunch på Stockholms nation",
|
||||
"nation": "Stockholms nation",
|
||||
"open_time": "Idag 11:30-13:15",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/lunch-pa-stockholms-nation/"
|
||||
},
|
||||
{
|
||||
"event": "Lunch å Södermanlands-Nerikes nation",
|
||||
"nation": "Södermanlands-Nerikes nation",
|
||||
"open_time": "Idag 11:30-13:30",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/lunch-a-sodermanlands-nerikes-nation/"
|
||||
},
|
||||
{
|
||||
"event": "Lunch i Majs Café",
|
||||
"nation": "Norrlands nation",
|
||||
"open_time": "Idag 12:00-14:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/lunch-i-majs-cafe/"
|
||||
},
|
||||
{
|
||||
"event": "Sopplunch",
|
||||
"nation": "Västgöta nation",
|
||||
"open_time": "Idag 12:00-14:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/sopplunch/"
|
||||
},
|
||||
{
|
||||
"event": "Gotlands Pluggfika",
|
||||
"nation": "Gotlands nation",
|
||||
"open_time": "Idag 10:00-16:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/pluggfika/"
|
||||
},
|
||||
{
|
||||
"event": "Café Bakfickan",
|
||||
"nation": "Stockholms nation",
|
||||
"open_time": "Idag 10:00-17:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/cafe-bakfickan/"
|
||||
},
|
||||
{
|
||||
"event": "Hattstugan",
|
||||
"nation": "Östgöta nation",
|
||||
"open_time": "Idag 11:00-14:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/hattstugan/"
|
||||
},
|
||||
{
|
||||
"event": "Carl Larssons café",
|
||||
"nation": "Västmanlands-Dala nation",
|
||||
"open_time": "Idag 11:30-15:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/carl-larssons-cafe/"
|
||||
},
|
||||
{
|
||||
"event": "Söderbloms Café ☕",
|
||||
"nation": "Gästrike-Hälsinge nation",
|
||||
"open_time": "Idag 12:00-15:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/soderbloms-cafe/"
|
||||
},
|
||||
{
|
||||
"event": "Fika i Majs Café",
|
||||
"nation": "Norrlands nation",
|
||||
"open_time": "Idag 14:00-17:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/fika-i-majs-cafe/"
|
||||
},
|
||||
{
|
||||
"event": "V-Dala Puben",
|
||||
"nation": "Västmanlands-Dala nation",
|
||||
"open_time": "2025-11-11 18:00-01:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/v-dala-puben/"
|
||||
},
|
||||
{
|
||||
"event": "Pub Bakfickan",
|
||||
"nation": "Stockholms nation",
|
||||
"open_time": "Idag 17:00-23:59",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/pub-bakfickan/"
|
||||
},
|
||||
{
|
||||
"event": "Orvars Krog",
|
||||
"nation": "Norrlands nation",
|
||||
"open_time": "Idag 17:00-01:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/orvars-krog/"
|
||||
},
|
||||
{
|
||||
"event": "Wermlandskällar’n | Värmlands nation",
|
||||
"nation": "Värmlands nation",
|
||||
"open_time": "Idag 17:30-00:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/wermlandskallarn-varmlands-nation/"
|
||||
},
|
||||
{
|
||||
"event": "Svantes Källare",
|
||||
"nation": "Uplands nation",
|
||||
"open_time": "Idag 18:00-23:55",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/svantes-kallare/"
|
||||
},
|
||||
{
|
||||
"event": "Pub Kronan",
|
||||
"nation": "Kalmar nation",
|
||||
"open_time": "Idag 18:00-23:59",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/pub-kronan-7/"
|
||||
},
|
||||
{
|
||||
"event": "Pub Djäknen",
|
||||
"nation": "Västgöta nation",
|
||||
"open_time": "Idag 18:00-01:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/pub-djaknen-2/"
|
||||
},
|
||||
{
|
||||
"event": "V-Dala Puben",
|
||||
"nation": "Västmanlands-Dala nation",
|
||||
"open_time": "Idag 18:00-01:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/v-dala-puben/"
|
||||
},
|
||||
{
|
||||
"event": "Ghuben",
|
||||
"nation": "Gästrike-Hälsinge nation",
|
||||
"open_time": "Idag 18:00-23:55",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/ghuben-3/"
|
||||
},
|
||||
{
|
||||
"event": "Tages källare",
|
||||
"nation": "Östgöta nation",
|
||||
"open_time": "Idag 18:00-23:55",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/tages-kallare/"
|
||||
},
|
||||
{
|
||||
"event": "PUB HYTTAN – Smålands nation",
|
||||
"nation": "Smålands nation",
|
||||
"open_time": "Idag 18:00-23:30",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/pub-hyttan/"
|
||||
},
|
||||
{
|
||||
"event": "Glenns Pub",
|
||||
"nation": "Göteborgs nation",
|
||||
"open_time": "Idag 18:00-00:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/glenns-pub/"
|
||||
},
|
||||
{
|
||||
"event": "Pub Bakfickan",
|
||||
"nation": "Stockholms nation",
|
||||
"open_time": "Idag 17:00-23:59",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/pub-bakfickan/"
|
||||
},
|
||||
{
|
||||
"event": "Bistro å Södermanlands-Nerikes nation",
|
||||
"nation": "Södermanlands-Nerikes nation",
|
||||
"open_time": "Idag 18:00-01:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/bistro-a-sodermanlands-nerikes-nation/"
|
||||
},
|
||||
{
|
||||
"event": "Utlåningstid — Smålands bibliotek",
|
||||
"nation": "Smålands nation",
|
||||
"open_time": "Idag 13:00-15:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/utlaningstid-smalands-bibliotek-2/"
|
||||
},
|
||||
{
|
||||
"event": "BiblioteKarins mottagningstid",
|
||||
"nation": "Västmanlands-Dala nation",
|
||||
"open_time": "Idag 15:00-18:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/bibliotekarins-mottagningstid/"
|
||||
},
|
||||
{
|
||||
"event": "Bibliotekets öppettider",
|
||||
"nation": "Västmanlands-Dala nation",
|
||||
"open_time": "Idag 15:00-18:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/bibliotekets-oppettider/"
|
||||
},
|
||||
{
|
||||
"event": "Pubquiz å Södermanlands-Nerikes nation",
|
||||
"nation": "Södermanlands-Nerikes nation",
|
||||
"open_time": "Idag 18:00-20:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/pubquiz-a-sodermanlands-nerikes-nation-2/"
|
||||
},
|
||||
{
|
||||
"event": "Yoga",
|
||||
"nation": "Östgöta nation",
|
||||
"open_time": "Idag 18:00-19:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/yoga/"
|
||||
},
|
||||
{
|
||||
"event": "Löpning med VGIF",
|
||||
"nation": "",
|
||||
"open_time": "Idag 18:00-19:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/lopning-med-vgif/"
|
||||
},
|
||||
{
|
||||
"event": "Y2K HEXAGON på Norrlands nation",
|
||||
"nation": "Norrlands nation",
|
||||
"open_time": "Idag 21:00-01:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/y2k-hexagon-pa-norrlands-nation/"
|
||||
},
|
||||
{
|
||||
"event": "Släpp Kontaktdagen",
|
||||
"nation": "Västmanlands-Dala nation",
|
||||
"open_time": "2025-11-11 22:30-02:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/slapp-kontaktdagen/"
|
||||
},
|
||||
{
|
||||
"event": "Utlåningstid Södermanlands-Nerikes Nationsbibliotek",
|
||||
"nation": "Södermanlands-Nerikes nation",
|
||||
"open_time": "Idag 16:00-18:00",
|
||||
"permalink": "https://www.nationsguiden.se/events/event/utlaningstid-sodermanlands-nerikes-nationsbibliotek/"
|
||||
}
|
||||
]
|
||||
597
full_page_debug.html
Normal file
597
full_page_debug.html
Normal file
File diff suppressed because one or more lines are too long
17
h4_blocks_debug.html
Normal file
17
h4_blocks_debug.html
Normal file
@ -0,0 +1,17 @@
|
||||
<h4 class="text-lg sm:text-xl font-bold">
|
||||
<a :href="event.permalink" x-text="event.title">
|
||||
</a>
|
||||
</h4>
|
||||
|
||||
|
||||
|
||||
<a :href="event.organiser.permalink" class="text-primary text-sm sm:text-base sm:mt-1" x-show="event.organiser.permalink" x-text="event.organiser.title">
|
||||
</a>
|
||||
|
||||
|
||||
|
||||
<p class="text-primary text-sm sm:text-base sm:mt-1" x-show="!event.organiser.permalink" x-text="event.organiser.title">
|
||||
</p>
|
||||
|
||||
|
||||
|
||||
Reference in New Issue
Block a user