mirror of
https://gitlab.dit.htwk-leipzig.de/fsr-im/tools/flatscraper.git
synced 2026-01-16 03:22:26 +01:00
44 lines
1.3 KiB
Python
44 lines
1.3 KiB
Python
import requests
|
|
from src.lwb.scraper import EASYSQUARE_HEADERS
|
|
|
|
def scrape_image(url, owner, timeout=30):
    """Download the image at *url* and return its raw bytes.

    Args:
        url: URL of the image to fetch.
        owner: Provider code the URL belongs to. ``"LWB"`` requests are sent
            with ``EASYSQUARE_HEADERS``; ``"BGL"``, ``"VLW"`` and every other
            value are fetched with a plain GET. The value also selects the
            wording of the error message.
        timeout: Seconds to wait for the server before giving up, passed
            straight to ``requests``.

    Returns:
        The response body as ``bytes``, or ``b''`` (an empty image) when the
        server answers with a status other than 200 or the request fails at
        the transport level (connection error, timeout, ...).
    """
    # The providers differ only in the error-message wording and in whether
    # the Easysquare headers are sent, so resolve both up front.
    if owner == "BGL":
        source = "von BGL"
    elif owner == "VLW":
        source = "von VLW"
    elif owner == "LWB":
        source = "von Easysquare"
    else:
        source = "der Standardquelle"

    # LWB image URLs already carry the required params; only headers are added.
    headers = EASYSQUARE_HEADERS if owner == "LWB" else None

    try:
        # The context manager closes the session's connection pool even when
        # the request raises; the body is fully read before the block exits
        # because streaming is not enabled.
        with requests.Session() as session:
            response = session.get(url, headers=headers, timeout=timeout)
    except requests.RequestException as exc:
        # Keep the "empty image on failure" contract for network errors too.
        print(f"Fehler beim Abrufen {source}: {exc}")
        return b''

    if response.status_code != 200:
        print(f"Fehler beim Abrufen {source}: {response.status_code}")
        # return empty image
        return b''

    return response.content
|