mirror of
https://gitlab.dit.htwk-leipzig.de/fsr-im/tools/flatscraper.git
synced 2026-01-16 16:22:27 +01:00
feat: add BGL scraper and integrate into main scraping process; update image scraping logic
This commit is contained in:
@@ -1,16 +1,23 @@
|
||||
import requests
|
||||
from src.lwb.scraper import EASYSQUARE_HEADERS, EASYSQUARE_PARAMS
|
||||
|
||||
def scrape_image(url, owner, *, timeout=30):
    """Download the image at *url* and return its raw bytes.

    How the request is built depends on *owner*:

    * ``"BGL"`` - plain GET without extra headers or query parameters.
    * ``"LWB"`` - GET sent with ``EASYSQUARE_HEADERS`` and
      ``EASYSQUARE_PARAMS``.

    Args:
        url: Address of the image to fetch.
        owner: Provider the image belongs to; ``"BGL"`` or ``"LWB"``.
        timeout: Timeout in seconds handed to ``requests`` for the GET call.

    Returns:
        The response body as ``bytes``, or ``b''`` when *owner* is not one
        of the supported values or the server answers with a status code
        other than 200.

    Exceptions raised by ``requests`` itself (connection errors, timeouts)
    are not caught here and propagate to the caller.
    """
    # Pick the per-provider request options up front so the request and the
    # error handling below exist only once.
    if owner == "BGL":
        source_label = "BGL"
        request_kwargs = {}
    elif owner == "LWB":
        source_label = "Easysquare"
        request_kwargs = {
            "headers": EASYSQUARE_HEADERS,
            "params": EASYSQUARE_PARAMS,
        }
    else:
        # Without this branch an unsupported owner left `response` unassigned
        # and the final return raised UnboundLocalError. Follow the function's
        # existing failure convention instead: report and return no image.
        print(f"Unbekannter Anbieter beim Abrufen des Bildes: {owner}")
        return b''

    # The context manager closes the session (and its pooled connections)
    # once the download is finished.
    with requests.Session() as session:
        response = session.get(url, timeout=timeout, **request_kwargs)

        if response.status_code != 200:
            print(f"Fehler beim Abrufen von {source_label}: {response.status_code}")
            # return empty image
            return b''

        # get image from response
        return response.content
|
||||
|
||||
|
||||
Reference in New Issue
Block a user