Establish sql connection only after data got scraped successfully
This commit is contained in:
parent
fc952670bb
commit
9fb1d81652
@ -13,6 +13,18 @@ class DwdScraper:
|
||||
last_station = self.get_station_to_update()
|
||||
print("checking station", last_station)
|
||||
|
||||
print(last_station)
|
||||
r = requests.get('https://opendata.dwd.de/climate_environment/CDC/observations_germany/climate/daily/kl/recent/tageswerte_KL_' + str(last_station) + '_akt.zip', stream=True)
|
||||
print(r.url)
|
||||
if r.status_code != 200:
|
||||
return
|
||||
|
||||
zip = zipfile.ZipFile(io.BytesIO(r.content))
|
||||
files = zip.namelist()
|
||||
print(files)
|
||||
files_climate = [f for f in files if f.startswith("produkt_klima_")]
|
||||
print(files_climate)
|
||||
|
||||
with psycopg2.connect(config_db["uri"]) as conn:
|
||||
with conn.cursor() as cur:
|
||||
|
||||
@ -22,19 +34,6 @@ class DwdScraper:
|
||||
curr_station_id = current_station[0]
|
||||
curr_station_dwd_id = current_station[4]
|
||||
|
||||
print(curr_station_dwd_id)
|
||||
r = requests.get('https://opendata.dwd.de/climate_environment/CDC/observations_germany/climate/daily/kl/recent/tageswerte_KL_' + str(curr_station_dwd_id) + '_akt.zip', stream=True)
|
||||
print(r.url)
|
||||
if r.status_code == 200:
|
||||
zip = zipfile.ZipFile(io.BytesIO(r.content))
|
||||
files = zip.namelist()
|
||||
print(files)
|
||||
files_climate = [f for f in files if f.startswith("produkt_klima_")]
|
||||
print(files_climate)
|
||||
|
||||
|
||||
buffer = []
|
||||
|
||||
is_first_line = True
|
||||
|
||||
for line in zip.open(files_climate[0]):
|
||||
|
Loading…
Reference in New Issue
Block a user