"""Download the DWD 10-minute air-temperature "now" archives and print them.

The script reads the directory listing at ``url``, downloads every linked
file whose link text contains ``10minutenwerte`` into ``download_folder``
(files that already exist locally are skipped), and finally prints the raw
bytes of the first member of every ZIP archive found in that folder.

The change that introduced this script also added the pattern ``dwd-data*``
to ``.gitignore``, which keeps the download folder out of version control.
"""

from operator import contains  # kept from the original import list (unused)
import io  # kept from the original import list (unused)
import os
import zipfile
from urllib.parse import urljoin

import requests
from bs4 import BeautifulSoup

url = 'https://opendata.dwd.de/climate_environment/CDC/observations_germany/climate/10_minutes/air_temperature/now/'
download_folder = 'dwd-data/'

# Substring that marks a link in the directory listing as a data archive.
ARCHIVE_MARKER = '10minutenwerte'

# Seconds to wait for the server before giving up; without a timeout a
# stalled connection would block the script forever.
REQUEST_TIMEOUT = 60


def download(url, dest_file):
    """Fetch *url* and store the response body at *dest_file*.

    Args:
        url: Address of the file to download.
        dest_file: Local path the downloaded bytes are written to.

    Raises:
        requests.HTTPError: If the server answers with an error status. The
            check happens before the destination is opened, so an error page
            is never saved under the archive's name.
    """
    response = requests.get(url, timeout=REQUEST_TIMEOUT)
    response.raise_for_status()
    with open(dest_file, 'wb') as target:
        target.write(response.content)


def _list_archive_names(index_url):
    """Return the link texts of all data archives listed at *index_url*."""
    response = requests.get(index_url, timeout=REQUEST_TIMEOUT)
    response.raise_for_status()

    soup = BeautifulSoup(response.text, 'html.parser')
    print(soup.title)

    # NOTE(review): the link text is used as the file name, as before; this
    # assumes the listing shows full, untruncated names - confirm.
    names = [link.text for link in soup.find_all('a')
             if ARCHIVE_MARKER in link.text]
    # Drop duplicates while keeping the listing order.
    return list(dict.fromkeys(names))


def _download_missing(names):
    """Download every archive in *names* that is not yet in the folder."""
    os.makedirs(download_folder, exist_ok=True)

    # Work out the outstanding files first so the progress total is exact.
    pending = [name for name in names
               if not os.path.isfile(os.path.join(download_folder, name))]
    total = len(pending)

    for count, name in enumerate(pending, start=1):
        # urljoin avoids the doubled slash that plain concatenation with
        # "/" produced, because ``url`` already ends in a slash.
        download(urljoin(url, name), os.path.join(download_folder, name))
        print("Download ", count, " von ", total)


def _print_archives():
    """Print the raw bytes of the first member of each downloaded archive."""
    for filename in sorted(os.listdir(download_folder)):
        file_path = os.path.join(download_folder, filename)

        # Skip sub-directories and stray non-archive files instead of
        # aborting the whole run on them.
        if not zipfile.is_zipfile(file_path):
            continue

        with zipfile.ZipFile(file_path) as archive:
            members = archive.namelist()
            if not members:
                continue
            print(archive.read(members[0]))


def main():
    """Run the full fetch-and-print sequence."""
    _download_missing(_list_archive_names(url))
    _print_archives()


if __name__ == "__main__":
    main()