From f233bc1208950e3a9658a6b3bc8426e09cdb0607 Mon Sep 17 00:00:00 2001 From: Jim Martens Date: Wed, 8 Jan 2020 21:04:50 +0100 Subject: [PATCH] Save documents in extra directory --- src/twomartens/allrisscraper/main.py | 7 ++++--- 1 file changed, 4 insertions(+), 3 deletions(-) diff --git a/src/twomartens/allrisscraper/main.py b/src/twomartens/allrisscraper/main.py index 623b43c..f22899e 100644 --- a/src/twomartens/allrisscraper/main.py +++ b/src/twomartens/allrisscraper/main.py @@ -115,16 +115,17 @@ def download_documents(driver: webdriver.WebDriver, meetings: List[meeting.Meeti invitation_item = form_elements[2] invitation_link = f"{base_link}?DOLFDNR={invitation_item.find_element_by_name('DOLFDNR').get_property('value')}&options=64" driver.get(agenda_link) - save_pdf(driver.current_url, f"{pdf_location}{meeting.date.isoformat()}-{meeting.name}-Tagesordnung.pdf") + save_pdf(driver.current_url, f"{pdf_location}{meeting.date.isoformat()}_{meeting.name}/Tagesordnung.pdf") driver.get(total_link) - save_pdf(driver.current_url, f"{pdf_location}{meeting.date.isoformat()}-{meeting.name}-Mappe.pdf") + save_pdf(driver.current_url, f"{pdf_location}{meeting.date.isoformat()}_{meeting.name}/Mappe.pdf") driver.get(invitation_link) - save_pdf(driver.current_url, f"{pdf_location}{meeting.date.isoformat()}-{meeting.name}-Einladung.pdf") + save_pdf(driver.current_url, f"{pdf_location}{meeting.date.isoformat()}_{meeting.name}/Einladung.pdf") def save_pdf(url: str, dest: str) -> None: file_data: request = request.urlopen(url) data_to_write = file_data.read() + os.makedirs(os.path.dirname(dest), exist_ok=True) with open(dest, "wb") as file: file.write(data_to_write)