From cae39c4494b89c3790a8052830769373a91da66b Mon Sep 17 00:00:00 2001 From: frankknoll Date: Fri, 13 May 2022 00:22:38 +0200 Subject: [PATCH] refactoring --- src/HowBadIsMyBatch.ipynb | 31 +++++++++++++++++++++---------- 1 file changed, 21 insertions(+), 10 deletions(-) diff --git a/src/HowBadIsMyBatch.ipynb b/src/HowBadIsMyBatch.ipynb index c93bcb6d209..b18d39c17e7 100644 --- a/src/HowBadIsMyBatch.ipynb +++ b/src/HowBadIsMyBatch.ipynb @@ -99,25 +99,36 @@ "from selenium.webdriver.chrome.options import Options\n", "from selenium.webdriver.common.by import By\n", "\n", - "downloadDir = \"/home/frankknoll/Dokumente/Corona/projects/HowBadIsMyBatch/src/VAERS/tmp\"\n", - "file2Download = '2022VAERSData.zip'\n", - "captchaImageFile = 'captchaImage.jpeg'\n", - "\n", - "def getWebDriver(downloadDir):\n", + "def _getOptions(downloadDir, isHeadless):\n", " options = Options()\n", + " options.headless = isHeadless\n", " options.add_experimental_option(\"prefs\", {\"download.default_directory\" : downloadDir})\n", + " return options\n", + "\n", + "def getWebDriver(downloadDir, isHeadless):\n", " return webdriver.Chrome(\n", " service = ChromeService(executable_path = ChromeDriverManager().install()),\n", - " options = options)\n", - "\n", - "driver = getWebDriver(downloadDir)\n", - "driver.get('https://vaers.hhs.gov/eSubDownload/index.jsp?fn=' + file2Download)\n", + " options = _getOptions(downloadDir, isHeadless))\n", "\n", "def saveCaptchaImageAs(captchaImageFile):\n", " captchaImage = driver.find_element(By.CSS_SELECTOR, \"img[src='captchaImage']\")\n", " with open(captchaImageFile, 'wb') as file:\n", - " file.write(captchaImage.screenshot_as_png)\n", + " file.write(captchaImage.screenshot_as_png)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "8ac81845", + "metadata": {}, + "outputs": [], + "source": [ + "downloadDir = \"/home/frankknoll/Dokumente/Corona/projects/HowBadIsMyBatch/src/VAERS/tmp\"\n", + "file2Download = '2022VAERSData.zip'\n", + "captchaImageFile = 'captchaImage.jpeg'\n", "\n", + "driver = getWebDriver(downloadDir, isHeadless = False)\n", + "driver.get('https://vaers.hhs.gov/eSubDownload/index.jsp?fn=' + file2Download)\n", "saveCaptchaImageAs(captchaImageFile)" ] },