-
Notifications
You must be signed in to change notification settings - Fork 1
/
SeleniumPDFdownloader.py
47 lines (35 loc) · 1.88 KB
/
SeleniumPDFdownloader.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
#***TESTED ON UBUNTU 18*******
from selenium import webdriver
from selenium.webdriver.common.keys import Keys
from selenium.webdriver.common.by import By
from selenium.webdriver.support.ui import WebDriverWait
from selenium.webdriver.support import expected_conditions as EC
from selenium.common.exceptions import TimeoutException
import urllib, os, urllib.request
import time
# Drive Firefox through a fixed click sequence on a page, once per list entry,
# so that each linked PDF is saved straight to disk without a download prompt.
# Background on the Firefox preferences used below:
# https://stackoverflow.com/questions/23800195/auto-download-pdf-in-firefox

# ---------------------------------------------------------------------------
# User configuration
# ---------------------------------------------------------------------------
# ENTER DOWNLOAD PATH HERE:
DOWNLOAD_DIR = "/home/USER/Downloads/"
# Insert your own URL
START_URL = "INSERT URL HERE"
# The loop clicks the sub-list entries li[FIRST_ITEM] .. li[LAST_ITEM].
FIRST_ITEM = 1
LAST_ITEM = 55
# Seconds to wait for an element to become clickable before giving up.
CLICK_TIMEOUT = 30

# Replace the paths below with the XPaths of where to click.
_LIST_ROOT = '/html/body/div/div[1]/div/main/article/div/div/div/div[6]'
OPEN_LIST_XPATH = _LIST_ROOT + '/div[1]'
OPEN_SECTION_XPATH = _LIST_ROOT + '/ul/li[24]/div'
ITEM_LINK_XPATH = _LIST_ROOT + '/ul/li[24]/ul/li[{index}]/a'
PDF_LINK_XPATH = '/html/body/div/div[1]/div/main/article/div/div/div/p[1]/a'


def _click_when_ready(browser, xpath, timeout=CLICK_TIMEOUT):
    """Wait until the element at *xpath* is clickable, then click it.

    Args:
        browser: the WebDriver instance to operate on.
        xpath: XPath locator of the element to click.
        timeout: maximum number of seconds to wait for the element.

    Raises:
        TimeoutException: if the element is not clickable within *timeout*
            seconds (raised by ``WebDriverWait.until``).
    """
    target = WebDriverWait(browser, timeout).until(
        EC.element_to_be_clickable((By.XPATH, xpath))
    )
    target.click()


options = webdriver.FirefoxOptions()
# Only honoured by Selenium releases that still expose the `headless`
# option property; the browser window is shown either way.
options.headless = False

# A fresh, throw-away profile carrying the download preferences. To reuse an
# existing Firefox profile instead, pass its directory to FirefoxProfile(...).
profile = webdriver.FirefoxProfile()
# 2 = save to the directory given in browser.download.dir.
profile.set_preference("browser.download.folderList", 2)
profile.set_preference("browser.download.manager.showWhenStarting", False)
profile.set_preference("browser.download.dir", DOWNLOAD_DIR)
# Save PDFs without showing the "open or save" dialog ...
profile.set_preference("browser.helperApps.neverAsk.saveToDisk", "application/pdf")
# ... and keep the built-in viewer from opening them in a tab instead.
profile.set_preference("pdfjs.disabled", True)

# Attach the profile through the options object: passing it positionally to
# webdriver.Firefox() is rejected by recent Selenium 4 releases.
options.profile = profile
driver = webdriver.Firefox(options=options)
driver.maximize_window()

for i in range(FIRST_ITEM, LAST_ITEM + 1):
    # Start from the landing page every time so the absolute XPaths resolve
    # against the same DOM on each iteration.
    driver.get(START_URL)
    _click_when_ready(driver, OPEN_LIST_XPATH)
    _click_when_ready(driver, OPEN_SECTION_XPATH)
    _click_when_ready(driver, ITEM_LINK_XPATH.format(index=i))
    _click_when_ready(driver, PDF_LINK_XPATH)

# NOTE: the browser is intentionally left open (as before) so that the last
# download is not cut off; close it manually once the files have finished.