- 论坛徽章:
- 0
|
想按目录下载某个网址下的文件：
from selenium import webdriver
from selenium.webdriver.firefox.options import Options
from bs4 import BeautifulSoup
# Render the page in headless Firefox (driven by geckodriver) and collect
# the href attribute of every <a> element into the list k.
options = Options()
options.headless = True
dr = webdriver.Firefox(executable_path='/usr/lib/firefox/geckodriver', options=options)
try:
    # NOTE: url is not defined in this snippet; it must be set before this point.
    dr.get(url)
    # Use the same name the driver was bound to (dr); the original mixed
    # dr/driver, which raises NameError.
    neirong = dr.page_source
finally:
    # quit() ends the whole session and stops the geckodriver process, even
    # when get() fails; close() would only close the current window.
    dr.quit()

soup = BeautifulSoup(neirong, 'lxml')
# Anchors without an href yield None, exactly as the original loop did.
k = [a.get('href') for a in soup.find_all('a')]
一直出错。已经把 geckodriver 安装到 /usr/lib/firefox 下，运行时提示：
Traceback (most recent call last):
  File "2beautifulsoup.py", line 12, in <module>
    dr=webdriver.Firefox(executable_path='/usr/lib/firefox/geckodriver',options=options)
  File "/usr/local/lib/python3.5/dist-packages/selenium/webdriver/firefox/webdriver.py", line 174, in __init__
    keep_alive=True)
  File "/usr/local/lib/python3.5/dist-packages/selenium/webdriver/remote/webdriver.py", line 157, in __init__
    self.start_session(capabilities, browser_profile)
  File "/usr/local/lib/python3.5/dist-packages/selenium/webdriver/remote/webdriver.py", line 252, in start_session
    response = self.execute(Command.NEW_SESSION, parameters)
  File "/usr/local/lib/python3.5/dist-packages/selenium/webdriver/remote/webdriver.py", line 321, in execute
    self.error_handler.check_response(response)
  File "/usr/local/lib/python3.5/dist-packages/selenium/webdriver/remote/errorhandler.py", line 242, in check_response
    raise exception_class(message, screen, stacktrace)
selenium.common.exceptions.WebDriverException: Message: invalid argument: can't kill an exited process
---------
网上有人说是版本不匹配的问题，也有人说重启一下就好。
|
|