我是使用Python进行网页抓取的新手。我的目的是检索所关注单词的动词。例如dictionary.com针对单词的不同词性定义,我想输入一个感兴趣的单词,然后点击搜索图标,在结果页面中,我想提取标题“动词”下的信息。
我为此安装了硒
但是我得到了错误:
WebDriverException: Message: invalid argument: can't kill an exited process.
我有Firefox版本> 60,Selenium 3.141.0,geckodriver 0.26和Python 2.7(与Python 3.3一起尝试,但得到相同的错误)。
from selenium import webdriver
from selenium.common.exceptions import TimeoutException
from selenium.webdriver.support.ui import WebDriverWait # available since 2.4.0
from selenium.webdriver.support import expected_conditions as EC # available since 2.26.0
# Create a new instance of the Firefox driver
driver = webdriver.Firefox()
我的geckodriver位于PATH定义的文件夹中
WebDriverExceptionTraceback (most recent call last)
<ipython-input-7-55833ccbae5a> in <module>()
8
9 # Create a new instance of the Firefox driver
---> 10 driver = webdriver.Firefox(executable_path=r'../webscraping/geckodriver')
11
12 # go to the google home page
../site-packages/selenium/webdriver/firefox/webdriver.pyc in __init__(self,firefox_profile,firefox_binary,timeout,capabilities,proxy,executable_path,options,service_log_path,firefox_options,service_args,desired_capabilities,log_path,keep_alive)
172 command_executor=executor,173 desired_capabilities=capabilities,--> 174 keep_alive=True)
175
176 # Selenium remote
../site-packages/selenium/webdriver/remote/webdriver.pyc in __init__(self,command_executor,browser_profile,keep_alive,file_detector,options)
155 warnings.warn("Please use FirefoxOptions to set browser profile",156 DeprecationWarning,stacklevel=2)
--> 157 self.start_session(capabilities,browser_profile)
158 self._switch_to = SwitchTo(self)
159 self._mobile = Mobile(self)
../site-packages/selenium/webdriver/remote/webdriver.pyc in start_session(self,browser_profile)
250 parameters = {"capabilities": w3c_caps,251 "desiredCapabilities": capabilities}
--> 252 response = self.execute(Command.NEW_SESSION,parameters)
253 if 'sessionId' not in response:
254 response = response['value']
../site-packages/selenium/webdriver/remote/webdriver.pyc in execute(self,driver_command,params)
319 response = self.command_executor.execute(driver_command,params)
320 if response:
--> 321 self.error_handler.check_response(response)
322 response['value'] = self._unwrap_value(
323 response.get('value',None))
../site-packages/selenium/webdriver/remote/errorhandler.pyc in check_response(self,response)
240 alert_text = value['alert'].get('text')
241 raise exception_class(message,screen,stacktrace,alert_text)
--> 242 raise exception_class(message,stacktrace)
243
244 def _value_or_default(self,obj,key,default):
WebDriverException: Message: invalid argument: can't kill an exited process