Ошибка при использовании selenium webdriver (raise exception_class(message, screen, stacktrace))
from selenium import webdriver
from bs4 import BeautifulSoup
import chromedriver_autoinstaller
chromedriver_autoinstaller.install()
driver = webdriver.Chrome()
def main(url="https://ficbook.net/collections/26473868"):
a = scalp(url)
print(a)
for item in a.items():
print(item[1])
print(fic_scalp(item))
def scalp(url="https://ficbook.net/collections/26473868"):
dir = {}
driver.get(url)
page_src = driver.page_source
soup = BeautifulSoup(page_src, 'lxml')
fics = soup.findAll('a', class_='visit-link')
for num, fic in enumerate(fics):
link = 'https://ficbook.net' + fic.get('href')
ln = int(len(str(fic.text)) - 13)
name = str(fic.text)[:ln]
dir[name] = link
return dir
def fic_scalp(url ='https://ficbook.net/readfic/12274255'): # Не работает, ссылка работает в
# качестве примера
dir = {}
driver.get(str(url))
page_src = driver.page_source
soup = BeautifulSoup(page_src, 'lxml')
soup = soup.find('ul', class_='list-unstyled list-of-fanfic-parts clearfix')
parts = soup.findAll('li', class_='part')
for part in parts:
prt = part.find('a', class_='part-link visit-link ')
prt_link = prt.get('href')
prt = part.find('div', class_='part-title word-break')
prt_name = prt.text
dir[prt_name] = prt_link
return dir
if __name__ == "__main__":
# Iter(urls)
main()
Вывод:
Traceback (most recent call last):
File "F:\Py_projects\Educ\py_files\ficbook_scalping\test.py", line 59, in <module>
main()
File "F:\Py_projects\Educ\py_files\ficbook_scalping\test.py", line 14, in main
print(fic_scalp(item))
File "F:\Py_projects\Educ\py_files\ficbook_scalping\test.py", line 39, in fic_scalp
driver.get(str(url))
File "F:\Py_projects\Educ\venv\lib\site-packages\selenium\webdriver\remote\webdriver.py", line 446, in get
{'Сила': 'https://ficbook.net/readfic/12274255', 'Искусство Обмана ': 'https://ficbook.net/readfic/10835428', 'Хогвартский вор': 'https://ficbook.net/readfic/12177843', 'Ведьмак: Путь Дракона': 'https://ficbook.net/readfic/9417582', 'Я не Люк Скайуокер': 'https://ficbook.net/readfic/12436578'}
https://ficbook.net/readfic/12274255
self.execute(Command.GET, {'url': url})
File "F:\Py_projects\Educ\venv\lib\site-packages\selenium\webdriver\remote\webdriver.py", line 434, in execute
self.error_handler.check_response(response)
File "F:\Py_projects\Educ\venv\lib\site-packages\selenium\webdriver\remote\errorhandler.py", line 243, in check_response
raise exception_class(message, screen, stacktrace)
selenium.common.exceptions.InvalidArgumentException: Message: invalid argument
(Session info: chrome=104.0.5112.81)
Stacktrace:
Backtrace:
Ordinal0 [0x0028AF23+2207523]
Ordinal0 [0x002230E1+1781985]
Ordinal0 [0x00133EB0+802480]
Ordinal0 [0x001273F6+750582]
Ordinal0 [0x00125F05+745221]
Ordinal0 [0x001261CD+745933]
Ordinal0 [0x001357B4+808884]
Ordinal0 [0x0018E0AD+1171629]
Ordinal0 [0x0017D5EC+1103340]
Ordinal0 [0x0018D9F2+1169906]
Ordinal0 [0x0017D406+1102854]
Ordinal0 [0x001575F0+947696]
Ordinal0 [0x001584E6+951526]
GetHandleVerifier [0x00532A12+2733954]
GetHandleVerifier [0x00524E28+2677656]
GetHandleVerifier [0x003146EA+513114]
GetHandleVerifier [0x00313796+509190]
Ordinal0 [0x00229CEB+1809643]
Ordinal0 [0x0022E448+1827912]
Ordinal0 [0x0022E535+1828149]
Ordinal0 [0x00237960+1866080]
BaseThreadInitThunk [0x773B6359+25]
RtlGetAppContainerNamedObjectPath [0x776487D4+228]
RtlGetAppContainerNamedObjectPath [0x776487A4+180]
(No symbol) [0x00000000]