Многостраничный парсинг¶
Пример последовательного парсинга нескольких страниц.
from cdriv import CDriv
urls = [
"https://site.com/page1",
"https://site.com/page2",
"https://site.com/page3",
]
with CDriv() as driver:
driver.new_session()
for url in urls:
driver.navigate(url)
driver.wait_for_element(".content", timeout=10)
title = driver.get_text("h1")
text = driver.get_text(".content")
links = driver.get_all_attributes("a", "href")
print(f"=== {title} ===")
print(f"Текст: {text[:100]}...")
print(f"Ссылок найдено: {len(links)}")
print()