跳转至

多页面抓取

本示例演示如何在同一个会话中按顺序抓取多个页面，并输出每个页面的标题、正文前 100 个字符以及链接数量。

from cdriv import CDriv

# Pages to scrape, visited in the order listed.
urls = [
    "https://site.com/page1",
    "https://site.com/page2",
    "https://site.com/page3",
]

# A single driver and a single session are reused for every page; the
# context manager is exited only after the last URL has been processed.
with CDriv() as browser:
    browser.new_session()

    for page_url in urls:
        browser.navigate(page_url)
        # Presumably waits for the ".content" element to appear before any
        # reads (timeout=10, likely seconds -- confirm against cdriv docs).
        browser.wait_for_element(".content", timeout=10)

        heading = browser.get_text("h1")
        body_text = browser.get_text(".content")
        hrefs = browser.get_all_attributes("a", "href")

        # Per-page summary: heading, the first 100 characters of the text
        # (the "..." suffix is always appended), and the number of hrefs.
        print(f"=== {heading} ===")
        print(f"文本: {body_text[:100]}...")
        print(f"链接数: {len(hrefs)}")
        print()