使用 Selenium 操作 Firefox 浏览器自动采集网页


主要代码:

import os

from selenium import webdriver
from selenium.webdriver.common.by import By


def main():
    """Download pages 300 down to 1 and save each one's rendered HTML.

    Firefox is started with an existing user profile, each
    ``https://www.abc.com/page-<n>.html`` URL is loaded in turn, and the
    browser's page source is written to ``html/<n>.html`` (UTF-8).

    The output directory is created if it is missing, each output file is
    overwritten rather than appended to, and the browser is always shut
    down, even when a page load or a file write fails.
    """
    output_dir = 'html/'
    # Create the target directory up front so a missing folder fails (or is
    # fixed) before a browser process is launched.
    os.makedirs(output_dir, exist_ok=True)

    firefox_profile = webdriver.FirefoxProfile(
        "C:\\Users\\Admin\\AppData\\Roaming\\Mozilla\\Firefox\\Profiles\\admin.default-esr")
    # Hand the profile over through Options: the ``firefox_profile=`` keyword
    # of ``webdriver.Firefox`` is deprecated in Selenium 4 and rejected by
    # newer releases, while ``options=`` works on both old and new versions.
    options = webdriver.FirefoxOptions()
    options.profile = firefox_profile
    browser = webdriver.Firefox(options=options)

    try:
        # Walk the pages from the highest number down to 1.
        for page in range(300, 0, -1):
            url = 'https://www.abc.com/page-{}.html'.format(page)
            browser.get(url)
            # mode='w': a re-run replaces the previous snapshot instead of
            # appending a second copy of the document to the same file.
            with open(file=output_dir + str(page) + '.html', mode='w', encoding='utf-8') as f:
                f.write(browser.page_source)
    finally:
        # Always release the Firefox process, including on errors.
        browser.quit()


# Run the scraper only when this file is executed as a script, not on import.
if __name__ == '__main__':
    main()