python网络爬虫(第七章:无头浏览器+规避检测)

案例

from selenium import webdriver
from time import sleep
#实现无可视化界面(其实就是后台运行,不要显示在显示屏上面)
from selenium.webdriver.chrome.options import Options
#实现规避检测
from selenium.webdriver import ChromeOptions

#1.实现无可视化界面的操作
chrome_options = Options()
chrome_options.add_argument('--headless')
chrome_options.add_argument('--disable-gpu')

#2.实现规避检测
option = ChromeOptions()
option.add_experimental_option('excludeSwitches',['enable-automation'])


driver = webdriver.Chrome('./chromedriver.exe',chrome_options=chrome_options,options=option)

driver.get('https://www.baidu.com')

sleep(5)
print(driver.page_source)
driver.quit()

无头浏览器

step1:导包 from selenium.webdriver.chrome.options import Options
step2:实现无可视化界面的操作
	chrome_options = Options()
	chrome_options.add_argument('--headless')
	chrome_options.add_argument('--disable-gpu')
step3:在服务器对象中添加数据
	driver = webdriver.Chrome('./chromedriver.exe',chrome_options=chrome_options)  #之前是driver = webdriver.Chrome('./chromedriver.exe')

规避检测

step1:导包 from selenium.webdriver import ChromeOptions
step2:实现规避规则
	option = ChromeOptions()
	option.add_experimental_option('excludeSwitches',['enable-automation'])
step3:添加数据
	driver = webdriver.Chrome('./chromedriver.exe',chrome_options=chrome_options,options=option)   #之前driver = webdriver.Chrome('./chromedriver.exe')

版权声明:本文为qq_38633279原创文章,遵循CC 4.0 BY-SA版权协议,转载请附上原文出处链接和本声明。