# Practice: working with a drop-down menu (Select)
from selenium import webdriver
from selenium.webdriver.common.action_chains import ActionChains
from selenium.webdriver.support.select import Select
import time
# Drop-down menu practice: choose an entry of a drop-down element through
# Selenium's Select helper, i.e.
#     Select(sel).select_by_index(2)
driver = webdriver.Chrome(r"C:\Users\xxxx\Desktop\chromedriver.exe")
try:
    driver.get("https://www.baidu.com")
    time.sleep(3)

    # Move the mouse over the "设置" link before clicking "搜索设置";
    # presumably the hover is what makes that second link available.
    settings_link = driver.find_element_by_link_text(u"设置")
    ActionChains(driver).move_to_element(settings_link).perform()
    time.sleep(1)

    driver.find_element_by_link_text("搜索设置").click()
    time.sleep(1)

    # Wrap the element with id "nr" in Select and pick its option with index 2.
    sel = driver.find_element_by_id("nr")
    Select(sel).select_by_index(2)
    time.sleep(2)
finally:
    # quit() (rather than close()) ends the whole driver session, and the
    # finally clause guarantees that happens even if a lookup above fails.
    driver.quit()
# Practice: downloading a file
from selenium import webdriver
import time
# file_down: download a file with Chrome into a directory chosen through
# Chrome preferences instead of the browser's default download folder.
import os

# Chrome's "download.default_directory" preference is expected to be an
# absolute path, so resolve the current working directory explicitly.
download_dir = os.path.abspath(".")

options = webdriver.ChromeOptions()
prefs = {
    "profile.default_content_setting.popups": 0,
    "download.default_directory": download_dir,
}
options.add_experimental_option("prefs", prefs)

# The options object has to be handed to the driver. Without it the file was
# still downloaded, but into Chrome's own default directory
# (C:\Users\xxxx\Downloads) rather than the directory configured above.
driver = webdriver.Chrome(
    r"C:\Users\xxxx\Desktop\chromedriver.exe",
    options=options,
)
try:
    driver.get("https://pypi.org/project/selenium/#files")
    driver.find_element_by_link_text("selenium-3.141.0.tar.gz").click()
    # Keep the browser open for a while so the download can proceed.
    time.sleep(10)
finally:
    # quit() ends the whole driver session; finally makes sure this also
    # happens when the page load or the link lookup raises.
    driver.quit()
# Practice: scrape every ip:port pair listed on kuaidaili (free proxy list)
from selenium import webdriver
import time
# Visit the numbered free-proxy listing pages and print every table row as
# "ip:port" (first and second cell of each row).
driver = webdriver.Chrome(r"C:\Users\xxxx\Desktop\chromedriver.exe")
try:
    for i in range(100):
        page = i + 1
        url = "https://www.kuaidaili.com/free/inha/" + str(page) + "/"
        driver.get(url)
        time.sleep(1)

        for row in driver.find_elements_by_xpath("//tbody//tr"):
            ip = row.find_element_by_xpath("./td[1]").text
            port = row.find_element_by_xpath("./td[2]").text
            print(ip + ":" + port)

        print("第" + str(page) + "页下载完成")
        # NOTE(review): this break stops the crawl after the first page even
        # though the loop is set up for 100 pages -- presumably a limiter left
        # in for testing. Remove it to walk through all pages.
        break
finally:
    # One browser is reused for all pages and released exactly once, even if
    # a page load or an element lookup raises.
    driver.quit()