import re
import threading
from urllib import request
import time
from selenium import webdriver
from selenium.webdriver.common.keys import Keys
from selenium.webdriver.support.select import Select
def openURL():
    """Load the Baidu home page in PhantomJS and print its HTML source.

    The driver is always shut down before returning, even when loading the
    page fails, so no headless browser process is left behind.
    """
    driver = webdriver.PhantomJS()
    try:
        driver.get("http://www.baidu.com")
        print(driver.page_source)
    finally:
        # quit() ends the whole browser session, not just the current window.
        driver.quit()
def sendSearch():
    """Open python.org in Chrome, submit the query "pycon" and print the page.

    The query is typed into the element named "q" (presumably the site's
    search input - confirm against the live page) and submitted with RETURN.

    Raises:
        AssertionError: if the loaded page title does not contain "Python".
    """
    driver = webdriver.Chrome()
    try:
        driver.get("http://www.python.org")
        # Explicit raise instead of `assert` so the check survives `python -O`;
        # the exception type is unchanged for existing callers.
        if "Python" not in driver.title:
            raise AssertionError("unexpected page title: %r" % (driver.title,))
        elem = driver.find_element_by_name("q")
        elem.send_keys("pycon")
        elem.send_keys(Keys.RETURN)
        print(driver.page_source)
    finally:
        # Always release the browser, including when the title check fails.
        driver.quit()
def getElement():
    """Open Baidu in Chrome and type a query into the element with id "kw".

    The browser is left open when the function returns.
    """
    browser = webdriver.Chrome()
    browser.get("http://www.baidu.com")
    # A single send_keys call delivers the text followed by the RETURN key.
    browser.find_element_by_id("kw").send_keys("海贼王", Keys.RETURN)
def getForm():
    """Drive a <select> element and click a submit control on the Baidu page.

    Looks up the element named "name", wraps it in ``Select``, picks the
    option at index 1, clears every selection, then clicks the element whose
    id is "submit". The browser is left open afterwards.
    """
    browser = webdriver.Chrome()
    browser.get("http://www.baidu.com")

    dropdown = Select(browser.find_element_by_name('name'))
    dropdown.select_by_index(1)
    # NOTE(review): this undoes the selection made on the previous line, and
    # per the Selenium docs it is only supported on multi-selects - confirm
    # that this sequence is intended.
    dropdown.deselect_all()

    submit_button = browser.find_element_by_id("submit")
    submit_button.click()
def Cookies():
    """Add a cookie on example.com in Chrome and return the session's cookies.

    Returns:
        Whatever ``driver.get_cookies()`` yields after the cookie
        ``{"name": "foo", "value": "bar"}`` has been added. Previously this
        result was computed and thrown away, so the function returned None.
    """
    driver = webdriver.Chrome()
    try:
        driver.get("http://www.example.com")
        driver.add_cookie({"name": "foo", "value": "bar"})
        return driver.get_cookies()
    finally:
        # Release the browser whether or not the cookie calls succeeded.
        driver.quit()
def downImg(imgUrl, filename):
    """Fetch ``imgUrl`` into the local file ``filename`` and report completion.

    Args:
        imgUrl: URL to retrieve.
        filename: destination path on disk.
    """
    request.urlretrieve(url=imgUrl, filename=filename)
    done_message = "下载完成"
    print(filename, done_message)
# Matches each <img> tag on its own and captures its absolute http(s) src.
# `[^>]*?` keeps the match inside one tag, so several images on the same line
# are all found (a greedy `.*` would only keep the last one).
_IMG_SRC_RE = re.compile(r'<img\b[^>]*?\ssrc="(https?://[^"]+)"')

# Captures the text after a "/" up to and including a known image extension.
_IMG_NAME_RE = re.compile(r".*/(.*\.(?:jpg|jpeg|png|gif|bmp))")


def _extract_image_urls(html):
    """Return the absolute http(s) ``src`` URL of every ``<img>`` tag in html."""
    return _IMG_SRC_RE.findall(html)


def _filename_for(imgUrl, index):
    """Return a local file name for imgUrl; unnamed images get a unique one."""
    match = _IMG_NAME_RE.search(imgUrl)
    if match is not None:
        return match.group(1)
    # The index keeps names distinct when several unnamed images are
    # processed within the same second.
    return "未命名-{}-{}.jpg".format(int(time.time()), index)


def getImage(basepath="E:/PyDownload/"):
    """Scrape image URLs from a fixed Baidu Tieba page and download them.

    Opens the page in Chrome, scrolls down in ten steps (presumably to let
    lazily loaded content appear - confirm), then jumps to the bottom. Every
    ``<img>`` URL found in the page source is downloaded by its own thread
    running ``downImg``, and the function waits for all of them to finish.

    Args:
        basepath: directory that receives the downloaded files; created if
            it does not exist. Defaults to the original hard-coded location.

    Raises:
        OSError: if ``basepath`` cannot be created.
    """
    import os  # local import: only this function needs it

    driver = webdriver.Chrome()
    try:
        driver.maximize_window()
        driver.get("https://tieba.baidu.com/f?kw=%E6%B5%B7%E8%B4%BC%E7%8E%8B&ie=utf-8&pn=550")
        for _ in range(10):
            driver.execute_script("window.scrollBy(0,1000)")
            time.sleep(3)
        driver.execute_script("window.scrollTo(0, document.body.scrollHeight)")
        # Read the source once; the browser is not needed after this point.
        html = driver.page_source
    finally:
        driver.quit()

    print(html)
    reslist = _extract_image_urls(html)
    print(reslist)

    os.makedirs(basepath, exist_ok=True)
    tlist = []
    for i, imgUrl in enumerate(reslist):
        print(imgUrl)
        filename = _filename_for(imgUrl, i)
        print(filename)
        t = threading.Thread(
            target=downImg,
            args=(imgUrl, os.path.join(basepath, filename)),
        )
        try:
            t.start()
        except RuntimeError as e:
            # Could not start another thread: skip this image, keep going.
            print(e)
            continue
        # Only started threads are recorded, so join() below cannot fail on
        # a thread that never ran.
        tlist.append(t)

    for t in tlist:
        t.join()
if __name__ == '__main__':
    # Run the demos one after another, in the original order.
    for demo in (openURL, sendSearch, getElement, getImage):
        demo()