import os
import time
from urllib import request
from urllib.parse import urljoin

import requests
from lxml import etree
def huya_spider(url='https://www.huya.com/g/2168#tag2609', save_dir='D:\\img\\', delay=3):
    """Download the cover images found on a Huya listing page.

    The page at *url* is fetched, every ``<img class="pic">`` element is
    located, and the image referenced by its ``data-original`` attribute is
    saved into *save_dir* as ``<n>.png``, where ``n`` is the 1-based position
    of the element on the page.

    Args:
        url: Listing page to scrape.
        save_dir: Directory the images are written to; created if missing.
        delay: Seconds to wait after each download attempt.

    Returns:
        None. Progress and per-image errors are printed to stdout.
    """
    user_agent = "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/76.0.3809.87 Safari/537.36"
    # The HTTP header is spelled "User-Agent" (hyphen), and it only has an
    # effect when the dict is actually handed to requests.get().
    headers = {
        'User-Agent': user_agent,
    }
    # A timeout keeps an unresponsive server from hanging the script forever.
    res = requests.get(url, headers=headers, timeout=30)
    print(res)

    data = etree.HTML(res.text)
    if data is None:
        # Guard: no element tree was produced, so there is nothing to query.
        return

    try:
        os.makedirs(save_dir, exist_ok=True)
    except OSError as e:
        # Without a target directory no download can succeed; report and stop.
        print(e)
        return

    # Numbering follows the element's position on the page, so a skipped or
    # failed image leaves a gap instead of shifting later file names.
    for cnt, woman in enumerate(data.xpath('//img[@class="pic"]'), start=1):
        sources = woman.xpath('./@data-original')
        if not sources:
            # Element carries no lazy-load source; skip it rather than crash.
            continue

        # Drop the query string, then resolve against the page URL so that
        # protocol-relative ("//host/...") links become fetchable.
        img = urljoin(url, sources[0].split("?")[0])
        path2 = os.path.join(save_dir, str(cnt) + ".png")
        try:
            print(img)
            print(path2)
            request.urlretrieve(img, path2)
        except Exception as e:
            # Deliberately broad: one failed image must not stop the others.
            print(e)
        # Throttle between downloads to stay polite to the image server.
        time.sleep(delay)
# Start the scrape. This is a bare module-level call, so it runs whenever the
# file is executed and also whenever it is imported.
huya_spider()
