虎牙爬虫：抓取页面图片并保存到同级目录下的 English_name_image 文件夹

import os
import string
from itertools import combinations
from urllib.parse import urljoin
from urllib.request import urlretrieve

import requests
from lxml import etree
# Pool of two-letter names: every pair of distinct lowercase letters taken in
# alphabetical order ("ab", "ac", ..., "yz").
l = string.ascii_lowercase
ll = [first + second for first, second in combinations(l, 2)]

# Page to scrape and the browser-like User-Agent sent with the request.
url = "https://www.huya.com/g/4079"
headers = {
    "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/87.0.4280.88 Safari/537.36 Edg/87.0.664.57"
}

# Images are written here (relative to the current working directory).
# Create it up front: urlretrieve does not create missing directories.
output_dir = 'English_name_image'
os.makedirs(output_dir, exist_ok=True)

# A timeout keeps the script from hanging forever on a stalled connection;
# raise_for_status stops us from parsing an HTTP error page as if it were
# the real listing.
resp = requests.get(url=url, headers=headers, timeout=10)
resp.raise_for_status()
data = etree.HTML(resp.content)

# Every <img class="pic"> is a candidate; the real image URL is read from its
# "data-original" attribute.
friends_list = data.xpath('//img[@class="pic"]')
for j, friend in enumerate(friends_list):
    sources = friend.xpath('./@data-original')
    if not sources:
        # No data-original attribute on this <img>: nothing to download.
        continue
    # Drop the query string, then resolve against the page URL so that
    # protocol-relative ("//host/path") or relative links become absolute.
    img = urljoin(url, sources[0].split('?')[0])
    # The j-th image on the page gets the j-th two-letter name from ``ll``.
    urlretrieve(img, os.path.join(output_dir, ll[j] + '.png'))

你可能感兴趣的:(虎牙爬虫 并保存到 同级目录 English_name_image文件夹下)