import os
import re

import requests
from lxml import html
# Browser-like headers sent with every request (listing pages and images).
headers = {
    'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/96.0.4664.93 Safari/537.36'
}

BASE_URL = 'https://pic.netbian.com'
# The first listing page lives at BASE_URL + '/4kmeinv/' and uses a different
# URL shape; it is deliberately skipped to keep the script short.
PAGE_URL_TEMPLATE = BASE_URL + '/4kmeinv/index_{}.html'
FIRST_PAGE = 2
LAST_PAGE = 136  # inclusive
# Absolute directory the images are written to.
SAVE_DIR = 'C:/Users/Administrator/PycharmProjects/pythonProject/img/'
# The listing pages are served as GBK; decoding them explicitly avoids the
# fragile encode('iso-8859-1').decode('gbk') round-trip on every title.
PAGE_ENCODING = 'gbk'
REQUEST_TIMEOUT = 10  # seconds, applied to every HTTP request

# Characters that are not allowed in Windows file names, plus control chars.
INVALID_FILENAME_CHARS = re.compile(r'[\\/:*?"<>|\x00-\x1f]')


def build_page_url(page):
    """Return the URL of listing page number *page*."""
    return PAGE_URL_TEMPLATE.format(page)


def sanitize_filename(title):
    """Return *title* with characters unsafe for file names replaced by '_'.

    Surrounding whitespace is stripped; an empty result becomes 'untitled'.
    """
    cleaned = INVALID_FILENAME_CHARS.sub('_', title).strip()
    return cleaned or 'untitled'


def extract_images(page_html):
    """Parse one listing page and return a list of (image_url, title) pairs.

    List items without an image source are skipped. When the alt text is
    missing, the base name of the image file is used as the title instead.
    """
    if not page_html.strip():
        # lxml raises on an empty document; treat it as "no images".
        return []
    tree = html.fromstring(page_html)
    found = []
    for item in tree.xpath('/html//div[@class="slist"]//li'):
        sources = item.xpath('./a/img/@src')
        if not sources:
            continue
        src = sources[0]
        titles = item.xpath('./a/img/@alt')
        if titles:
            title = titles[0]
        else:
            title = os.path.splitext(os.path.basename(src))[0]
        found.append((BASE_URL + src, title))
    return found


def download_image(session, img_url, title, save_dir=SAVE_DIR):
    """Download *img_url* and store it as '<title>.jpg' inside *save_dir*.

    Args:
        session: a ``requests.Session`` used to perform the request.
        img_url: absolute URL of the image.
        title: human-readable image title; sanitized before use as file name.
        save_dir: destination directory (must already exist).

    Returns:
        The path of the written file.

    Raises:
        requests.RequestException: on network errors or a non-2xx status.
        OSError: if the file cannot be written.
    """
    response = session.get(img_url, timeout=REQUEST_TIMEOUT)
    response.raise_for_status()
    filename = os.path.join(save_dir, sanitize_filename(title) + '.jpg')
    with open(filename, 'wb') as fp:
        fp.write(response.content)
    return filename


def main():
    """Walk the listing pages and save every image found to SAVE_DIR.

    A page or image that fails to download is reported on stderr and
    skipped, so one bad request does not abort the whole run.
    """
    import sys

    os.makedirs(SAVE_DIR, exist_ok=True)
    with requests.Session() as session:
        session.headers.update(headers)
        for page in range(FIRST_PAGE, LAST_PAGE + 1):
            url = build_page_url(page)
            try:
                response = session.get(url, timeout=REQUEST_TIMEOUT)
                response.raise_for_status()
            except requests.RequestException as exc:
                print(url, 'page request failed:', exc, file=sys.stderr)
                continue
            # Decode as GBK regardless of what the HTTP headers claim.
            response.encoding = PAGE_ENCODING
            for img_url, title in extract_images(response.text):
                try:
                    filename = download_image(session, img_url, title)
                except (requests.RequestException, OSError) as exc:
                    print(img_url, 'download failed:', exc, file=sys.stderr)
                    continue
                print(filename, '保存成功')


if __name__ == '__main__':
    main()