import re
import requests
headers = {
'user-agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/68.0.3440.106 Safari/537.36'
}
url = "https://www.bilibili.com/"
response = requests.get(url,headers=headers)
html = response.text
pattern = re.compile(r"<div.*?groom-module home-card.*?<img.*?src=(.*?)alt",re.S)
items = re.findall(pattern,html)
i = 0
for item in items:
item = "http:"+ re.sub('"','',item)
r = requests.get(item)
with open("D:\\TEST\\"+str(i)+'.jpg','wb') as f :
f.write(r.content)
print("图片:"+str(i)+'.jpg'+"写入成功!")
i+=1
B站首页情况:
运行结果:
转载于:https://www.cnblogs.com/shuimohei/p/10335750.html