import os
import requests
import re
# Scrape one listing page and save every thumbnail image it references
# into the local ./qiutu directory.

# Browser-like User-Agent header sent with every request.
headers = {
    'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/96.0.4664.45 Safari/537.36'
}

# Seconds to wait for the server before giving up; without a timeout a
# stalled connection would block the script indefinitely.
REQUEST_TIMEOUT = 10

# exist_ok=True avoids the check-then-create race of exists() + mkdir().
os.makedirs('./qiutu', exist_ok=True)

# NOTE(review): this URL looks elided ('...'); confirm the real listing path.
url = 'https://www.qiushibaike.com/i...'
page_response = requests.get(url=url, headers=headers, timeout=REQUEST_TIMEOUT)
# Fail loudly on 4xx/5xx instead of regex-scanning an error page.
page_response.raise_for_status()
page_data = page_response.text

# Capture the src attribute of the <img> inside each <div class="thumb">.
# re.S lets '.' match newlines because the markup spans several lines.
ex = r'<div class="thumb">.*?<img src="(.*?)" alt.*?</div>'
img_src_list = re.findall(ex, page_data, re.S)

for src in img_src_list:
    # Matches are presumably protocol-relative ('//host/path'), hence the
    # 'https:' prefix; leave an already-absolute URL untouched.
    if src.startswith(('http://', 'https://')):
        img_url = src
    else:
        img_url = 'https:' + src

    # The last path segment is used as the local file name.
    img_name = img_url.split('/')[-1]
    if not img_name:
        # A URL ending in '/' yields no file name; opening the directory
        # path itself for writing would raise.
        continue

    try:
        img_response = requests.get(
            url=img_url, headers=headers, timeout=REQUEST_TIMEOUT
        )
        img_response.raise_for_status()
    except requests.RequestException as err:
        # One broken image should not abort the remaining downloads.
        print('skipped ' + img_url + ': ' + str(err))
        continue

    imgpath = './qiutu/' + img_name
    with open(imgpath, 'wb') as fp:
        fp.write(img_response.content)

print("图片爬取完成")