看到好看的图片了
python:
"""
"""
import io,os,re,requests
from PIL import Image
from io import BytesIO
import ssl
# NOTE(review): this swaps the stdlib's default HTTPS context factory for the
# unverified one, which turns certificate checking off process-wide for
# urllib / http.client. It is kept because the original script did it, but it
# is a security smell. As far as I can tell `requests` performs its own
# verification and does not consult this hook -- confirm, then consider
# removing the line.
ssl._create_default_https_context = ssl._create_unverified_context

# First listing page to crawl.
START_URL = 'https://img.fghrsh.net/explore/recent/?list=images&page=1&seek=nZLx0'
# Number of listing pages to walk (one output folder per page).
MAX_PAGES = 40
# Seconds to wait on any single HTTP request before giving up.
REQUEST_TIMEOUT = 30

# Captures the value of every `img src="..."` that is directly followed by an
# `alt` attribute.
_IMG_SRC_RE = re.compile(r'img src="(.*?)" alt')
# Captures the href of the "next page" pagination link. The seek token class is
# [a-zA-Z0-9]; the original `A-z` range also matched `[ \ ] ^ _` and backtick.
_NEXT_PAGE_RE = re.compile(
    r'<a data-pagination="next" href="'
    r'(https://img\.fghrsh\.net/explore/recent/\?list=images'
    r'&page=[0-9]{1,2}&seek=[a-zA-Z0-9]{5})"'
)


def extract_image_urls(html):
    """Return the image URLs found in a listing page.

    Every ``img src="..." alt`` occurrence is collected, the ``.md`` marker is
    removed from each URL, and the final match is discarded.

    Args:
        html: Text of the listing page.

    Returns:
        A list of URL strings in document order (possibly empty).
    """
    urls = [src.replace('.md', '') for src in _IMG_SRC_RE.findall(html)]
    # The original script always threw away the last match; that behaviour is
    # preserved here. NOTE(review): presumably the last <img> on the page is
    # not a gallery picture -- confirm against the live markup.
    return urls[:-1]


def find_next_page_url(html):
    """Return the URL of the next listing page, or None when there is none.

    Args:
        html: Text of the listing page.

    Returns:
        The href of the first ``data-pagination="next"`` link that matches the
        expected URL shape, or ``None`` if no such link exists.
    """
    match = _NEXT_PAGE_RE.search(html)
    return match.group(1) if match else None


def download_image(image_url, img_path):
    """Fetch one image and write it to ``img_path``.

    The output format is chosen by Pillow from the file extension.

    Raises:
        requests.RequestException: on network failure or a non-2xx response.
        OSError: if the payload cannot be decoded or written as an image.
    """
    response = requests.get(image_url, timeout=REQUEST_TIMEOUT)
    response.raise_for_status()
    image = Image.open(io.BytesIO(response.content))
    image.save(img_path)


def main():
    """Walk up to MAX_PAGES listing pages and save their images.

    Images from page N are written to ``<cwd>/pic/N/001.png``, ``002.png``, ...
    where the number is the image's 1-based position on the page. URLs
    containing ``gif`` or the "suspected violation" marker are skipped. The
    crawl stops early when a page has no next-page link.
    """
    print("开始-->>>>")
    url = START_URL
    for page_number in range(1, MAX_PAGES + 1):
        # One folder per page, created up front so saving never hits a missing
        # directory.
        page_dir = os.path.join(os.getcwd(), 'pic', str(page_number))
        os.makedirs(page_dir, exist_ok=True)

        print("当前url", url)
        r = requests.get(url, timeout=REQUEST_TIMEOUT)
        r.raise_for_status()
        r.encoding = 'utf-8'
        data = r.text

        image_urls = extract_image_urls(data)
        print("fir:", image_urls)
        for idx, image_url in enumerate(image_urls):
            if 'gif' in image_url:
                print('出现gif')
                continue
            if '涉嫌违规' in image_url:
                print('出现违规')
                continue
            print('url', image_url)
            img_path = os.path.join(page_dir, str(idx + 1).zfill(3) + '.png')
            print('img_path', img_path)
            try:
                download_image(image_url, img_path)
            except (requests.RequestException, OSError) as err:
                # One broken image should not abort the whole crawl.
                print('skipped', image_url, err)

        next_url = find_next_page_url(data)
        print('nexturl', next_url)
        if next_url is None:
            # No pagination link: this was the last page.
            break
        url = next_url


if __name__ == "__main__":
    main()