admin管理员组文章数量:1516870
requests
```python
# 进行爬取
import requests
import os
from requests_html import HTMLSession#必须使用session = HTMLSession()
# Shared requests_html session used to fetch every listing page.
session = HTMLSession()

# Make sure the output directory exists before any file is written.
os.makedirs('C:/表情包', exist_ok=True)

# Directory prefix (with trailing slash) prepended to every saved file name.
path = 'C:/表情包/'

# Running totals updated by src(): images attempted and images that failed.
a = fail = 0
def save(respone, name):
    """Write raw image bytes to ``path + name + '.jpg'``.

    Args:
        respone: Bytes to write (the parameter name keeps the original
            spelling so existing callers are unaffected).
        name: File name without extension; it is appended to the
            module-level ``path`` prefix.
    """
    # Binary mode: the payload is written exactly as received.
    with open(path + name + '.jpg', 'wb') as f:
        f.write(respone)
def savegif(respone, name):
    """Write raw image bytes to ``path + name + '.gif'``.

    Args:
        respone: Bytes to write (the parameter name keeps the original
            spelling so existing callers are unaffected).
        name: File name without extension; it is appended to the
            module-level ``path`` prefix.
    """
    # Binary mode: the payload is written exactly as received.
    with open(path + name + '.gif', 'wb') as f:
        f.write(respone)
def src(i):
    """Download the images listed on page ``i``.

    Fetches ``'/' + str(i) + '.html'`` through the shared ``session``, then
    checks child positions 1..45 of ``#bqb > div.ui.segment.imghover`` for an
    ``<a><img>`` element. For each image found, the URL in its
    ``data-original`` attribute is downloaded and stored under the image's
    ``title``: via ``save`` when the URL ends in ``jpg``, otherwise via
    ``savegif``.

    The module-level counters ``a`` (slots processed) and ``fail`` (slots
    that raised an error) are updated and printed after every slot.

    Args:
        i: Page number used to build the listing URL.
    """
    global a, fail

    # NOTE(review): the URL has no scheme/host, so the request cannot succeed
    # as written; the site's base URL appears to be missing here. Confirm the
    # intended host and prepend it.
    r = session.get('/' + str(i) + '.html')

    # A separate name for the slot index avoids shadowing the page parameter.
    for slot in range(1, 46):
        div = r.html.find(
            '#bqb > div.ui.segment.imghover > div:nth-child('
            + str(slot) + ') > a > img',
            first=True,
        )
        try:
            # Both attributes are read and echoed before downloading; a
            # missing element or attribute raises here and counts as a failure.
            print(div.attrs['data-original'])
            print(div.attrs['title'])
            title = div.attrs['title']
            link = str(div.attrs['data-original'])
            print(link)
            connet = requests.get(link)
            if link[-3:] == 'jpg':
                save(connet.content, title)
            else:
                savegif(connet.content, title)
        except Exception:
            # Best-effort scraping: record the failure and continue, but let
            # KeyboardInterrupt/SystemExit propagate so the run can be stopped.
            print("没有定位到超链接")
            fail = fail + 1
        a = a + 1
        # '%d' is the integer placeholder; the previous 'd%' raised ValueError.
        print('在下载第%d张' % a)
        print('失败%d张' % fail)


# Walk listing pages 0 through 200.
for page in range(0, 201):
    src(page)

# Page footer from the source article: "Article tag: requests"
版权声明:本文标题:requests 内容由网友自发贡献,该文观点仅代表作者本人, 转载请联系作者并注明出处:https://www.betaflare.com/biancheng/1704549622a628271.html, 本站仅提供信息存储空间服务,不拥有所有权,不承担相关法律责任。如发现本站有涉嫌抄袭侵权/违法违规的内容,一经查实,本站将立刻删除。


发表评论