import re
from pathlib import Path

import requests
#fileurl='href="https://ppt.1ppt.com/uploads/soft/2209/1-2209201G044.zip'
#https://www.1ppt.com/plus/download.php?open=0&aid=97069&cid=3
# Crawl the 1ppt.com template listing pages and download every template
# archive they link to.

# Request header that imitates a desktop browser.
HEADERS = {'User-Agent': 'Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/78.0.3904.108 Safari/537.36'}
LIST_URL = 'https://www.1ppt.com/xiazai/ppt_xiazai_{page}.html'
DOWNLOAD_URL = 'https://www.1ppt.com/plus/download.php?open=0&aid={aid}&cid=3'
OUTPUT_DIR = Path('ppt模板')
# Seconds to wait for the server before giving up on a single request.
REQUEST_TIMEOUT = 30

# NOTE(review): the HTML inside both original patterns was lost (the listing
# pattern was an unterminated literal with one group, the archive pattern was
# an empty string). The two patterns below are reconstructions - confirm them
# against the live page markup.
# Listing entry: captures the numeric article id and the template title.
ENTRY_RE = re.compile(r'<h2><a href="/article/(\d+)\.html"[^>]*>(.*?)</a></h2>')
# Archive link: any absolute href ending in .zip, e.g.
# href="https://ppt.1ppt.com/uploads/soft/2209/1-2209201G044.zip"
ZIP_RE = re.compile(r'href="(https?://[^"]+?\.zip)"')
# Characters that are not allowed in file names on common file systems.
UNSAFE_FILENAME_CHARS = re.compile(r'[\\/:*?"<>|]')


def parse_entries(html: str) -> list:
    """Return the ``(article_id, title)`` pairs found in a listing page."""
    return ENTRY_RE.findall(html)


def parse_zip_urls(html: str) -> list:
    """Return the distinct .zip URLs found in a download page, in page order."""
    # dict.fromkeys drops repeated links while keeping first-seen order, so
    # the same archive is not downloaded twice.
    return list(dict.fromkeys(ZIP_RE.findall(html)))


def build_zip_path(aid, title: str, directory: Path = OUTPUT_DIR) -> Path:
    """Return the target path ``<directory>/<aid><title>.zip``.

    Characters that are invalid in file names are replaced by ``_`` so that a
    title such as ``A/B`` cannot break the path.
    """
    safe_title = UNSAFE_FILENAME_CHARS.sub('_', title)
    return directory / f'{aid}{safe_title}.zip'


def fetch(url: str):
    """GET *url* with the browser header; return the response or ``None``.

    Network and HTTP errors are reported and swallowed so that one bad page
    does not abort the whole crawl.
    """
    try:
        response = requests.get(url=url, headers=HEADERS, timeout=REQUEST_TIMEOUT)
        response.raise_for_status()
    except requests.RequestException as exc:
        print(f'request failed for {url}: {exc}')
        return None
    return response


def download_entry(aid, title: str) -> None:
    """Download every archive offered on the download page of article *aid*."""
    page = fetch(DOWNLOAD_URL.format(aid=aid))
    if page is None:
        return
    print(page.text)
    zip_urls = parse_zip_urls(page.text)
    print(zip_urls)
    for zip_url in zip_urls:
        archive = fetch(zip_url)
        if archive is None:
            continue
        target = build_zip_path(aid, title)
        # The output directory may not exist on the first run.
        target.parent.mkdir(parents=True, exist_ok=True)
        with open(target, 'wb') as zip_file:
            zip_file.write(archive.content)


def main(first_page: int = 1, last_page: int = 14) -> None:
    """Walk listing pages *first_page*..*last_page* and download each entry."""
    for page_number in range(first_page, last_page + 1):
        listing = fetch(LIST_URL.format(page=page_number))
        if listing is None:
            continue
        # Let requests detect the page encoding from the body.
        listing.encoding = listing.apparent_encoding
        print(listing.text)
        entries = parse_entries(listing.text)
        print(entries)
        for aid, title in entries:
            download_entry(aid, title)


if __name__ == '__main__':
    main()
