"""Download PPT template archives from www.1ppt.com.

Walks the template list pages, opens the download page of every template
found on them, and saves each linked .zip archive into the ``ppt模板``
directory (created on demand).
"""
import re
from pathlib import Path

import requests

# Sample archive link as it appears in a download page:
#   href="https://ppt.1ppt.com/uploads/soft/2209/1-2209201G044.zip
# Sample download page:
#   https://www.1ppt.com/plus/download.php?open=0&aid=97069&cid=3

LIST_PAGE_URL = 'https://www.1ppt.com/xiazai/ppt_xiazai_{page}.html'
DOWNLOAD_PAGE_URL = 'https://www.1ppt.com/plus/download.php?open=0&aid={aid}&cid=3'

# List pages 1..14, the same range the script has always walked.
LIST_PAGES = range(1, 15)

# Directory the archives are written to.
OUTPUT_DIR = Path('ppt模板')

# Seconds to wait on any single HTTP request before giving up; without a
# timeout `requests` can block forever on a stalled connection.
REQUEST_TIMEOUT = 30

# Request headers that mimic a desktop browser.
HEADERS = {
    'User-Agent': 'Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 '
                  '(KHTML, like Gecko) Chrome/78.0.3904.108 Safari/537.36'
}

# NOTE(review): the HTML markup inside both original regex literals was lost
# (only the "(.*?)" title group of the first one survived), so the two
# patterns below are reconstructions -- confirm them against the live pages.
#
# Must yield (template id, title) pairs from a list page; the id is what gets
# substituted into the `aid` query parameter of the download page.
TEMPLATE_RE = re.compile(r'<h2><a href="/article/(\d+)\.html"[^>]*>(.*?)</a></h2>')
# Must yield the archive URLs from a download page; modelled on the sample
# `href="https://...zip` link quoted above.
ZIP_LINK_RE = re.compile(r'href="([^"]+?\.zip)"')

# Characters that are path separators or are rejected in Windows file names.
_UNSAFE_FILENAME_CHARS = re.compile(r'[\\/:*?"<>|]')


def _safe_filename(name: str) -> str:
    """Return *name* with separator/reserved characters replaced by ``_``."""
    return _UNSAFE_FILENAME_CHARS.sub('_', name)


def _fetch_text(url: str, *, detect_encoding: bool = False) -> str:
    """GET *url* with the browser headers and return the decoded body.

    When *detect_encoding* is true, the response encoding is replaced by the
    one `requests` detects from the content before decoding.
    """
    response = requests.get(url=url, headers=HEADERS, timeout=REQUEST_TIMEOUT)
    if detect_encoding:
        response.encoding = response.apparent_encoding
    return response.text


def main() -> None:
    """Scrape every list page and save the archives of all templates found."""
    OUTPUT_DIR.mkdir(exist_ok=True)

    # Walk the PPT template list pages.
    for page in LIST_PAGES:
        list_html = _fetch_text(LIST_PAGE_URL.format(page=page), detect_encoding=True)
        print(list_html)  # debug output kept from the original script

        templates = TEMPLATE_RE.findall(list_html)
        print(templates)

        for template_id, title in templates:
            download_html = _fetch_text(DOWNLOAD_PAGE_URL.format(aid=template_id))
            print(download_html)  # debug output kept from the original script

            zip_urls = ZIP_LINK_RE.findall(download_html)
            print(zip_urls)

            # The title comes straight from the scraped page, so it is
            # sanitised before being used as part of a file name.
            target = OUTPUT_DIR / _safe_filename(f'{template_id}{title}.zip')

            # As in the original script, every link found for a template is
            # written to the same path, so a later link overwrites an earlier
            # one.
            for zip_url in zip_urls:
                archive = requests.get(
                    url=zip_url, headers=HEADERS, timeout=REQUEST_TIMEOUT
                ).content
                target.write_bytes(archive)


if __name__ == '__main__':
    main()