Python学习源码分享：批量爬取第1PPT网站PPT模板

"""Bulk-download PPT template archives from www.1ppt.com.

For listing pages 1 through 14 the script extracts ``(article id, title)``
pairs, opens each template's download page, and saves every ``.zip`` archive
linked there as ``ppt模板/<id><title>.zip``.
"""
import re
from pathlib import Path

import requests

# Example archive link as it appears in a download page:
#   href="https://ppt.1ppt.com/uploads/soft/2209/1-2209201G044.zip
# Example download page URL:
#   https://www.1ppt.com/plus/download.php?open=0&aid=97069&cid=3

# Request headers that imitate a desktop browser.
headers = {
    'User-Agent': 'Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/78.0.3904.108 Safari/537.36'
}

# Without a timeout a stalled connection would block the script forever.
REQUEST_TIMEOUT = 30

# Directory that receives the downloaded archives.
OUTPUT_DIR = Path('ppt模板')

# NOTE(review): the original listing pattern was lost when this script was
# extracted from its web page (the HTML inside the string literal was
# stripped; only a "(.*?)" group survived). This reconstruction assumes each
# entry looks like <h2><a href="/article/<id>.html" ...>title</a></h2> --
# confirm against the live page markup.
LIST_ITEM_RE = re.compile(
    r'<h2>\s*<a href="/article/(\d+)\.html"[^>]*>(.*?)</a>\s*</h2>'
)

# NOTE(review): the original download-link pattern was lost the same way.
# This one is modelled on the example archive link quoted above -- confirm
# against a real download page.
ZIP_LINK_RE = re.compile(r'href="(https?://[^"]+\.zip)"')

# Characters that are not allowed in file names on common file systems.
UNSAFE_FILENAME_CHARS_RE = re.compile(r'[\\/:*?"<>|]')

# The original wrote into the directory without ever creating it.
OUTPUT_DIR.mkdir(parents=True, exist_ok=True)

# Walk the template listing pages.
for i in range(1, 15):
    url = f'https://www.1ppt.com/xiazai/ppt_xiazai_{i}.html'
    # Fetch the listing page.
    respons = requests.get(url=url, headers=headers, timeout=REQUEST_TIMEOUT)
    # Let requests detect the page encoding from the content.
    respons.encoding = respons.apparent_encoding
    print(respons.text)
    data_list = LIST_ITEM_RE.findall(respons.text)
    print(data_list)
    for template_id, title in data_list:
        url_1 = f'https://www.1ppt.com/plus/download.php?open=0&aid={template_id}&cid=3'
        respons_1 = requests.get(url=url_1, headers=headers, timeout=REQUEST_TIMEOUT)
        print(respons_1.text)
        zip_url = ZIP_LINK_RE.findall(respons_1.text)
        print(zip_url)
        # Build the target path with pathlib: the original literal 'ppt模板\'
        # escaped its own closing quote and did not even parse.
        safe_title = UNSAFE_FILENAME_CHARS_RE.sub('_', title)
        target = OUTPUT_DIR / f'{template_id}{safe_title}.zip'
        # Every link of one template is written to the same file, so a repeated
        # link would only be downloaded twice; drop duplicates, keeping order.
        for archive_url in dict.fromkeys(zip_url):
            archive = requests.get(
                url=archive_url, headers=headers, timeout=REQUEST_TIMEOUT
            )
            if not archive.ok:
                # Do not store an HTTP error page under a .zip name.
                print(f'skip {archive_url}: HTTP {archive.status_code}')
                continue
            target.write_bytes(archive.content)