主页 M

Python 面向对象 + XPath:下载包图网预览视频

2020-04-06 网页编程网 网页编程网
# -*- coding: utf-8 -*-
import os
import re

import requests
from lxml import etree
# No JSON endpoint was found among the XHR requests, so the listing HTML pages are scraped directly.
class Spider(object):
    """Scrape ibaotu.com video listing pages and save each preview clip.

    Listing pages are fetched one by one, the preview ``<video>`` sources and
    their titles are extracted with XPath, and every clip is written into
    ``save_dir`` as ``<title>.mp4``.
    """

    # URL template of a listing page; ``{}`` receives the page number.
    page_url = 'https://ibaotu.com/shipin/7-0-0-0-0-{}.html'
    # Directory (relative to the working directory) that receives the clips.
    save_dir = 'video'
    # Seconds to wait on the server before a request is abandoned, so that a
    # stalled connection cannot hang the whole crawl.
    timeout = 30

    @staticmethod
    def _safe_name(title):
        """Return *title* reduced to a string that is usable as a file name.

        Path separators, characters that Windows rejects and control
        characters are replaced by ``_``; surrounding whitespace and dots are
        dropped. An empty result falls back to ``'untitled'``.
        """
        cleaned = re.sub(r'[\\/:*?"<>|\x00-\x1f]', '_', title.strip())
        cleaned = cleaned.strip(' .')
        return cleaned or 'untitled'

    def starr_request(self, first_page=1, last_page=222):
        """Fetch every listing page in the range and download its clips.

        Args:
            first_page: Number of the first listing page to fetch.
            last_page: Number of the last listing page to fetch (inclusive).
        """
        for page in range(first_page, last_page + 1):
            response = requests.get(self.page_url.format(page),
                                    timeout=self.timeout)
            if not response.ok:
                # An error page holds no clips; skip it instead of parsing it.
                print('skip page {} (HTTP {})'.format(page,
                                                      response.status_code))
                continue
            html = etree.HTML(response.content.decode())
            if html is None:
                # The parser may hand back None for an empty document.
                continue
            self.xpath_data(html)

    def xpath_data(self, html):
        """Extract clip URLs and titles from a parsed page and download them.

        Args:
            html: Parsed listing page; any object offering an lxml-style
                ``xpath()`` method.
        """
        src_list = html.xpath('//div[@class="video-play"]/video/@src')
        tit_list = html.xpath('//span[@class="video-title"]/text()')
        if not src_list or not tit_list:
            return

        # Create the target directory up front; open() would not do it.
        os.makedirs(self.save_dir, exist_ok=True)

        # Sources and titles are paired by position, so this relies on the
        # page listing both in the same order.
        for src, tit in zip(src_list, tit_list):
            print(src, tit)
            # ``src`` is normally protocol-relative ("//host/..."); leave an
            # already absolute URL untouched.
            if src.startswith(('http://', 'https://')):
                url = src
            else:
                url = 'http:' + src
            name = self._safe_name(tit) + '.mp4'
            response = requests.get(url, timeout=self.timeout)
            if not response.ok:
                # Do not store an HTML error body under a .mp4 name.
                print('skip {} (HTTP {})'.format(name, response.status_code))
                continue
            print('down' + name)
            with open(os.path.join(self.save_dir, name), 'wb') as f:
                f.write(response.content)

# Run the full crawl only when the file is executed as a script.
if __name__ == '__main__':
    Spider().starr_request()
阅读原文
阅读 3327
123 显示电脑版