# -*- coding: utf-8 -*-
import os
import re

import requests
from lxml import etree
# No JSON endpoint was found among the page's XHR requests, so the raw HTML pages are scraped instead.
class Spider(object):
    """Download the videos listed on ibaotu.com listing pages.

    ``starr_request`` walks the numbered listing pages and hands each parsed
    page to ``xpath_data``, which extracts (video URL, title) pairs and saves
    every video as ``<OUTPUT_DIR>/<title>.mp4``.
    """

    # Listing-page URL template; ``{}`` receives the page number.
    LIST_URL = 'https://ibaotu.com/shipin/7-0-0-0-0-{}.html'
    # Inclusive range of listing pages to crawl.
    FIRST_PAGE = 1
    LAST_PAGE = 222
    # Directory (relative to the working directory) that receives the files.
    OUTPUT_DIR = 'video'
    # Seconds to wait on the network before giving up on a request.
    TIMEOUT = 30

    def starr_request(self):
        """Fetch every listing page and download the videos found on it.

        A page that cannot be fetched (network error, timeout, HTTP error
        status) is reported and skipped so one bad page does not abort the
        whole crawl.
        """
        for page in range(self.FIRST_PAGE, self.LAST_PAGE + 1):
            try:
                response = requests.get(self.LIST_URL.format(page),
                                        timeout=self.TIMEOUT)
                response.raise_for_status()
            except requests.RequestException as exc:
                print('skip page {}: {}'.format(page, exc))
                continue
            html = etree.HTML(response.content.decode())
            if html is None:
                # Nothing parseable came back for this page.
                continue
            self.xpath_data(html)

    def xpath_data(self, html):
        """Extract the videos from one parsed listing page and save them.

        :param html: parsed document exposing ``xpath(query)``.
        :return: ``None``; files are written under ``OUTPUT_DIR``.
        """
        src_list = html.xpath('//div[@class="video-play"]/video/@src')
        tit_list = html.xpath('//span[@class="video-title"]/text()')
        # Pair each source with its title by position.
        # NOTE(review): zip() stops at the shorter list, so a page where the
        # two queries return different counts silently drops the extras.
        pairs = list(zip(src_list, tit_list))
        if not pairs:
            return
        # open() does not create missing directories.
        os.makedirs(self.OUTPUT_DIR, exist_ok=True)
        for src, tit in pairs:
            print(src, tit)
            url = self._absolute_url(src)
            name = self._safe_filename(tit)
            try:
                response = requests.get(url, timeout=self.TIMEOUT)
                response.raise_for_status()
            except requests.RequestException as exc:
                print('skip {}: {}'.format(name, exc))
                continue
            print('down'+name)
            with open(os.path.join(self.OUTPUT_DIR, name), 'wb') as f:
                f.write(response.content)

    @staticmethod
    def _absolute_url(src):
        """Return *src* with a scheme, prefixing ``http:`` when it has none."""
        if src.startswith(('http://', 'https://')):
            return src
        return 'http:' + src

    @staticmethod
    def _safe_filename(title):
        """Turn a scraped title into a filesystem-safe ``.mp4`` file name."""
        # Path separators, characters reserved on common filesystems and
        # control characters would break open() or escape OUTPUT_DIR.
        cleaned = re.sub(r'[\\/:*?"<>|\x00-\x1f]', '_', title.strip())
        return (cleaned or 'untitled') + '.mp4'
# Script entry point: run the crawl only when executed directly, not on import.
if __name__ == '__main__':
    Spider().starr_request()