123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181 |
- #coding=utf-8
- #!/usr/bin/python
- import sys
- sys.path.append('..')
- from base.spider import Spider
- import json
- import time
- import base64
class Spider(Spider):  # metaclass note: uses the default metaclass, `type`
    """Spider plugin listing CCTV ("央视") programme columns via cntv.cn APIs.

    The class subclasses the ``Spider`` imported from ``base.spider`` and
    reuses its name on purpose. ``self.fetch`` is not defined here and is
    expected to be provided by that base class.
    """

    # HTTP headers sent with every request issued by this spider.
    header = {
        "User-Agent":"Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/94.0.4606.54 Safari/537.36"
    }

    # Static configuration; 'filter' is returned verbatim by homeContent().
    # NOTE(review): the only filter key, TOPC1451557970755294, is not one of
    # the column ids listed in homeContent() -- confirm it is still wanted.
    config = {
        "player": {},
        "filter": {
            "TOPC1451557970755294": [
                {
                    "key": "d",
                    "name": "年份",
                    "value": [
                        {"n": "全部", "v": ""},
                        {"n": "2021", "v": "2021"},
                        {"n": "2020", "v": "2020"},
                        {"n": "2019", "v": "2019"},
                        {"n": "2018", "v": "2018"},
                        {"n": "2017", "v": "2017"},
                        {"n": "2016", "v": "2016"},
                        {"n": "2015", "v": "2015"},
                        {"n": "2014", "v": "2014"},
                        {"n": "2013", "v": "2013"},
                        {"n": "2012", "v": "2012"},
                        {"n": "2011", "v": "2011"},
                        {"n": "2010", "v": "2010"},
                        {"n": "2009", "v": "2009"},
                    ],
                }
            ]
        },
    }

    def getName(self):
        """Return the display name of this spider."""
        return "央视"

    def init(self, extend=""):
        """Print the ``extend`` value handed over at start-up; no other setup."""
        print("============{0}============".format(extend))

    def isVideoFormat(self, url):
        """Not implemented; always returns ``None``."""
        pass

    def manualVideoCheck(self):
        """Not implemented; always returns ``None``."""
        pass

    def homeContent(self, filter):
        """Return the list of programme columns offered as categories.

        Args:
            filter: When truthy, the filter definitions from ``config`` are
                added to the result under ``'filters'``.

        Returns:
            A dict with ``'class'`` (a list of ``{'type_name', 'type_id'}``
            entries in declaration order) and, optionally, ``'filters'``.
        """
        # Display name -> column id. Ids starting with "TOPC" are queried
        # through the column endpoint, anything else through the album
        # endpoint (see categoryContent).
        cateManual = {
            "健康之路": "TOPC1451557646802924",
            "远方的家": "TOPC1451541349400938",
            "探索发现": "TOPC1451557893544236",
            "地理中国": "TOPC1451557421544786",
            "人与自然": "TOPC1451525103989666",
            "人文地理": "TOPC1451469288523874",
            "全景自然": "TOPC1451469617360656",
            "魅力纪录": "TOPC1451465982926341",
            "秘境之眼": "TOPC1554187056533820",
            "自然": "TOPC1451469660736687",
            "新闻联播": "TOPC1451528971114112",
            "焦点访谈": "TOPC1451558976694518",
            "海峡两岸": "TOPC1451540328102649",
            "今日关注": "TOPC1451540389082713",
            "今日亚洲": "TOPC1451540448405749",
            "防务新观察": "TOPC1451526164984187",
            "共同关注": "TOPC1451558858788377",
            "深度国际": "TOPC1451540709098112",
            "环宇视野": "TOPC1451469241240836",
            "环球视线": "TOPC1451558926200436",
            "世界周刊": "TOPC1451558687534149",
            "东方时空": "TOPC1451558532019883",
            "新闻调查": "TOPC1451558819463311",
            "环球科技视野": "TOPC1451463780801881",
            "讲武堂": "TOPC1451526241359341",
            "国宝发现": "TOPC1571034869935436",
            "国宝档案": "TOPC1451540268188575",
            "天下财经": "TOPC1451531385787654",
            "走进科学": "TOPC1451558190239536",
            "解码科技史": "TOPC1570876640457386",
            "法律讲堂": "TOPC1451542824484472",
            "百家讲坛": "TOPC1451557052519584",
            "名家书场": "TOPC1579401761622774",
            "星光大道": "TOPC1451467630488780",
            "非常6+1": "TOPC1451467940101208",
            "中国节拍": "TOPC1570025984977611",
            "一鸣惊人": "TOPC1451558692971175",
            "金牌喜剧班": "TOPC1611826337610628",
            "九州大戏台": "TOPC1451558399948678",
            "家庭幽默大赛": "TOPC1451375222891702",
            "综艺盛典": "TOPC1451985071887935",
            "环球综艺": "TOPC1571300682556971",
            "中国好歌曲": "TOPC1451984949453678",
            "外国人在中国": "TOPC1451541113743615",
            "华人世界": "TOPC1451539822927345",
            "动物传奇": "TOPC1451984181884527",
            "美食中国": "TOPC1571034804976375",
            "动物世界": "TOPC1451378967257534",
            "经典咏流传 第五季":"VIDAIiNbDQzOjE5mLl3T4t2B220403"
        }
        result = {
            'class': [
                {'type_name': name, 'type_id': column_id}
                for name, column_id in cateManual.items()
            ]
        }
        if filter:
            result['filters'] = self.config['filter']
        return result

    def homeVideoContent(self):
        """Return an empty recommendation list (no home-page videos)."""
        return {'list': []}

    def categoryContent(self, tid, pg, filter, extend):
        """Fetch one page of videos for a column or album.

        Args:
            tid: Column/album id, as produced by ``homeContent``.
            pg: Page number; passed to the API as ``p`` and echoed back.
            filter: Unused.
            extend: Optional mapping of filter values; only the key ``'d'``
                is forwarded to the API. It is not modified. ``None`` is
                treated as empty.

        Returns:
            A dict with ``'list'`` (video entries), ``'page'``,
            ``'pagecount'``, ``'limit'`` and ``'total'``.
        """
        # Copy before adding 'id'/'p' so the caller's dict is left untouched.
        query = dict(extend or {})
        query['id'] = tid
        query['p'] = pg
        # Only emit parameters that are present; this avoids the empty
        # "&&" segments a fixed-size placeholder list would produce.
        suffix = '&'.join(
            '{0}={1}'.format(key, query[key])
            for key in ('id', 'p', 'd')
            if key in query
        )
        if tid.startswith('TOPC'):
            endpoint = 'getVideoListByColumn'
        else:
            endpoint = 'getVideoListByAlbumIdNew'
        url = (
            'https://api.cntv.cn/NewVideo/{0}?{1}'
            '&n=20&sort=desc&mode=0&serviceId=tvcctv&t=json'
        ).format(endpoint, suffix)
        rsp = self.fetch(url, headers=self.header)
        jo = json.loads(rsp.text)
        # A response without data/list yields an empty page instead of a
        # KeyError.
        vodList = (jo.get('data') or {}).get('list') or []
        videos = []
        for vod in vodList:
            img = vod['image']
            videos.append({
                # The cover URL rides along in the id so detailContent can
                # show it without a second lookup.
                "vod_id": vod['guid'] + "###" + img,
                "vod_name": vod['title'],
                "vod_pic": img,
                "vod_remarks": ''
            })
        # NOTE(review): 'limit' is reported as 90 although the request asks
        # for n=20 items; value kept as-is -- confirm what the client expects.
        return {
            'list': videos,
            'page': pg,
            'pagecount': 9999,
            'limit': 90,
            'total': 999999,
        }

    def detailContent(self, array):
        """Build the detail record for a single video.

        Args:
            array: Sequence whose first element is a ``vod_id`` of the form
                ``"<guid>###<cover url>"`` as emitted by ``categoryContent``.
                An id without the ``###`` separator is accepted and yields
                an empty cover.

        Returns:
            ``{'list': [vod]}`` where ``vod`` carries the title, cover and a
            single ``CCTV`` play source pointing at the HLS URL.
        """
        # partition() tolerates a missing separator, where indexing the
        # result of split() would raise IndexError.
        tid, _, pic = array[0].partition('###')
        url = "https://vdn.apps.cntv.cn/api/getHttpVideoInfo.do?pid={0}".format(tid)
        rsp = self.fetch(url, headers=self.header)
        jo = json.loads(rsp.text)
        title = jo['title'].strip()
        link = jo['hls_url'].strip()
        vod = {
            "vod_id": tid,
            "vod_name": title,
            "vod_pic": pic,
            "type_name": '',
            "vod_year": "",
            "vod_area": "",
            "vod_remarks": "",
            "vod_actor": "",
            "vod_director": "",
            "vod_content": "",
            "vod_play_from": 'CCTV',
            # "<episode name>$<url>" pair for the single episode.
            "vod_play_url": title + "$" + link,
        }
        return {'list': [vod]}

    def searchContent(self, key, quick):
        """Search is not supported; always returns an empty list."""
        return {'list': []}

    def playerContent(self, flag, id, vipFlags):
        """Resolve the playable stream URL for a playlist URL.

        Downloads the playlist at ``id`` and resolves its last line against
        ``id``.

        Args:
            flag: Unused.
            id: URL of the playlist, as stored in ``vod_play_url``.
            vipFlags: Unused.

        Returns:
            A dict with ``'parse'`` (0), ``'playUrl'``, ``'url'`` and
            ``'header'``.
        """
        # Function-scope import keeps this block self-contained.
        from urllib.parse import urljoin

        rsp = self.fetch(id, headers=self.header)
        lines = rsp.text.strip().split('\n')
        # The last entry is taken as the stream to play (presumably the
        # highest-bitrate variant -- TODO confirm). urljoin handles
        # root-relative, relative and absolute entries, and any host
        # (hyphens, ports), unlike a hand-written host regex.
        url = urljoin(id, lines[-1])
        return {
            "parse": 0,
            "playUrl": '',
            "url": url,
            "header": '',
        }

    def localProxy(self, param):
        """Return a placeholder local-proxy response.

        Args:
            param: Unused.

        Returns:
            ``[200, "video/MP2T", action, ""]`` where ``action`` is an empty
            descriptor.
        """
        # `action` was previously undefined here, so any call raised
        # NameError. NOTE(review): the field set below is an assumption
        # about what the host framework expects -- confirm.
        action = {
            'url': '',
            'header': '',
            'param': '',
            'type': 'string',
            'after': ''
        }
        return [200, "video/MP2T", action, ""]
|