123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217 |
- # coding=utf-8
- # !/usr/bin/python
- import sys
- import re
- sys.path.append('..')
- from base.spider import Spider
- import urllib.parse
- class Spider(Spider): # 元类 默认的元类 type
- def getName(self):
- return "创艺影视"
- def init(self, extend=""):
- print("============{0}============".format(extend))
- pass
- def homeContent(self, filter):
- result = {}
- cateManual = {
- "电影": "1",
- "剧集": "2",
- "动漫": "4",
- "综艺": "3",
- "纪录片": "30"
- }
- classes = []
- for k in cateManual:
- classes.append({
- 'type_name': k,
- 'type_id': cateManual[k]
- })
- result['class'] = classes
- if (filter):
- result['filters'] = self.config['filter']
- return result
- def homeVideoContent(self):
- result = {
- 'list': []
- }
- return result
- def categoryContent(self, tid, pg, filter, extend):
- result = {}
- header = {"User-Agent": "Mozilla/5.0 (Linux; Android 4.4.2; Nexus 4 Build/KOT49H) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/34.0.1847.114 Mobile Safari/537.36"}
- url = 'https://www.30dian.cn/vodtype/{0}-{1}.html'.format(tid, pg)
- rsp = self.fetch(url,headers=header)
- root = self.html(self.cleanText(rsp.text))
- aList = root.xpath("//div[@class='myui-panel myui-panel-bg clearfix']/div/div/ul/li")
- videos = []
- for a in aList:
- name = a.xpath('./div/a/@title')[0]
- pic = a.xpath('./div/a/@data-original')[0]
- mark = a.xpath("./div/a/span/span[@class='tag']/text()")[0]
- sid = a.xpath("./div/a/@href")[0].replace("/", "").replace("voddetail", "").replace(".html", "")
- videos.append({
- "vod_id": sid,
- "vod_name": name,
- "vod_pic": pic,
- "vod_remarks": mark
- })
- result['list'] = videos
- result['page'] = pg
- result['pagecount'] = 999
- result['limit'] = 5
- result['total'] = 9999
- return result
- def detailContent(self, array):
- tid = array[0]
- url = 'https://www.30dian.cn/voddetail/{0}.html'.format(tid)
- header = {"User-Agent": "Mozilla/5.0 (Linux; Android 4.4.2; Nexus 4 Build/KOT49H) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/34.0.1847.114 Mobile Safari/537.36"}
- rsp = self.fetch(url,headers=header)
- root = self.html(self.cleanText(rsp.text))
- divContent = root.xpath("//div[@class='col-lg-wide-75 col-md-wide-7 col-xs-1 padding-0']")[0]
- title = divContent.xpath(".//div[@class='myui-content__detail']/h1/text()")[0]
- pic = divContent.xpath(".//div[@class='myui-content__thumb']/a/img/@data-original")[0]
- det = divContent.xpath(".//div[@class='col-pd text-collapse content']/span[@class='data']")[0]
- if det.text is None:
- detail = det.xpath(".//p/text()")[0]
- else:
- detail = det.text
- vod = {
- "vod_id": tid,
- "vod_name": title,
- "vod_pic": pic,
- "type_name": "",
- "vod_year": "",
- "vod_area": "",
- "vod_remarks": "",
- "vod_actor": "",
- "vod_director": "",
- "vod_content": detail
- }
- infoArray = divContent.xpath(".//div[@class='myui-content__detail']/p[contains(@class,'data')]")
- for info in infoArray:
- content = info.xpath('string(.)')
- flag = "分类" in content
- if flag == True:
- infon = content.replace("\t","").replace("\n","").strip().split('\r')
- for inf in infon:
- if inf.startswith('分类'):
- vod['type_name'] = inf.replace("分类:", "")
- if inf.startswith('地区'):
- vod['vod_area'] = inf.replace("地区:", "")
- if inf.startswith('年份'):
- vod['vod_year'] = inf.replace("年份:", "")
- if content.startswith('主演'):
- vod['vod_actor'] = content.replace("\xa0", "/").replace("主演:", "").strip('/')
- if content.startswith('更新'):
- vod['vod_remarks'] = content.replace("更新:", "")
- if content.startswith('导演'):
- vod['vod_director'] = content.replace("\xa0", "").replace("导演:", "").strip('/')
- vod_play_from = '$$$'
- playFrom = []
- vodHeader = divContent.xpath(".//div[@class='myui-panel_hd']/div/ul/li/a[contains(@href,'playlist')]/text()")
- for v in vodHeader:
- playFrom.append(v.replace(" ", ""))
- vod_play_from = vod_play_from.join(playFrom)
- vod_play_url = '$$$'
- playList = []
- vodList = divContent.xpath(".//div[contains(@id,'playlist')]")
- for vl in vodList:
- vodItems = []
- aList = vl.xpath('./ul/li/a')
- if len(aList) <= 0:
- name = '无法找到播放源'
- tId = '00000'
- vodItems.append(name + "$" + tId)
- else:
- for tA in aList:
- href = tA.xpath('./@href')[0]
- name = tA.xpath("./text()")[0].replace(" ", "")
- tId = self.regStr(href, '/vodplay/(\\S+).html')
- vodItems.append(name + "$" + tId)
- joinStr = '#'
- joinStr = joinStr.join(vodItems)
- playList.append(joinStr)
- vod_play_url = vod_play_url.join(playList)
- vod['vod_play_from'] = vod_play_from
- vod['vod_play_url'] = vod_play_url
- result = {
- 'list': [
- vod
- ]
- }
- return result
- def searchContent(self, key, quick):
- url = 'https://www.30dian.cn/vodsearch/-------------.html?wd={0}'.format(key)
- header = {
- "User-Agent": "Mozilla/5.0 (Linux; Android 4.4.2; Nexus 4 Build/KOT49H) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/34.0.1847.114 Mobile Safari/537.36"}
- rsp = self.fetch(url, headers=header)
- root = self.html(self.cleanText(rsp.text))
- aList = root.xpath("//ul[contains(@class,'myui-vodlist__media clearfix')]/li")
- videos = []
- for a in aList:
- name = a.xpath(".//div[@class='detail']/h4/a/text()")[0]
- pic = a.xpath(".//a[contains(@class,'myui-vodlist__thumb')]//@data-original")[0]
- mark = a.xpath(".//span[@class='tag']/text()")[0]
- sid = a.xpath(".//div[@class='detail']/h4/a/@href")[0]
- sid = self.regStr(sid,'/voddetail/(\\S+).html')
- videos.append({
- "vod_id": sid,
- "vod_name": name,
- "vod_pic": pic,
- "vod_remarks": mark
- })
- result = {
- 'list': videos
- }
- return result
- def playerContent(self, flag, id, vipFlags):
- result = {}
- header = {
- "User-Agent": "Mozilla/5.0 (Linux; Android 4.4.2; Nexus 4 Build/KOT49H) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/34.0.1847.114 Mobile Safari/537.36"}
- if id == '00000':
- return {}
- url = 'https://www.30dian.cn/vodplay/{0}.html'.format(id)
- rsp = self.fetch(url,headers=header)
- root = self.html(self.cleanText(rsp.text))
- scripts = root.xpath("//div[@class='embed-responsive clearfix']/script[@type='text/javascript']/text()")[0]
- ukey = re.findall(r"url(.*)url_next", scripts)[0].replace('"', "").replace(',', "").replace(':', "")
- purl = urllib.parse.unquote(ukey)
- result["parse"] = 0
- result["playUrl"] = ''
- result["url"] =purl
- result["header"] = {"User-Agent": "Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/86.0.4240.198 Safari/537.36"}
- return result
- config = {
- "player": {},
- "filter": {}
- }
- header = {}
- def isVideoFormat(self, url):
- pass
- def manualVideoCheck(self):
- pass
- def localProxy(self, param):
- action = {
- 'url': '',
- 'header': '',
- 'param': '',
- 'type': 'string',
- 'after': ''
- }
- return [200, "video/MP2T", action, ""]
|