123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255 |
- #coding=utf-8
- #!/usr/bin/python
- import sys
- sys.path.append('..')
- from base.spider import Spider
- import json
- import base64
- import re
- import math
- import time
- import uuid
- import hashlib
- from urllib import request, parse
- import urllib
- import urllib.request
- class Spider(Spider): # 元类 默认的元类 type
- def getName(self):
- return "1905电影"
- def init(self,extend=""):
- print("============{0}============".format(extend))
- pass
- def isVideoFormat(self,url):
- pass
- def manualVideoCheck(self):
- pass
- def homeContent(self,filter):
- result = {}
- cateManual = {
- "电影": "n_1",
- "微电影":"n_1_c_922",
- "系列电影":"n_2",
- "纪录片":"c_927",
- "晚会":"n_1_c_586",
- "独家":"n_1_c_178",
- "综艺":"n_1_c_1024"
- # ,"体育":"n_1_c_1053"
- }
- classes = []
- for k in cateManual:
- classes.append({
- 'type_name':k,
- 'type_id':cateManual[k]
- })
- result['class'] = classes
- if(filter):
- result['filters'] = self.config['filter']
- return result
- def homeVideoContent(self):
- url = 'https://www.1905.com/vod/cctv6/lst/'
- rsp = self.fetch(url, headers=self.header)
- html = self.html(rsp.text)
- aList = html.xpath("//div[@class='grid-2x']/a")
- videos = self.custom_list(aList=aList)
- result = {
- 'list':videos
- }
- return result
- def categoryContent(self,tid,pg,filter,extend):
- result = {}
- videos=[]
- by='/o1p'
- if 'by' in extend.keys():
- by='/{0}p'.format(extend['by'])
- url = 'https://www.1905.com/vod/list/{0}{2}{1}.html'.format(tid, pg,by)
- rsp = self.fetch(url, headers=self.header)
- HtmlTxt=rsp.text
- html = self.html(HtmlTxt)
- aList = html.xpath("//section[contains(@class,'search-list')]/div/a" if tid != u'n_2' else "//div[@class='mod']/div[1]/a")
- videos = self.custom_list(aList=aList)
- limit = len(aList)
- result['list'] = videos
- result['page'] = pg
- result['pagecount'] = 100
- result['limit'] = limit
- result['total'] = 100 * limit
- return result
- def detailContent(self,array):
- result = {}
- aid = array[0]
- vodItems=[]
- playList=[]
- vod_play_from=['1905电影',]
- if aid.isdigit()==False:
- rsp = self.fetch(aid, headers=self.header)
- HtmlTxt=rsp.text
- url=self.regStr(reg=r'<a class="iconBanner-playBtn icon-banner btn-play"\s*href="(.+?)"',src=HtmlTxt)
- if url=='':
- url=self.regStr(reg=r'property="og:url"\scontent="(.+?)"',src=HtmlTxt)
- if len(self.regStr(reg=r'(vip.1905)',src=url))>3:
- vod_play_from=['1905电影(需要vip解析)',]
- aid=url
- else:
- aid=self.regStr(reg=r'play/(.*?)\.sh',src=url)
- if aid=='':
- return {'list': []}
- elif aid.isdigit() and vod_play_from[0].find('需要vip解析')<0:
- url = "https://www.1905.com/api/content/?callback=&m=Vod&a=getVodSidebar&id={0}&fomat=json".format(aid)
- rsp = self.fetch(url, headers=self.header)
- HtmlTxt=rsp.text
- root = json.loads(HtmlTxt)
- title = root['title']
- pic = root['thumb']
- remark = root['commendreason']
- content = root['description']
- actor = root['starring']
- direct = root['direct']
- vodItems.append(title + "$" + aid)
- series = root['info']['series_data']
- series = root['info']['series_data']
- for ser in series:
- vodItems.append(ser['title'] + "$" + ser['contentid'])
- joinStr = '#'.join(vodItems)
- playList.append(joinStr)
- else:
- rsp = self.fetch(array[0], headers=self.header)
- HtmlTxt=rsp.text
- title=self.regStr(reg=r'<div class="container-right">\s*\r*\n*\t*<h1>(.+?)<',src=HtmlTxt).replace(' ','')
- pic=self.regStr(reg=r'<img class="poster" src="(.+?)"',src=HtmlTxt)
- remark=''
- actor=''
- direct=''
- content=self.regStr(reg=r'<p>(.+?)</p>',src=HtmlTxt)
- vodItems.append(title + "$" + aid)
- joinStr = '#'.join(vodItems)
- playList.append(joinStr)
- vod = {
- "vod_id":array[0],
- "vod_name":title,
- "vod_pic":pic,
- "type_name":'',
- "vod_year":"",
- "vod_area":"",
- "vod_remarks":remark,
- "vod_actor":actor,
- "vod_director":direct,
- "vod_content":content
- }
- vod['vod_play_from'] = "$$$".join(vod_play_from)
- vod['vod_play_url'] = "$$$".join(playList)
- result = {
- 'list':[
- vod
- ]
- }
- return result
- def searchContent(self,key,quick):
- url = 'https://www.1905.com/search/index-p-type-film-q-{}.html?envod=1&year=0&score=0&order=0'.format(key)#只搜索能看电影,想搜其它的可以把html之后的字符删掉
- #https://www.1905.com/search/index-p-type-all-q-{}.html
- rsp = self.fetch(url, headers=self.header)
- html = self.html(rsp.text)
- aList = html.xpath("//div/div[contains(@class,'new_content')]/div/div/div/a")
- videos = self.custom_list(aList=aList)
- result = {
- 'list':videos
- }
- return result
- def playerContent(self,flag,id,vipFlags):
- result = {}
- if flag.find('vip解析')>0:
- result["parse"] = 1#0=直接播放、1=嗅探
- result["playUrl"] =''
- result["url"] = id
- result['jx'] = 1#1=VIP解析,0=不解析
- result["header"] = ''
- else:
- nonce = int(round(time.time() * 1000))
- expiretime = nonce + 600
- uid = str(uuid.uuid4())
- playerid = uid.replace("-", "")[5:20]
- signature = 'cid={0}&expiretime={1}&nonce={2}&page=https%3A%2F%2Fwww.1905.com%2Fvod%2Fplay%2F{3}.shtml&playerid={4}&type=hls&uuid={5}.dde3d61a0411511d'.format(id,expiretime,nonce,id,playerid,uid)
- signature = hashlib.sha1(signature.encode()).hexdigest()
- url = 'https://profile.m1905.com/mvod/getVideoinfo.php?nonce={0}&expiretime={1}&cid={2}&uuid={3}&playerid={4}&page=https%3A%2F%2Fwww.1905.com%2Fvod%2Fplay%2F{5}.shtml&type=hls&signature={6}&callback='.format(nonce,expiretime,id,uid,playerid,id,signature)
- rsp = self.fetch(url, headers=self.header)
- HtmlTxt=rsp.text
- jo = json.loads(HtmlTxt.replace("(", "").replace(")", ""))
- data = jo['data']['sign']
- sign = ''
- qualityStr = ''
- if 'uhd' in data.keys():
- sign = data['uhd']['sign']
- qualityStr = 'uhd'
- elif 'hd' in data.keys():
- sign = data['hd']['sign']
- qualityStr = 'hd'
- elif 'sd' in data.keys():
- sign = data['sd']['sign']
- qualityStr = 'sd'
- host = jo['data']['quality'][qualityStr]['host']
- path = jo['data']['path'][qualityStr]['path']
- playUrl = host + sign + path
- result["parse"] = 1#0=直接播放、1=嗅探
- result["playUrl"] =''
- result["url"] = playUrl
- result["header"] = self.header
- return result
- config = {
- "player": {},
- "filter": {
- "n_1":[
- {"key":"by","name":"排序:","value":[{"n":"默认(最新)","v":"o1"},{"n":"最热","v":"o3"},{"n":"好评","v":"o4"}]}
- ],
- "n_1_c_922":[
- {"key":"by","name":"排序:","value":[{"n":"默认(最新)","v":"o1"},{"n":"最热","v":"o3"},{"n":"好评","v":"o4"}]}
- ],
- "n_2":[
- {"key":"by","name":"排序:","value":[{"n":"默认(最新)","v":"o1"},{"n":"最热","v":"o3"},{"n":"好评","v":"o4"}]}
- ],
- "c_927":[
- {"key":"by","name":"排序:","value":[{"n":"默认(最新)","v":"o1"},{"n":"最热","v":"o3"},{"n":"好评","v":"o4"}]}
- ],
- "n_1_c_586":[
- {"key":"by","name":"排序:","value":[{"n":"默认(最新)","v":"o1"},{"n":"最热","v":"o3"},{"n":"好评","v":"o4"}]}
- ],
- "n_1_c_178":[
- {"key":"by","name":"排序:","value":[{"n":"默认(最新)","v":"o1"},{"n":"最热","v":"o3"},{"n":"好评","v":"o4"}]}
- ],
- "n_1_c_1024":[
- {"key":"by","name":"排序:","value":[{"n":"默认(最新)","v":"o1"},{"n":"最热","v":"o3"},{"n":"好评","v":"o4"}]}
- ]
- }
- }
- header = {
- 'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/117.0.0.0 Safari/537.36 Edg/117.0.2045.43',
- 'Referer': 'https://www.1905.com/vod/list/n_1/o3p1.html',
- 'Accept': 'text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,image/apng,*/*;q=0.8,application/signed-exchange;v=b3;q=0.7'
- }
- def localProxy(self,param):
- return [200, "video/MP2T", action, ""]
- #-----------------------------------------------自定义函数-----------------------------------------------
- #分类取结果
- def custom_list(self,aList):
- videos = []
- for a in aList:
- img=a.xpath('./img/@src')[0]
- title=a.xpath('./img/@alt')[0]
- url=a.xpath("./@href")[0]
- if url.find('vip.1905')>1:#可以除掉
- continue
- if self.regStr(reg=r'(play)',src=url)=='':
- vod_id="{0}".format(url)
- else:
- id=self.regStr(reg=r'play/(.*?)\.sh',src=url)
- vod_id="{0}".format(id)
- videos.append({
- "vod_id":vod_id,
- "vod_name":title,
- "vod_pic":img,
- "vod_remarks":''
- })
- return videos
|