123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238 |
- # coding=utf-8
- # !/usr/bin/python
- import sys
- sys.path.append('..')
- from base.spider import Spider
- import json
- import base64
- import hashlib
- class Spider(Spider): # 元类 默认的元类 type
- def getName(self):
- return "LeZhuTV"
- def init(self, extend=""):
- print("============{0}============".format(extend))
- pass
- def homeContent(self, filter):
- result = {}
- cateManual = {
- "电影": "1",
- "连续剧": "2",
- "动漫": "4",
- "综艺": "3",
- "韩剧": "14",
- "美剧": "15"
- }
- classes = []
- for k in cateManual:
- classes.append({
- 'type_name': k,
- 'type_id': cateManual[k]
- })
- result['class'] = classes
- if (filter):
- result['filters'] = self.config['filter']
- return result
- def homeVideoContent(self):
- rsp = self.fetch("http://www.lezhutv.com")
- root = self.html(rsp.text)
- aList = root.xpath("//ul[@class='tbox_m2']/li")
- videos = []
- for a in aList:
- name = a.xpath('.//@title')[0]
- pic = a.xpath('.//@data-original')[0]
- mark = a.xpath(".//span/text()")[0]
- sid = a.xpath(".//@href")[0]
- sid = self.regStr(sid, "/detail/(\\d+).html")
- videos.append({
- "vod_id": sid,
- "vod_name": name,
- "vod_pic": pic,
- "vod_remarks": mark
- })
- result = {
- 'list': videos
- }
- return result
- def categoryContent(self, tid, pg, filter, extend):
- result = {}
- ext = extend.get("by","")
- url = 'http://www.lezhutv.com/list/{0}_{1}_desc_{2}_0_0___.html'.format(tid,pg,ext)
- rsp = self.fetch(url)
- root = self.html(rsp.text)
- aList = root.xpath("//ul[@class='tbox_m2']/li")
- videos = []
- for a in aList:
- name = a.xpath('.//@title')[0]
- pic = a.xpath('.//@data-original')[0]
- mark = a.xpath(".//span/text()")[0]
- sid = a.xpath(".//@href")[0]
- sid = self.regStr(sid, "/detail/(\\d+).html")
- videos.append({
- "vod_id": sid,
- "vod_name": name,
- "vod_pic": pic,
- "vod_remarks": mark
- })
- result['list'] = videos
- result['page'] = pg
- result['pagecount'] = 9999
- result['limit'] = 90
- result['total'] = 999999
- return result
- def detailContent(self, array):
- tid = array[0]
- url = 'http://www.lezhutv.com/detail/{0}.html'.format(tid)
- rsp = self.fetch(url)
- root = self.html(rsp.text)
- node = root.xpath(".//div[@class='dbox']")[0]
- nodes = root.xpath(".//div[@class='tbox2']")[0]
- pic = node.xpath(".//div/@data-original")[0]
- title = node.xpath('.//h4/text()')[0]
- detail = nodes.xpath(".//div[@class='tbox_js']/text()")[0]
- yac = node.xpath(".//p[@class='yac']/text()")[0]
- yac = yac.split('/')
- yacs = yac[0].strip()
- type_name = yac[1].strip()
- actor = node.xpath(".//p[@class='act']/text()")[0]
- director = node.xpath(".//p[@class='dir']/text()")[0]
- vod = {
- "vod_id": tid,
- "vod_name": title,
- "vod_pic": pic,
- "type_name": type_name,
- "vod_year": yacs,
- "vod_area": "",
- "vod_remarks": "",
- "vod_actor": actor,
- "vod_director": director,
- "vod_content": detail
- }
- vod_play_from = '$$$'
- playFrom = []
- vodHeader = root.xpath(".//div[@class='tbox2 tabs']/div/h3/text()")
- i=1
- for v in vodHeader:
- playFrom.append("线路" + str(i))
- i = i+1
- vod_play_from = vod_play_from.join(playFrom)
- vod_play_url = '$$$'
- playList = []
- vodList = root.xpath("//div[@class='tbox2 tabs']")
- for vl in vodList:
- vodItems = []
- aList = vl.xpath(".//ul/li/a")
- for tA in aList:
- href = tA.xpath('./@href')[0]
- name = tA.xpath('./text()')[0]
- tId = self.regStr(href, '/play/(\\S+).html')
- vodItems.append(name + "$" + tId)
- joinStr = '#'
- joinStr = joinStr.join(vodItems)
- playList.append(joinStr)
- vod_play_url = vod_play_url.join(playList)
- vod['vod_play_from'] = vod_play_from
- vod['vod_play_url'] = vod_play_url
- result = {
- 'list': [
- vod
- ]
- }
- return result
- def searchContent(self, key, quick):
- url = 'http://www.lezhutv.com/search-pg-1-wd-{0}.html'.format(key)
- rsp = self.fetch(url)
- root = self.html(rsp.text)
- seaArray = root.xpath("//ul[@class='tbox_m']/li")
- seaList = []
- for vod in seaArray:
- name = vod.xpath('.//@title')[0]
- pic = vod.xpath('.//@data-original')[0]
- mark = vod.xpath(".//span/text()")[0]
- sid = vod.xpath(".//@href")[0]
- sid = self.regStr(sid, "/detail/(\\d+).html")
- seaList.append({
- "vod_id": sid,
- "vod_name": name,
- "vod_pic": pic,
- "vod_remarks": mark
- })
- result = {
- 'list': seaList
- }
- return result
- config = {
- "player":{},
- "filter":{"1":[{"key":"by","name":"排序","value":[{"n":"时间","v":"time"},{"n":"人气","v":"score"},{"n":"评分","v":"hits"}]}],"2":[{"key":"by","name":"排序","value":[{"n":"时间","v":"time"},{"n":"人气","v":"score"},{"n":"评分","v":"hits"}]}],"3":[{"key":"by","name":"排序","value":[{"n":"时间","v":"time"},{"n":"人气","v":"score"},{"n":"评分","v":"hits"}]}],"4":[{"key":"by","name":"排序","value":[{"n":"时间","v":"time"},{"n":"人气","v":"score"},{"n":"评分","v":"hits"}]}],"14":[{"key":"by","name":"排序","value":[{"n":"时间","v":"time"},{"n":"人气","v":"score"},{"n":"评分","v":"hits"}]}],"15":[{"key":"by","name":"排序","value":[{"n":"时间","v":"time"},{"n":"人气","v":"score"},{"n":"评分","v":"hits"}]}]}
- }
- header = {
- "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/99.0.4844.84 Safari/537.36"
- }
- def get_md5(self,value):
- b64 = base64.b64encode((base64.b64encode(value.encode()).decode() + "NTY2").encode()).decode()
- md5 = hashlib.md5(b64.encode()).hexdigest()
- return "".join(char if char.isdigit() else "zyxwvutsrqponmlkjihgfedcba"["abcdefghijklmnopqrstuvwxyz".find(char)] for char in md5)
- def playerContent(self, flag, id, vipFlags):
- result = {}
- url = 'http://www.lezhutv.com/play/{0}.html'.format(id)
- rsp = self.fetch(url)
- root = self.html(rsp.text)
- scripts = root.xpath("//script/text()")
- scripts = scripts[1].replace('\n', '')
- nid = self.regStr(scripts, 'view_path = \'(.*?)\';')
- md5url = 'http://www.lezhutv.com/hls2/index.php?url={0}'.format(nid)
- rsp = self.fetch(md5url)
- root = self.html(rsp.text)
- value = root.xpath(".//input[@id='hdMd5']/@value")
- value = ''.join(value)
- md5s = self.get_md5(str(value))
- data = {
- "id": nid,
- "type": "vid",
- "siteuser": "",
- "md5": md5s,
- "referer": url,
- "hd": "",
- "lg": ""
- }
- payUrl = 'http://www.lezhutv.com/hls2/url.php'
- parseRsp = self.post(payUrl,data,headers=self.header)
- parseRsps = json.loads(parseRsp.text)
- realUrl = parseRsps['media']['url']
- if len(realUrl) > 0:
- result["parse"] = 0
- result["playUrl"] = ""
- result["url"] = realUrl
- result["header"] = ""
- else:
- result["parse"] = 1
- result["playUrl"] = ""
- result["url"] = url
- result["header"] = json.dumps(self.header)
- return result
- def isVideoFormat(self, url):
- pass
- def manualVideoCheck(self):
- pass
- def localProxy(self, param):
- return [200, "video/MP2T", action, ""]
|