#coding=utf-8
#!/usr/bin/python
import base64
import json
import sys
import time
from urllib.parse import quote

sys.path.append('..')  # must run before the next import so `base.spider` can be resolved
from base.spider import Spider
class Spider(Spider):  # metaclass: the default metaclass, `type`
    """Spider that lists singers/bands as categories and searches Bilibili for them.

    Every category id is used verbatim as a Bilibili video-search keyword.
    Three extra category ids ("热门", "排行榜", "动态") are routed to the
    popular, ranking and dynamic-feed endpoints instead of the search API.

    NOTE(review): the hook names (homeContent, categoryContent, ...) are
    presumably dictated by the imported base ``Spider`` class, which also
    provides ``self.fetch`` — confirm against ``base.spider``.
    """

    # Kept from the original class body; nothing in this class assigns to it.
    cookies = ''
    # `filter` is returned by homeContent() when filters are requested.
    config = {
        "player": {},
        "filter": {}
    }
    # Extra request headers sent by detailContent().
    header = {}

    # Category names, in display order. Each name is both the label shown to
    # the user and the search keyword sent to Bilibili.
    _SINGERS = (
        "周杰伦", "Beyond", "陈奕迅", "许巍", "刘德华", "张学友", "郭富城", "黎明",
        "朴树", "迪克牛仔", "李宗盛", "邓丽君", "林子祥", "张信哲", "任贤齐", "孙楠",
        "张宇", "周华健", "蔡依林", "薛之谦", "许嵩", "初音未来", "洛天依", "戴佩妮",
        "邓紫棋", "蔡健雅", "张韶涵", "莫文蔚", "刘若英", "周深", "毛不易", "汪苏泷",
        "李宇春", "徐佳莹", "杨宗纬", "胡彦斌", "杨千嬅", "张靓颖", "李荣浩", "杨丞琳",
        "林志炫", "陶喆", "胡夏", "弦子", "陈小春", "萧亚轩", "鹿晗", "纵贯线",
        "林俊杰", "谭咏麟", "赵雷", "凤凰传奇", "容祖儿", "周传雄", "SHE", "苏打绿",
        "五月天", "张国荣", "梅艳芳", "孙燕姿", "李健", "华晨宇", "袁娅维", "大张伟",
        "TFBOYS", "易烊千玺", "王俊凯", "王源", "田馥甄", "小虎队", "张杰", "伍佰",
        "王菲", "刀郎", "草蜢", "潘玮柏", "梁静茹", "林宥嘉", "蔡徐坤", "周慧敏",
        "李圣杰", "张惠妹", "萧敬腾", "周笔畅", "焦迈奇", "尤长靖", "郑中基", "谭维维",
        "陈慧娴", "张艺兴", "王嘉尔", "刘宪华", "张敬轩", "李克勤", "阿杜", "郭静",
        "崔健", "庾澄庆", "汪峰", "那英", "杨坤", "叶倩文", "王心凌", "张震岳",
        "韩红", "齐秦", "张雨生", "黄品源", "林忆莲", "丁当", "郑智化", "李玟",
        "谢霆锋", "黄小琥", "徐小凤", "任嘉伦", "卓依婷", "逃跑计划", "青鸟飞鱼", "飞儿乐队",
        "花儿乐队", "南拳妈妈", "水木年华", "动力火车", "筷子兄弟", "鹿先森乐队", "信乐队", "旅行团乐队",
        "By2", "郁可唯", "宋亚森", "费玉清", "费翔", "金志文", "方大同", "吴克群",
        "罗大佑", "光良", "凤飞飞", "田震", "谭晶", "王杰", "羽泉", "金池",
        "屠洪刚", "戴荃", "郭采洁", "罗志祥", "王力宏", "林肯公园", "迈克尔杰克逊", "泰勒·斯威夫特",
        "阿黛尔", "BIGBANG", "贾斯丁比伯", "Lady Gaga", "中岛美雪", "后街男孩", "仓木麻衣", "布兰妮",
        "夜愿乐队",
    )

    # ------------------------------------------------------------------
    # Private helpers shared by the feed/search/detail/player methods.
    # ------------------------------------------------------------------

    @staticmethod
    def _strip_em(text):
        """Remove the keyword-highlight ``<em>`` markup from a title."""
        return text.replace("<em class=\"keyword\">", "").replace("</em>", "")

    @staticmethod
    def _vod_entry(aid, name, pic, remark):
        """Build one list entry in the shape every listing method returns."""
        return {
            "vod_id": str(aid).strip(),
            "vod_name": name,
            "vod_pic": pic,
            "vod_remarks": str(remark).strip()
        }

    @staticmethod
    def _paged(videos, page, pagecount=9999):
        """Wrap a list of entries with the fixed paging fields used throughout."""
        return {
            'list': videos,
            'page': page,
            'pagecount': pagecount,
            'limit': 90,
            'total': 999999
        }

    def _get_json(self, url, **kwargs):
        """Fetch *url* with the cookie jar attached and decode the JSON body."""
        rsp = self.fetch(url, cookies=self.getCookie(), **kwargs)
        return json.loads(rsp.text)

    def _archive_feed(self, url, page, pagecount):
        """Load an endpoint whose payload is ``data.list`` of plain videos.

        Returns an empty dict when the API reports a non-zero ``code``,
        exactly as the original per-endpoint implementations did.
        """
        jo = self._get_json(url)
        if jo.get('code') != 0:
            return {}
        videos = [
            self._vod_entry(
                vod['aid'],
                self._strip_em(vod['title'].strip()),
                vod['pic'].strip(),
                vod['duration'],
            )
            for vod in jo['data']['list']
        ]
        return self._paged(videos, page, pagecount)

    # ------------------------------------------------------------------
    # Spider hooks.
    # ------------------------------------------------------------------

    def getName(self):
        """Return the display name of this spider."""
        return "歌手专辑"

    def init(self, extend=""):
        """Log the *extend* argument; no other initialisation is performed."""
        print("============{0}============".format(extend))

    def isVideoFormat(self, url):
        """Unimplemented hook; always returns None."""
        pass

    def manualVideoCheck(self):
        """Unimplemented hook; always returns None."""
        pass

    def homeContent(self, filter):
        """Return the category list, plus the filter config when *filter* is truthy.

        Returns:
            dict with ``class`` (list of ``{'type_name', 'type_id'}``) and,
            optionally, ``filters``.
        """
        result = {
            'class': [
                {'type_name': name, 'type_id': name}
                for name in self._SINGERS
            ]
        }
        if filter:
            result['filters'] = self.config['filter']
        return result

    def homeVideoContent(self):
        """Return an empty home-page video list."""
        return {'list': []}

    def getCookie(self):
        """Build a ``RequestsCookieJar`` from the hard-coded cookie header line.

        A fresh jar is parsed on every call.

        SECURITY NOTE(review): the string below embeds session credentials
        (e.g. SESSDATA, bili_jct) directly in source. The value is left
        unchanged to preserve behaviour, but it should be moved to external
        configuration.
        """
        import requests
        import http.cookies
        # Put your cookie here.
        raw_cookie_line = "buvid3=CFF74DA7-E79E-4B53-BB96-FC74AB8CD2F3184997infoc; LIVE_BUVID=AUTO4216125328906835; rpdid=|(umRum~uY~R0J'uYukYukkkY; balh_is_closed=; balh_server_inner=__custom__; PVID=4; video_page_version=v_old_home; i-wanna-go-back=-1; CURRENT_BLACKGAP=0; blackside_state=0; fingerprint=8965144a609d60190bd051578c610d72; buvid_fp_plain=undefined; CURRENT_QUALITY=120; hit-dyn-v2=1; nostalgia_conf=-1; buvid_fp=CFF74DA7-E79E-4B53-BB96-FC74AB8CD2F3184997infoc; CURRENT_FNVAL=4048; DedeUserID=85342; DedeUserID__ckMd5=f070401c4c699c83; b_ut=5; hit-new-style-dyn=0; buvid4=15C64651-E8B7-100C-4B1F-C7CFD2DB473007906-022110820-jYQRaMeS%2BRXRfw14q70%2FLQ%3D%3D; b_nut=1667910208; b_lsid=3CE4AE79_184578915C0; is-2022-channel=1; innersign=0; SESSDATA=a5e4d58d%2C1683641322%2C2c39a%2Ab1; bili_jct=2f3126b5954e37f593130f2fef082cd8; sid=p7tjqv22; bp_video_offset_85342=726936847258746900"
        simple_cookie = http.cookies.SimpleCookie(raw_cookie_line)
        cookie_jar = requests.cookies.RequestsCookieJar()
        cookie_jar.update(simple_cookie)
        return cookie_jar

    def get_dynamic(self, pg):
        """Return page *pg* of the dynamic feed, keeping only video items.

        Items whose ``type`` is not ``DYNAMIC_TYPE_AV`` are skipped.
        Returns an empty dict when the API reports a non-zero ``code``.
        """
        url = 'https://api.bilibili.com/x/polymer/web-dynamic/v1/feed/all?timezone_offset=-480&type=all&page={0}'.format(pg)
        jo = self._get_json(url)
        if jo.get('code') != 0:
            return {}
        videos = []
        for vod in jo['data']['items']:
            if vod['type'] != 'DYNAMIC_TYPE_AV':
                continue
            archive = vod['modules']['module_dynamic']['major']['archive']
            videos.append(self._vod_entry(
                archive['aid'],
                self._strip_em(archive['title'].strip()),
                archive['cover'].strip(),
                archive['duration_text'],
            ))
        return self._paged(videos, pg)

    def get_hot(self, pg):
        """Return page *pg* of the popular-videos list (empty dict on API error)."""
        url = 'https://api.bilibili.com/x/web-interface/popular?ps=20&pn={0}'.format(pg)
        return self._archive_feed(url, pg, 9999)

    def get_rank(self):
        """Return the ranking list as a single page (empty dict on API error)."""
        url = 'https://api.bilibili.com/x/web-interface/ranking/v2?rid=0&type=all'
        return self._archive_feed(url, 1, 1)

    def categoryContent(self, tid, pg, filter, extend):
        """Return page *pg* of videos for category *tid*.

        The special ids "热门", "排行榜" and "动态" are delegated to
        get_hot / get_rank / get_dynamic. Any other *tid* is used as a video
        search keyword; the request is retried once when the first response
        carries a non-zero ``code``. *filter* and *extend* are not used.

        Returns:
            dict with ``list`` and paging fields. ``list`` is empty when the
            search yields no ``result`` entries.
        """
        if tid == "热门":
            return self.get_hot(pg=pg)
        if tid == "排行榜":
            return self.get_rank()
        if tid == '动态':
            return self.get_dynamic(pg=pg)

        # Percent-encode the keyword so characters such as '&', '#' or '+'
        # cannot break out of the `keyword` query parameter.
        url = 'https://api.bilibili.com/x/web-interface/search/type?search_type=video&keyword={0}&page={1}'.format(
            quote(tid, safe=''), pg)
        jo = self._get_json(url)
        if jo.get('code') != 0:
            # Single retry, as in the original implementation.
            jo = self._get_json(url)

        # `data` / `result` may be missing on failure or on an empty search.
        hits = (jo.get('data') or {}).get('result') or []
        videos = []
        for vod in hits:
            pic = vod['pic'].strip()
            if pic.startswith('//'):
                # Complete protocol-relative URLs; leave absolute ones alone.
                pic = 'https:' + pic
            videos.append(self._vod_entry(
                vod['aid'],
                tid + ":" + self._strip_em(vod['title'].strip()),
                pic,
                vod['duration'],
            ))
        return self._paged(videos, pg)

    def cleanSpace(self, str):
        """Return *str* with newlines, tabs, carriage returns and spaces removed."""
        return str.replace('\n', '').replace('\t', '').replace('\r', '').replace(' ', '')

    def detailContent(self, array):
        """Return detail data for the video whose aid is ``array[0]``.

        Each entry of the video's ``pages`` becomes one playable item encoded
        as ``<part>$<aid>_<cid>#`` inside ``vod_play_url``; playerContent()
        later splits the ``<aid>_<cid>`` id on ``_``.

        Returns:
            ``{'list': [vod]}``, or ``{'list': []}`` when the response has no
            ``data`` payload.
        """
        aid = array[0]
        url = "https://api.bilibili.com/x/web-interface/view?aid={0}".format(aid)
        rsp = self.fetch(url, headers=self.header, cookies=self.getCookie())
        jo = json.loads(rsp.text).get('data')
        if not jo:
            return {'list': []}

        owner_name = jo['owner']['name']
        vod = {
            "vod_id": aid,
            "vod_name": self._strip_em(jo['title']),
            "vod_pic": jo['pic'],
            "type_name": jo['tname'],
            "vod_year": "",
            "vod_area": "bilidanmu",
            "vod_remarks": "",
            "vod_actor": owner_name,
            "vod_director": owner_name,
            "vod_content": jo['desc']
        }
        # The trailing '#' after every item (including the last) is kept
        # so the produced string is identical to the original's.
        vod['vod_play_from'] = 'B站'
        vod['vod_play_url'] = ''.join(
            '{0}${1}_{2}#'.format(page['part'], aid, page['cid'])
            for page in jo['pages']
        )
        return {'list': [vod]}

    def searchContent(self, key, quick):
        """Search for *key* by reusing categoryContent() on page 1.

        *quick* is not used. Returns ``{'list': [...]}``; the list is empty
        when the delegated call produced no ``list`` key.
        """
        search = self.categoryContent(tid=key, pg=1, filter=None, extend=None)
        return {'list': search.get('list', [])}

    def playerContent(self, flag, id, vipFlags):
        """Resolve a playable URL for an ``<aid>_<cid>`` id.

        Among the returned ``durl`` segments the one with the largest
        ``size`` is chosen (the first one on ties). *flag* and *vipFlags*
        are not used.

        Returns:
            dict with ``parse``, ``playUrl``, ``url``, ``header`` and
            ``contentType``; ``url`` is ``''`` when no segment is available.
        """
        ids = id.split("_")
        # NOTE(review): the literal `%20%20` in front of the cid is kept
        # byte-for-byte from the original; it looks accidental — confirm.
        api = 'https://api.bilibili.com:443/x/player/playurl?avid={0}&cid=%20%20{1}&qn=112'.format(ids[0], ids[1])
        segments = (self._get_json(api).get('data') or {}).get('durl') or []

        url = ''
        if segments:
            url = max(segments, key=lambda seg: int(seg['size']))['url']

        return {
            "parse": 0,
            "playUrl": '',
            "url": url,
            "header": {
                "Referer": "https://www.bilibili.com",
                "User-Agent": "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/100.0.4896.127 Safari/537.36"
            },
            "contentType": 'video/x-flv'
        }

    def localProxy(self, param):
        """Return a fixed ``[status, content_type, action, body]`` response.

        *param* is not used.
        """
        # The original returned an undefined name `action` (NameError on
        # every call). NOTE(review): an empty placeholder is used here —
        # confirm which fields the caller expects in this slot.
        action = {}
        return [200, "video/MP2T", action, ""]
|