123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543 |
- # coding=utf-8
- # !/usr/bin/python
- import sys
- from base.spider import Spider
- import json
- import threading
- import requests
- from requests import session
- import time
- sys.path.append('..')
- class Spider(Spider):
- def getDependence(self):
- return ['py_bilibili']
- def getName(self):
- return "哔哩影视"
- def init(self, extend=""):
- #self.bilibili = extend[0]
- #print("============{0}============".format(extend))
- pass
- def isVideoFormat(self, url):
- pass
- def manualVideoCheck(self):
- pass
- # 主页
- def homeContent(self, filter):
- result = {}
- cateManual = {
- "番剧": "1",
- "国创": "4",
- "电影": "2",
- "电视剧": "5",
- "纪录片": "3",
- "综艺": "7",
- "全部": "全部",
- # "追番追剧": "追番追剧",
- "时间表": "时间表",
- # ————————以下可自定义关键字,结果以搜索方式展示————————
- # "奥特曼": "奥特曼"
- }
- classes = []
- for k in cateManual:
- classes.append({
- 'type_name': k,
- 'type_id': cateManual[k]
- })
- result['class'] = classes
- if filter:
- result['filters'] = self.config['filter']
- return result
- # 用户cookies
- cookies = ''
- userid = ''
- csrf = ''
- def getCookie(self):
- # self.cookies = self.bilibili.getCookie()
- # self.userid = self.bilibili.userid
- # self.csrf = self.bilibili.csrf
- # return self.cookies
- # 单用此文件,请注释掉上面4行,取消以下注释,在下方raw_cookie_line后的双引号内填写cookies/外链
- import http.cookies
- raw_cookie_line = ""
- if raw_cookie_line.startswith('http'):
- raw_cookie_line = self.fetch(raw_cookie_line).text
- simple_cookie = http.cookies.SimpleCookie(raw_cookie_line)
- cookie_jar = requests.cookies.RequestsCookieJar()
- cookie_jar.update(simple_cookie)
- rsp = session()
- rsp.cookies = cookie_jar
- content = self.fetch("https://api.bilibili.com/x/web-interface/nav", cookies=rsp.cookies)
- res = json.loads(content.text)
- if res["code"] == 0:
- self.cookies = rsp.cookies
- self.userid = res["data"].get('mid')
- self.csrf = rsp.cookies['bili_jct']
- return cookie_jar
- # 格式化图片,默认16:9的webp格式,降低内存占用
- def format_img(self, img):
- img += "@640w_360h_1c_100q.webp" # 格式,[jpg/png/gif]@{width}w_{high}h_{is_cut}c_{quality}q.{format}
- return img
- # 将没有page_size参数的页面分页
- def pagination(self, array, pg):
- page_size = 10 # 默认单页视频数量为10,可自定义
- max_number = page_size * int(pg)
- min_number = max_number - page_size
- return array[min_number:max_number]
- # 记录观看历史
- def post_history(self, aid, cid):
- url = 'https://api.bilibili.com/x/v2/history/report?aid={0}&cid={1}&csrf={2}'.format(aid, cid, self.csrf)
- requests.post(url=url, cookies=self.cookies)
- # 将超过10000的数字换成成以万和亿为单位
- def zh(self, num):
- if int(num) >= 100000000:
- p = round(float(num) / float(100000000), 1)
- p = str(p) + '亿'
- else:
- if int(num) >= 10000:
- p = round(float(num) / float(10000), 1)
- p = str(p) + '万'
- else:
- p = str(num)
- return p
- def homeVideoContent(self):
- result = {}
- videos = self.get_rank(1, 1)['list'][0:2]
- for i in [4, 2, 5, 3, 7]:
- videos += self.get_rank2(i, 1)['list'][0:2]
- result['list'] = videos
- return result
- def get_rank(self, tid, pg):
- result = {}
- url = 'https://api.bilibili.com/pgc/web/rank/list?season_type={0}&day=3'.format(tid)
- rsp = self.fetch(url, cookies=self.cookies)
- content = rsp.text
- jo = json.loads(content)
- if jo['code'] == 0:
- videos = []
- vodList = jo['result']['list']
- vodList = self.pagination(vodList, pg)
- for vod in vodList:
- aid = str(vod['season_id']).strip()
- title = vod['title'].strip()
- img = vod['cover'].strip()
- remark = vod['new_ep']['index_show']
- videos.append({
- "vod_id": 'ss' + aid,
- "vod_name": title,
- "vod_pic": self.format_img(img),
- "vod_remarks": remark
- })
- result['list'] = videos
- result['page'] = pg
- result['pagecount'] = 9999
- result['limit'] = 90
- result['total'] = 999999
- return result
- def get_rank2(self, tid, pg):
- result = {}
- url = 'https://api.bilibili.com/pgc/season/rank/web/list?season_type={0}&day=3'.format(tid)
- rsp = self.fetch(url, cookies=self.cookies)
- content = rsp.text
- jo = json.loads(content)
- if jo['code'] == 0:
- videos = []
- vodList = jo['data']['list']
- vodList = self.pagination(vodList, pg)
- for vod in vodList:
- aid = str(vod['season_id']).strip()
- title = vod['title'].strip()
- img = vod['ss_horizontal_cover'].strip()
- remark = vod['new_ep']['index_show']
- videos.append({
- "vod_id": aid,
- "vod_name": title,
- "vod_pic": self.format_img(img),
- "vod_remarks": remark
- })
- result['list'] = videos
- result['page'] = pg
- result['pagecount'] = 9999
- result['limit'] = 90
- result['total'] = 999999
- return result
- def get_zhui(self, pg, mode):
- result = {}
- if len(self.cookies) <= 0:
- self.getCookie()
- url = 'https://api.bilibili.com/x/space/bangumi/follow/list?type={2}&follow_status=0&pn={1}&ps=10&vmid={0}'.format(
- self.userid, pg, mode)
- rsp = self.fetch(url, cookies=self.cookies)
- content = rsp.text
- jo = json.loads(content)
- videos = []
- vodList = jo['data']['list']
- for vod in vodList:
- aid = str(vod['season_id']).strip()
- title = vod['title']
- img = vod['cover'].strip()
- remark = vod['new_ep']['index_show'].strip()
- videos.append({
- "vod_id": aid,
- "vod_name": title,
- "vod_pic": self.format_img(img),
- "vod_remarks": remark
- })
- result['list'] = videos
- result['page'] = pg
- result['pagecount'] = 9999
- result['limit'] = 90
- result['total'] = 999999
- return result
- def get_all(self, tid, pg, order, season_status):
- result = {}
- if len(self.cookies) <= 0:
- self.getCookie()
- url = 'https://api.bilibili.com/pgc/season/index/result?order={2}&pagesize=10&type=1&season_type={0}&page={1}&season_status={3}'.format(
- tid, pg, order, season_status)
- rsp = self.fetch(url, cookies=self.cookies)
- content = rsp.text
- jo = json.loads(content)
- videos = []
- vodList = jo['data']['list']
- for vod in vodList:
- aid = str(vod['season_id']).strip()
- title = vod['title']
- img = vod['cover'].strip()
- remark = vod['index_show'].strip()
- videos.append({
- "vod_id": aid,
- "vod_name": title,
- "vod_pic": self.format_img(img),
- "vod_remarks": remark
- })
- result['list'] = videos
- result['page'] = pg
- result['pagecount'] = 9999
- result['limit'] = 90
- result['total'] = 999999
- return result
- def get_timeline(self, tid, pg):
- result = {}
- url = 'https://api.bilibili.com/pgc/web/timeline/v2?season_type={0}&day_before=2&day_after=4'.format(tid)
- rsp = self.fetch(url, cookies=self.cookies)
- content = rsp.text
- jo = json.loads(content)
- if jo['code'] == 0:
- videos1 = []
- vodList = jo['result']['latest']
- for vod in vodList:
- aid = str(vod['season_id']).strip()
- title = vod['title'].strip()
- img = vod['cover'].strip()
- remark = vod['pub_index'] + ' ' + vod['follows'].replace('系列', '')
- videos1.append({
- "vod_id": aid,
- "vod_name": title,
- "vod_pic": self.format_img(img),
- "vod_remarks": remark
- })
- videos2 = []
- for i in range(0, 7):
- vodList = jo['result']['timeline'][i]['episodes']
- for vod in vodList:
- if str(vod['published']) == "0":
- aid = str(vod['season_id']).strip()
- title = str(vod['title']).strip()
- img = str(vod['cover']).strip()
- date = str(time.strftime("%m-%d %H:%M", time.localtime(vod['pub_ts'])))
- remark = date + " " + vod['pub_index']
- videos2.append({
- "vod_id": aid,
- "vod_name": title,
- "vod_pic": self.format_img(img),
- "vod_remarks": remark
- })
- result['list'] = self.pagination(videos2 + videos1, pg)
- result['page'] = pg
- result['pagecount'] = 9999
- result['limit'] = 90
- result['total'] = 999999
- return result
- def categoryContent(self, tid, pg, filter, extend):
- if len(self.cookies) <= 0:
- self.getCookie()
- if tid == "1":
- return self.get_rank(tid=tid, pg=pg)
- elif tid in {"2", "3", "4", "5", "7"}:
- return self.get_rank2(tid=tid, pg=pg)
- elif tid == "全部":
- tid = '1'
- order = '2'
- season_status = '-1'
- if 'tid' in extend:
- tid = extend['tid']
- if 'order' in extend:
- order = extend['order']
- if 'season_status' in extend:
- season_status = extend['season_status']
- return self.get_all(tid, pg, order, season_status)
- elif tid == "追番追剧":
- mode = '1'
- if 'mode' in extend:
- mode = extend['mode']
- return self.get_zhui(pg, mode)
- elif tid == "时间表":
- tid = '1'
- if 'tid' in extend:
- tid = extend['tid']
- return self.get_timeline(tid, pg)
- else:
- result = self.searchContent(key=tid, quick="false")
- return result
- def cleanSpace(self, str):
- return str.replace('\n', '').replace('\t', '').replace('\r', '').replace(' ', '')
- con = threading.Condition()
- def get_season(self, n, nList, fromList, urlList, season_id, season_title):
- url = 'https://api.bilibili.com/pgc/view/web/season?season_id={0}'.format(season_id)
- try:
- rsp = self.fetch(url, headers=self.header, cookies=self.cookies)
- season = json.loads(rsp.text)
- except:
- with self.con:
- nList.remove(n)
- self.con.notify_all()
- return
- episode = season['result']['episodes']
- if len(episode) == 0:
- with self.con:
- nList.remove(n)
- self.con.notify_all()
- return
- playUrl = ''
- for tmpJo in episode:
- aid = tmpJo['aid']
- cid = tmpJo['cid']
- part = tmpJo['title'].replace("#", "﹟").replace("$", "﹩")
- if tmpJo['badge'] != '':
- part += ' 【' + tmpJo['badge'] + '】'
- part += tmpJo['long_title'].replace("#", "﹟").replace("$", "﹩")
- playUrl += '{0}${1}_{2}_bangumi#'.format(part, aid, cid)
- with self.con:
- while True:
- if n == nList[0]:
- fromList.append(season_title)
- urlList.append(playUrl)
- nList.remove(n)
- self.con.notify_all()
- break
- else:
- self.con.wait()
- def detailContent(self, array):
- aid = array[0]
- if 'ep' in aid:
- aid = 'ep_id=' + aid.replace('ep', '')
- elif 'ss' in aid:
- aid = 'season_id=' + aid.replace('ss', '')
- else:
- aid = 'season_id=' + aid
- url = "https://api.bilibili.com/pgc/view/web/season?{0}".format(aid)
- rsp = self.fetch(url, headers=self.header, cookies=self.cookies)
- jRoot = json.loads(rsp.text)
- jo = jRoot['result']
- id = jo['season_id']
- title = jo['title']
- s_title = jo['season_title']
- img = jo['cover']
- typeName = jo['share_sub_title']
- date = jo['publish']['pub_time'][0:4]
- dec = jo['evaluate']
- remark = jo['new_ep']['desc']
- stat = jo['stat']
- status = "弹幕: " + self.zh(stat['danmakus']) + " 点赞: " + self.zh(stat['likes']) + " 投币: " + self.zh(
- stat['coins']) + " 追番追剧: " + self.zh(stat['favorites'])
- if 'rating' in jo:
- score = "评分: " + str(jo['rating']['score']) + ' ' + jo['subtitle']
- else:
- score = "暂无评分" + ' ' + jo['subtitle']
- vod = {
- "vod_id": id,
- "vod_name": title,
- "vod_pic": self.format_img(img),
- "type_name": typeName,
- "vod_year": date,
- "vod_area": "bilidanmu",
- "vod_remarks": remark,
- "vod_actor": status,
- "vod_director": score,
- "vod_content": dec
- }
- playUrl = ''
- for tmpJo in jo['episodes']:
- aid = tmpJo['aid']
- cid = tmpJo['cid']
- part = tmpJo['title'].replace("#", "﹟").replace("$", "﹩")
- if tmpJo['badge'] != '':
- part += '【' + tmpJo['badge'] + '】'
- part += tmpJo['long_title'].replace("#", "﹟").replace("$", "﹩")
- playUrl += '{0}${1}_{2}#'.format(part, aid, cid)
- fromList = []
- urlList = []
- if playUrl != '':
- fromList.append(s_title)
- urlList.append(playUrl)
- nList = []
- if len(jo['seasons']) > 1:
- n = 0
- for season in jo['seasons']:
- season_id = season['season_id']
- season_title = season['season_title']
- if season_id == id and len(fromList) > 0:
- isHere = fromList.index(s_title)
- fromList[isHere] = season_title
- continue
- n += 1
- nList.append(n)
- t = threading.Thread(target=self.get_season, args=(n, nList, fromList, urlList, season_id, season_title))
- t.start()
- while True:
- _count = threading.active_count()
- # 计算线程数,不出结果就调大,结果少了就调小
- if _count <= 2:
- break
- vod['vod_play_from'] = '$$$'.join(fromList)
- vod['vod_play_url'] = '$$$'.join(urlList)
- result = {'list': [vod]}
- return result
- def searchContent(self, key, quick):
- if len(self.cookies) <= 0:
- self.getCookie()
- url1 = 'https://api.bilibili.com/x/web-interface/search/type?search_type=media_bangumi&keyword={0}'.format(
- key) # 番剧搜索
- rsp1 = self.fetch(url1, cookies=self.cookies)
- content1 = rsp1.text
- jo1 = json.loads(content1)
- rs1 = jo1['data']
- url2 = 'https://api.bilibili.com/x/web-interface/search/type?search_type=media_ft&keyword={0}'.format(
- key) # 影视搜索
- rsp2 = self.fetch(url2, cookies=self.cookies)
- content2 = rsp2.text
- jo2 = json.loads(content2)
- rs2 = jo2['data']
- videos = []
- if rs1['numResults'] == 0:
- vodList = jo2['data']['result']
- elif rs2['numResults'] == 0:
- vodList = jo1['data']['result']
- else:
- vodList = jo1['data']['result'] + jo2['data']['result']
- for vod in vodList:
- aid = str(vod['season_id']).strip()
- title = key + '➢' + vod['title'].strip().replace("<em class=\"keyword\">", "").replace("</em>", "")
- img = vod['cover'].strip()
- remark = vod['index_show']
- videos.append({
- "vod_id": aid,
- "vod_name": title,
- "vod_pic": self.format_img(img),
- "vod_remarks": remark
- })
- result = {
- 'list': videos
- }
- return result
- def playerContent(self, flag, id, vipFlags):
- if len(self.cookies) <= 0:
- self.getCookie()
- result = {}
- url = ''
- ids = id.split("_")
- if len(ids) < 2:
- return result
- elif len(ids) >= 2:
- aid = ids[0]
- cid = ids[1]
- url = 'https://api.bilibili.com/pgc/player/web/playurl?aid={0}&cid={1}&qn=116'.format(aid, cid)
- self.post_history(aid, cid) # 回传播放历史记录
- rsp = self.fetch(url, cookies=self.cookies, headers=self.header)
- jRoot = json.loads(rsp.text)
- if jRoot['code'] != 0:
- return {}
- jo = jRoot['result']
- ja = jo['durl']
- maxSize = -1
- position = -1
- for i in range(len(ja)):
- tmpJo = ja[i]
- if maxSize < int(tmpJo['size']):
- maxSize = int(tmpJo['size'])
- position = i
- if len(ja) > 0:
- if position == -1:
- position = 0
- url = ja[position]['url']
- result["parse"] = 0
- result["playUrl"] = ''
- result["url"] = url
- result["header"] = {
- "Referer": "https://www.bilibili.com",
- "User-Agent": 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/86.0.4240.198 Safari/537.36'
- }
- result["contentType"] = 'video/x-flv'
- return result
- config = {
- "player": {},
- "filter": {
- "全部": [{"key": "tid", "name": "分类",
- "value": [{"n": "番剧", "v": "1"}, {"n": "国创", "v": "4"}, {"n": "电影", "v": "2"},
- {"n": "电视剧", "v": "5"}, {"n": "记录片", "v": "3"}, {"n": "综艺", "v": "7"}]},
- {"key": "order", "name": "排序",
- "value": [{"n": "播放数量", "v": "2"}, {"n": "更新时间", "v": "0"}, {"n": "最高评分", "v": "4"},
- {"n": "弹幕数量", "v": "1"}, {"n": "追看人数", "v": "3"}, {"n": "开播时间", "v": "5"},
- {"n": "上映时间", "v": "6"}, ]},
- {"key": "season_status", "name": "付费",
- "value": [{"n": "全部", "v": "-1"}, {"n": "免费", "v": "1"},
- {"n": "付费", "v": "2%2C6"}, {"n": "大会员", "v": "4%2C6"}, ]}, ],
- "追番追剧": [{"key": "mode", "name": "分类",
- "value": [{"n": "追番", "v": "1"}, {"n": "追剧", "v": "2"}, ]}, ],
- "时间表": [{"key": "tid", "name": "分类",
- "value": [{"n": "番剧", "v": "1"}, {"n": "国创", "v": "4"}, ]}, ],
- }
- }
- header = {
- "Referer": "https://www.bilibili.com",
- "User-Agent": 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/86.0.4240.198 Safari/537.36'
- }
- def localProxy(self, param):
- return [200, "video/MP2T", action, ""]
|