mirror of
https://github.com/letian1650/N3RD.git
synced 2025-01-26 12:54:50 +08:00
564 lines
19 KiB
Python
564 lines
19 KiB
Python
|
# coding=utf-8
|
|||
|
# !/usr/bin/python
|
|||
|
import sys
|
|||
|
|
|||
|
sys.path.append('..')
|
|||
|
from base.spider import Spider
|
|||
|
# from base.htmlParser import jsoup
|
|||
|
import json
|
|||
|
from requests import session, utils
|
|||
|
import os
|
|||
|
import time
|
|||
|
import base64
|
|||
|
|
|||
|
# def main3():
|
|||
|
# html = """
|
|||
|
# <div>
|
|||
|
# <p>内容1<span id='exd1'>我不获取的内容1</span><span id='exd2'>我不获取的内容2</span>内容2</p>
|
|||
|
# </div>
|
|||
|
# """
|
|||
|
# jsp = jsoup('https://www.cnblogs.com/lizhibk/p/8623543.html')
|
|||
|
# a = jsp.pdfh(html, 'div p:eq(0)--span&&Text')
|
|||
|
# print(a)
|
|||
|
# return a
|
|||
|
|
|||
|
class Spider(Spider): # 元类 默认的元类 type
|
|||
|
def getName(self):
|
|||
|
return "哔哩影视"
|
|||
|
|
|||
|
def init(self, extend=""):
|
|||
|
print("============{0}============".format(extend))
|
|||
|
pass
|
|||
|
|
|||
|
def isVideoFormat(self, url):
|
|||
|
pass
|
|||
|
|
|||
|
def manualVideoCheck(self):
|
|||
|
pass
|
|||
|
|
|||
|
def homeContent(self, filter):
|
|||
|
result = {}
|
|||
|
cateManual = {
|
|||
|
# main3():"1",
|
|||
|
"番剧": "1",
|
|||
|
"国创": "4",
|
|||
|
"电影": "2",
|
|||
|
"电视剧": "5",
|
|||
|
"纪录片": "3",
|
|||
|
"综艺": "7",
|
|||
|
"全部": "全部",
|
|||
|
"追番": "追番",
|
|||
|
"追剧": "追剧",
|
|||
|
"时间表": "时间表",
|
|||
|
|
|||
|
}
|
|||
|
classes = []
|
|||
|
for k in cateManual:
|
|||
|
classes.append({
|
|||
|
'type_name': k,
|
|||
|
'type_id': cateManual[k]
|
|||
|
})
|
|||
|
result['class'] = classes
|
|||
|
if (filter):
|
|||
|
result['filters'] = self.config['filter']
|
|||
|
return result
|
|||
|
|
|||
|
cookies = ''
|
|||
|
userid = ''
|
|||
|
|
|||
|
def getCookie(self):
|
|||
|
# --------↓↓↓↓↓↓↓------在下方cookies_str后的双引号内填写-------↓↓↓↓↓↓↓--------
|
|||
|
cookies_str = ""
|
|||
|
if cookies_str:
|
|||
|
cookies = dict([co.strip().split('=', 1) for co in cookies_str.split(';')])
|
|||
|
bili_jct = cookies['bili_jct']
|
|||
|
SESSDATA = cookies['SESSDATA']
|
|||
|
DedeUserID = cookies['DedeUserID']
|
|||
|
cookies_jar = {"bili_jct": bili_jct,
|
|||
|
'SESSDATA': SESSDATA,
|
|||
|
'DedeUserID': DedeUserID
|
|||
|
}
|
|||
|
rsp = session()
|
|||
|
rsp.cookies = cookies_jar
|
|||
|
content = self.fetch("https://api.bilibili.com/x/web-interface/nav", cookies=rsp.cookies)
|
|||
|
res = json.loads(content.text)
|
|||
|
if res["code"] == 0:
|
|||
|
self.cookies = rsp.cookies
|
|||
|
self.userid = res["data"].get('mid')
|
|||
|
return rsp.cookies
|
|||
|
rsp = self.fetch("https://www.bilibili.com/")
|
|||
|
self.cookies = rsp.cookies
|
|||
|
return rsp.cookies
|
|||
|
|
|||
|
# 将超过10000的数字换成成以万和亿为单位
|
|||
|
def zh(self, num):
|
|||
|
if int(num) >= 100000000:
|
|||
|
p = round(float(num) / float(100000000), 1)
|
|||
|
p = str(p) + '亿'
|
|||
|
else:
|
|||
|
if int(num) >= 10000:
|
|||
|
p = round(float(num) / float(10000), 1)
|
|||
|
p = str(p) + '万'
|
|||
|
else:
|
|||
|
p = str(num)
|
|||
|
return p
|
|||
|
|
|||
|
def homeVideoContent(self):
|
|||
|
result = {}
|
|||
|
videos = self.get_rank(1)['list'][0:5]
|
|||
|
for i in [4, 2, 5, 3, 7]:
|
|||
|
videos += self.get_rank2(i)['list'][0:5]
|
|||
|
result['list'] = videos
|
|||
|
return result
|
|||
|
|
|||
|
def get_rank(self, tid):
|
|||
|
result = {}
|
|||
|
url = 'https://api.bilibili.com/pgc/web/rank/list?season_type={0}&day=3'.format(tid)
|
|||
|
rsp = self.fetch(url, cookies=self.cookies)
|
|||
|
content = rsp.text
|
|||
|
jo = json.loads(content)
|
|||
|
if jo['code'] == 0:
|
|||
|
videos = []
|
|||
|
vodList = jo['result']['list']
|
|||
|
for vod in vodList:
|
|||
|
aid = str(vod['season_id']).strip()
|
|||
|
title = vod['title'].strip()
|
|||
|
img = vod['cover'].strip()
|
|||
|
remark = vod['new_ep']['index_show']
|
|||
|
videos.append({
|
|||
|
"vod_id": aid,
|
|||
|
"vod_name": title,
|
|||
|
"vod_pic": img,
|
|||
|
"vod_remarks": remark
|
|||
|
})
|
|||
|
result['list'] = videos
|
|||
|
result['page'] = 1
|
|||
|
result['pagecount'] = 1
|
|||
|
result['limit'] = 90
|
|||
|
result['total'] = 999999
|
|||
|
return result
|
|||
|
|
|||
|
def get_rank2(self, tid):
|
|||
|
result = {}
|
|||
|
url = 'https://api.bilibili.com/pgc/season/rank/web/list?season_type={0}&day=3'.format(tid)
|
|||
|
rsp = self.fetch(url, cookies=self.cookies)
|
|||
|
content = rsp.text
|
|||
|
jo = json.loads(content)
|
|||
|
if jo['code'] == 0:
|
|||
|
videos = []
|
|||
|
vodList = jo['data']['list']
|
|||
|
for vod in vodList:
|
|||
|
aid = str(vod['season_id']).strip()
|
|||
|
title = vod['title'].strip()
|
|||
|
img = vod['cover'].strip()
|
|||
|
remark = vod['new_ep']['index_show']
|
|||
|
videos.append({
|
|||
|
"vod_id": aid,
|
|||
|
"vod_name": title,
|
|||
|
"vod_pic": img,
|
|||
|
"vod_remarks": remark
|
|||
|
})
|
|||
|
result['list'] = videos
|
|||
|
result['page'] = 1
|
|||
|
result['pagecount'] = 1
|
|||
|
result['limit'] = 90
|
|||
|
result['total'] = 999999
|
|||
|
return result
|
|||
|
|
|||
|
def get_zhui(self, pg, mode):
|
|||
|
result = {}
|
|||
|
if len(self.cookies) <= 0:
|
|||
|
self.getCookie()
|
|||
|
url = 'https://api.bilibili.com/x/space/bangumi/follow/list?type={2}&follow_status=0&pn={1}&ps=10&vmid={0}'.format(self.userid, pg, mode)
|
|||
|
rsp = self.fetch(url, cookies=self.cookies)
|
|||
|
content = rsp.text
|
|||
|
jo = json.loads(content)
|
|||
|
videos = []
|
|||
|
vodList = jo['data']['list']
|
|||
|
for vod in vodList:
|
|||
|
aid = str(vod['season_id']).strip()
|
|||
|
title = vod['title']
|
|||
|
img = vod['cover'].strip()
|
|||
|
remark = vod['new_ep']['index_show'].strip()
|
|||
|
videos.append({
|
|||
|
"vod_id": aid,
|
|||
|
"vod_name": title,
|
|||
|
"vod_pic": img,
|
|||
|
"vod_remarks": remark
|
|||
|
})
|
|||
|
result['list'] = videos
|
|||
|
result['page'] = pg
|
|||
|
result['pagecount'] = 9999
|
|||
|
result['limit'] = 90
|
|||
|
result['total'] = 999999
|
|||
|
return result
|
|||
|
|
|||
|
def get_all(self, tid, pg, order, season_status, extend):
|
|||
|
result = {}
|
|||
|
if len(self.cookies) <= 0:
|
|||
|
self.getCookie()
|
|||
|
url = 'https://api.bilibili.com/pgc/season/index/result?order={2}&pagesize=20&type=1&season_type={0}&page={1}&season_status={3}'.format(tid, pg, order, season_status)
|
|||
|
rsp = self.fetch(url, cookies=self.cookies)
|
|||
|
content = rsp.text
|
|||
|
jo = json.loads(content)
|
|||
|
videos = []
|
|||
|
vodList = jo['data']['list']
|
|||
|
for vod in vodList:
|
|||
|
aid = str(vod['season_id']).strip()
|
|||
|
title = vod['title']
|
|||
|
img = vod['cover'].strip()
|
|||
|
remark = vod['index_show'].strip()
|
|||
|
videos.append({
|
|||
|
"vod_id": aid,
|
|||
|
"vod_name": title,
|
|||
|
"vod_pic": img,
|
|||
|
"vod_remarks": remark
|
|||
|
})
|
|||
|
result['list'] = videos
|
|||
|
result['page'] = pg
|
|||
|
result['pagecount'] = 9999
|
|||
|
result['limit'] = 90
|
|||
|
result['total'] = 999999
|
|||
|
return result
|
|||
|
|
|||
|
def get_timeline(self, tid, pg):
|
|||
|
result = {}
|
|||
|
url = 'https://api.bilibili.com/pgc/web/timeline/v2?season_type={0}&day_before=2&day_after=4'.format(tid)
|
|||
|
rsp = self.fetch(url, cookies=self.cookies)
|
|||
|
content = rsp.text
|
|||
|
jo = json.loads(content)
|
|||
|
if jo['code'] == 0:
|
|||
|
videos1 = []
|
|||
|
vodList = jo['result']['latest']
|
|||
|
for vod in vodList:
|
|||
|
aid = str(vod['season_id']).strip()
|
|||
|
title = vod['title'].strip()
|
|||
|
img = vod['cover'].strip()
|
|||
|
remark = vod['pub_index'] + ' ' + vod['follows'].replace('系列', '')
|
|||
|
videos1.append({
|
|||
|
"vod_id": aid,
|
|||
|
"vod_name": title,
|
|||
|
"vod_pic": img,
|
|||
|
"vod_remarks": remark
|
|||
|
})
|
|||
|
videos2 = []
|
|||
|
for i in range(0, 7):
|
|||
|
vodList = jo['result']['timeline'][i]['episodes']
|
|||
|
for vod in vodList:
|
|||
|
if str(vod['published']) == "0":
|
|||
|
aid = str(vod['season_id']).strip()
|
|||
|
title = str(vod['title']).strip()
|
|||
|
img = str(vod['cover']).strip()
|
|||
|
date = str(time.strftime("%m-%d %H:%M", time.localtime(vod['pub_ts'])))
|
|||
|
remark = date + " " + vod['pub_index']
|
|||
|
videos2.append({
|
|||
|
"vod_id": aid,
|
|||
|
"vod_name": title,
|
|||
|
"vod_pic": img,
|
|||
|
"vod_remarks": remark
|
|||
|
})
|
|||
|
result['list'] = videos2 + videos1
|
|||
|
result['page'] = 1
|
|||
|
result['pagecount'] = 1
|
|||
|
result['limit'] = 90
|
|||
|
result['total'] = 999999
|
|||
|
return result
|
|||
|
|
|||
|
def categoryContent(self, tid, pg, filter, extend):
|
|||
|
result = {}
|
|||
|
if len(self.cookies) <= 0:
|
|||
|
self.getCookie()
|
|||
|
if tid == "1":
|
|||
|
return self.get_rank(tid=tid)
|
|||
|
elif tid in {"2", "3", "4", "5", "7"}:
|
|||
|
return self.get_rank2(tid=tid)
|
|||
|
elif tid == "全部":
|
|||
|
tid = '1' # 全部界面默认展示最多播放的番剧
|
|||
|
order = '2'
|
|||
|
season_status = '-1'
|
|||
|
if 'tid' in extend:
|
|||
|
tid = extend['tid']
|
|||
|
if 'order' in extend:
|
|||
|
order = extend['order']
|
|||
|
if 'season_status' in extend:
|
|||
|
season_status = extend['season_status']
|
|||
|
return self.get_all(tid, pg, order, season_status, extend)
|
|||
|
elif tid == "追番":
|
|||
|
return self.get_zhui(pg, 1)
|
|||
|
elif tid == "追剧":
|
|||
|
return self.get_zhui(pg, 2)
|
|||
|
elif tid == "时间表":
|
|||
|
tid = 1
|
|||
|
if 'tid' in extend:
|
|||
|
tid = extend['tid']
|
|||
|
return self.get_timeline(tid, pg)
|
|||
|
else:
|
|||
|
result = self.searchContent(key=tid, quick="false")
|
|||
|
return result
|
|||
|
|
|||
|
def cleanSpace(self, str):
|
|||
|
return str.replace('\n', '').replace('\t', '').replace('\r', '').replace(' ', '')
|
|||
|
|
|||
|
def detailContent(self, array):
|
|||
|
aid = array[0]
|
|||
|
url = "https://api.bilibili.com/pgc/view/web/season?season_id={0}".format(aid)
|
|||
|
rsp = self.fetch(url, headers=self.header)
|
|||
|
jRoot = json.loads(rsp.text)
|
|||
|
jo = jRoot['result']
|
|||
|
id = jo['season_id']
|
|||
|
title = jo['title']
|
|||
|
pic = jo['cover']
|
|||
|
# areas = jo['areas']['name'] 改bilidanmu显示弹幕
|
|||
|
typeName = jo['share_sub_title']
|
|||
|
date = jo['publish']['pub_time'][0:4]
|
|||
|
dec = jo['evaluate']
|
|||
|
remark = jo['new_ep']['desc']
|
|||
|
stat = jo['stat']
|
|||
|
# 演员和导演框展示视频状态,包括以下内容:
|
|||
|
status = "弹幕: " + self.zh(stat['danmakus']) + " 点赞: " + self.zh(stat['likes']) + " 投币: " + self.zh(
|
|||
|
stat['coins']) + " 追番追剧: " + self.zh(stat['favorites'])
|
|||
|
if 'rating' in jo:
|
|||
|
score = "评分: " + str(jo['rating']['score']) + ' ' + jo['subtitle']
|
|||
|
else:
|
|||
|
score = "暂无评分" + ' ' + jo['subtitle']
|
|||
|
vod = {
|
|||
|
"vod_id": id,
|
|||
|
"vod_name": title,
|
|||
|
"vod_pic": pic,
|
|||
|
"type_name": typeName,
|
|||
|
"vod_year": date,
|
|||
|
"vod_area": "bilidanmu",
|
|||
|
"vod_remarks": remark,
|
|||
|
"vod_actor": status,
|
|||
|
"vod_director": score,
|
|||
|
"vod_content": dec
|
|||
|
}
|
|||
|
ja = jo['episodes']
|
|||
|
playUrl = ''
|
|||
|
for tmpJo in ja:
|
|||
|
eid = tmpJo['id']
|
|||
|
cid = tmpJo['cid']
|
|||
|
part = tmpJo['title'].replace("#", "-")
|
|||
|
playUrl = playUrl + '{0}${1}_{2}#'.format(part, eid, cid)
|
|||
|
|
|||
|
vod['vod_play_from'] = 'B站'
|
|||
|
vod['vod_play_url'] = playUrl
|
|||
|
|
|||
|
result = {
|
|||
|
'list': [
|
|||
|
vod
|
|||
|
]
|
|||
|
}
|
|||
|
return result
|
|||
|
|
|||
|
def searchContent(self, key, quick):
|
|||
|
if len(self.cookies) <= 0:
|
|||
|
self.getCookie()
|
|||
|
url1 = 'https://api.bilibili.com/x/web-interface/search/type?search_type=media_bangumi&keyword={0}'.format(
|
|||
|
key) # 番剧搜索
|
|||
|
rsp1 = self.fetch(url1, cookies=self.cookies)
|
|||
|
content1 = rsp1.text
|
|||
|
jo1 = json.loads(content1)
|
|||
|
rs1 = jo1['data']
|
|||
|
url2 = 'https://api.bilibili.com/x/web-interface/search/type?search_type=media_ft&keyword={0}'.format(
|
|||
|
key) # 影视搜索
|
|||
|
rsp2 = self.fetch(url2, cookies=self.cookies)
|
|||
|
content2 = rsp2.text
|
|||
|
jo2 = json.loads(content2)
|
|||
|
rs2 = jo2['data']
|
|||
|
videos = []
|
|||
|
if rs1['numResults'] == 0:
|
|||
|
vodList = jo2['data']['result']
|
|||
|
elif rs2['numResults'] == 0:
|
|||
|
vodList = jo1['data']['result']
|
|||
|
else:
|
|||
|
vodList = jo1['data']['result'] + jo2['data']['result']
|
|||
|
for vod in vodList:
|
|||
|
aid = str(vod['season_id']).strip()
|
|||
|
title = key + '➢' + vod['title'].strip().replace("<em class=\"keyword\">", "").replace("</em>", "")
|
|||
|
img = vod['cover'].strip() # vod['eps'][0]['cover'].strip()原来的错误写法
|
|||
|
remark = vod['index_show']
|
|||
|
videos.append({
|
|||
|
"vod_id": aid,
|
|||
|
"vod_name": title,
|
|||
|
"vod_pic": img,
|
|||
|
"vod_remarks": remark
|
|||
|
})
|
|||
|
result = {
|
|||
|
'list': videos
|
|||
|
}
|
|||
|
return result
|
|||
|
|
|||
|
def playerContent(self, flag, id, vipFlags):
|
|||
|
result = {}
|
|||
|
ids = id.split("_")
|
|||
|
header = {
|
|||
|
"Referer": "https://www.bilibili.com",
|
|||
|
"User-Agent": "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/100.0.4896.127 Safari/537.36"
|
|||
|
}
|
|||
|
url = 'https://api.bilibili.com/pgc/player/web/playurl?qn=116&ep_id={0}&cid={1}'.format(ids[0], ids[1])
|
|||
|
if len(self.cookies) <= 0:
|
|||
|
self.getCookie()
|
|||
|
rsp = self.fetch(url, cookies=self.cookies, headers=header)
|
|||
|
jRoot = json.loads(rsp.text)
|
|||
|
if jRoot['message'] != 'success':
|
|||
|
print("需要大会员权限才能观看")
|
|||
|
return {}
|
|||
|
jo = jRoot['result']
|
|||
|
ja = jo['durl']
|
|||
|
maxSize = -1
|
|||
|
position = -1
|
|||
|
for i in range(len(ja)):
|
|||
|
tmpJo = ja[i]
|
|||
|
if maxSize < int(tmpJo['size']):
|
|||
|
maxSize = int(tmpJo['size'])
|
|||
|
position = i
|
|||
|
|
|||
|
url = ''
|
|||
|
if len(ja) > 0:
|
|||
|
if position == -1:
|
|||
|
position = 0
|
|||
|
url = ja[position]['url']
|
|||
|
|
|||
|
result["parse"] = 0
|
|||
|
result["playUrl"] = ''
|
|||
|
result["url"] = url
|
|||
|
result["header"] = {
|
|||
|
"Referer": "https://www.bilibili.com",
|
|||
|
"User-Agent": "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/100.0.4896.127 Safari/537.36"
|
|||
|
}
|
|||
|
result["contentType"] = 'video/x-flv'
|
|||
|
return result
|
|||
|
|
|||
|
config = {
|
|||
|
"player": {},
|
|||
|
"filter": {
|
|||
|
"全部": [
|
|||
|
{
|
|||
|
"key": "tid",
|
|||
|
"name": "分类",
|
|||
|
"value": [{
|
|||
|
"n": "番剧",
|
|||
|
"v": "1"
|
|||
|
},
|
|||
|
{
|
|||
|
"n": "国创",
|
|||
|
"v": "4"
|
|||
|
},
|
|||
|
|
|||
|
{
|
|||
|
"n": "电影",
|
|||
|
"v": "2"
|
|||
|
},
|
|||
|
{
|
|||
|
"n": "电视剧",
|
|||
|
"v": "5"
|
|||
|
},
|
|||
|
{
|
|||
|
"n": "记录片",
|
|||
|
"v": "3"
|
|||
|
},
|
|||
|
{
|
|||
|
"n": "综艺",
|
|||
|
"v": "7"
|
|||
|
}
|
|||
|
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"key": "order",
|
|||
|
"name": "排序",
|
|||
|
"value": [
|
|||
|
|
|||
|
{
|
|||
|
"n": "播放数量",
|
|||
|
"v": "2"
|
|||
|
},
|
|||
|
|
|||
|
{
|
|||
|
"n": "更新时间",
|
|||
|
"v": "0"
|
|||
|
},
|
|||
|
|
|||
|
{
|
|||
|
"n": "最高评分",
|
|||
|
"v": "4"
|
|||
|
},
|
|||
|
{
|
|||
|
"n": "弹幕数量",
|
|||
|
"v": "1"
|
|||
|
},
|
|||
|
{
|
|||
|
"n": "追看人数",
|
|||
|
"v": "3"
|
|||
|
},
|
|||
|
|
|||
|
{
|
|||
|
"n": "开播时间",
|
|||
|
"v": "5"
|
|||
|
},
|
|||
|
{
|
|||
|
"n": "上映时间",
|
|||
|
"v": "6"
|
|||
|
},
|
|||
|
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"key": "season_status",
|
|||
|
"name": "付费",
|
|||
|
"value": [
|
|||
|
{
|
|||
|
"n": "全部",
|
|||
|
"v": "-1"
|
|||
|
},
|
|||
|
{
|
|||
|
"n": "免费",
|
|||
|
"v": "1"
|
|||
|
},
|
|||
|
|
|||
|
{
|
|||
|
"n": "付费",
|
|||
|
"v": "2%2C6"
|
|||
|
},
|
|||
|
|
|||
|
{
|
|||
|
"n": "大会员",
|
|||
|
"v": "4%2C6"
|
|||
|
},
|
|||
|
|
|||
|
]
|
|||
|
},
|
|||
|
],
|
|||
|
|
|||
|
|
|||
|
"时间表": [{
|
|||
|
"key": "tid",
|
|||
|
"name": "分类",
|
|||
|
"value": [
|
|||
|
|
|||
|
{
|
|||
|
"n": "番剧",
|
|||
|
"v": "1"
|
|||
|
},
|
|||
|
|
|||
|
{
|
|||
|
"n": "国创",
|
|||
|
"v": "4"
|
|||
|
},
|
|||
|
|
|||
|
]
|
|||
|
},
|
|||
|
],
|
|||
|
}
|
|||
|
}
|
|||
|
|
|||
|
|
|||
|
header = {
|
|||
|
"Referer": "https://www.bilibili.com",
|
|||
|
"User-Agent": 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/86.0.4240.198 Safari/537.36'
|
|||
|
}
|
|||
|
|
|||
|
def localProxy(self, param):
|
|||
|
return [200, "video/MP2T", action, ""]
|