tvbox/py/xigua.py

412 lines
13 KiB
Python
Raw Normal View History

2023-06-02 18:59:25 +08:00
#coding=utf-8
#!/usr/bin/python
import sys
sys.path.append('..')
from base.spider import Spider
import base64
import math
import json
import requests
import urllib
from urllib import request, parse
import urllib.request
import re
class Spider(Spider):
def getName(self):
return "西瓜视频(个人中心)"
def init(self,extend=""):
self.userid=self.get_userid()
def isVideoFormat(self,url):
pass
def manualVideoCheck(self):
pass
def homeContent(self,filter):
result = {}
cateManual = {
"电视剧":"dianshiju",
"电影":"dianying",
"动漫":"dongman",
"纪录片":"jilupian",
"少儿":"shaoer",
"综艺":"zongyi",
"关注":"follow"
}
if self.userid=='':
del cateManual['关注']
classes = []
for k in cateManual:
classes.append({
'type_name': k,
'type_id': cateManual[k]
})
result['class'] = classes
if (filter):
result['filters'] = self.config['filter']
return result
def homeVideoContent(self):
result = {
'list': []
}
return result
userid=''
def categoryContent(self,tid,pg,filter,extend):
result = {}
idTxt='电视剧'
maximum=17
url = 'https://www.ixigua.com/api/cinema/filterv2/albums'
if tid=='dianying':
idTxt='电影'
elif tid=='zongyi':
idTxt='综艺'
elif tid=='dianshiju':
idTxt='电视剧'
elif tid=='dongman':
idTxt='动漫'
elif tid=='jilupian':
idTxt='纪录片'
elif tid=='shaoer':
idTxt='少儿'
elif tid=='follow':
offset=0 if int(pg)<2 else 20*int(pg)
url='https://www.ixigua.com/api/userv2/follow/list?authorId={0}&sortType=desc&sortType=desc&cursor={1}'.format(self.userid,offset)
maximum=12
videos=[]
if tid!='follow':
offset=0 if int(pg)<2 else 18*int(pg)
self.header['Referer']='https://www.ixigua.com/cinema/filter/'.format(tid)
data=r'{"pinyin":"'+tid+'","filters":{"type":"'+idTxt+'","area":"全部地区","tag":"全部类型","sort":"综合排序","paid":"全部资费"},"offset":'+str(offset)+',"limit":18}'
req = request.Request(url=url, data=bytes(data, encoding='utf8'),headers=self.header, method='POST')
response = request.urlopen(req)
urlTxt=response.read().decode('utf-8')
videos= self.get_list_videoGroup_json(jsonTxt=urlTxt)
else:
rsp=self.fetch(url,headers=self.header)
urlTxt=rsp.text
videos= self.get_list_videoGroup_follow_json(jsonTxt=urlTxt)
numvL = len(videos)
result['list'] = videos
result['page'] = pg
result['pagecount'] = pg if int(numvL)<maximum else int(pg)+1
result['limit'] = numvL
result['total'] = numvL
return result
def get_userid(self):
Url='https://www.ixigua.com/'
rsp=self.fetch(Url,headers=self.header)
htmlTxt = rsp.text
userid= self.get_RegexGetText(Text=htmlTxt,RegexText=r'"identity":{"id":"(\d+?)",',Index=1)
return userid
def detailContent(self,array):
result = {}
aid = array[0].split('###')
key = aid[1]
title = aid[0]
act=aid[2]
logo = aid[3]
Url='https://www.ixigua.com/api/albumv2/details?albumId={0}'.format(key)
if len(aid)==5:
Url='https://www.ixigua.com/api/videov2/author/new_video_list?to_user_id={0}'.format(key)
rsp = self.fetch(Url,headers=self.header)
htmlTxt = rsp.text
typeName=''
area=''
dir=''
cont=''
vip='true'
videoList=[]
if len(aid)==5:
jRoot = json.loads(htmlTxt)
if jRoot['code']!=200:
return result
jo = jRoot['data']
jsonList=jo['videoList']
for value in jsonList:
id="{0}${1}_false".format(value['title'],value.get('group_id'))
videoList.append(id)
dir=title
elif htmlTxt.find('playlist')>2:
jRoot = json.loads(htmlTxt)
if jRoot['code']!=200:
return result
jo = jRoot['data']
jsonList=jo['playlist']
if jsonList is not None:
for value in jsonList:
id="{0}${1}?id={2}_{3}".format(value['title'],value['albumId'],value['episodeId'],vip)
videoList.append(id)
playFrom=[v for v in jo['albumInfo']['tagList']]
typeName='/'.join(playFrom)
playFrom=[v for v in jo['albumInfo']['areaList']]
area='/'.join(playFrom)
playFrom=[v['name'] for v in jo['albumInfo']['directorList']]
dir='/'.join(playFrom)
cont=jo['albumInfo']['intro']
if len(videoList)<1:
return result
vod = {
"vod_id":array[0],
"vod_name":title,
"vod_pic":logo,
"type_name":typeName,
"vod_year":'',
"vod_area":area,
"vod_remarks":"",
"vod_actor":'',
"vod_director":dir,
"vod_content":cont
}
vod['vod_play_from'] = '西瓜'
vod['vod_play_url'] = "#".join(videoList)
result = {
'list':[
vod
]
}
return result
def verifyCode(self):
pass
def searchContent(self,key,quick):
Url='https://www.ixigua.com/api/searchv2/lvideo/{0}/0'.format(urllib.parse.quote(key))
rsp = self.fetch(Url,headers=self.header)
htmlTxt = rsp.text
videos=self.get_list(html=htmlTxt)
'''
Url='https://www.ixigua.com/api/searchv2/user/{0}/10'.format(urllib.parse.quote(key))
rsp = self.fetch(Url,headers=self.header)
htmlTxt1 = rsp.text
videos=self.get_list_user(html=htmlTxt1)
'''
result = {
'list': videos
}
return result
def playerContent(self,flag,id,vipFlags):
result={}
UrlId=id.split('_')
Url='https://www.ixigua.com/{0}'.format(UrlId[0])
headers = {
'User-Agent':'Mozilla/5.0 (Linux; Android 6.0; Nexus 5 Build/MRA58N) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/69.0.3947.100 Mobile Safari/537.36'
}
jx=1 if UrlId[1]=='true' else 0
result["parse"] = 1#0=直接播放,1=解析
result["playUrl"] = ''
result["url"] = Url
result['jx'] = jx#VIP解析
result["header"] =headers
return result
def get_RegexGetText(self,Text,RegexText,Index):
returnTxt=""
Regex=re.search(RegexText, Text, re.M|re.I)
if Regex is None:
returnTxt=""
else:
returnTxt=Regex.group(Index)
return returnTxt
def get_RegexGetTextLine(self,Text,RegexText,Index):
returnTxt=[]
pattern = re.compile(RegexText)
ListRe=pattern.findall(Text)
if len(ListRe)<1:
return returnTxt
for value in ListRe:
returnTxt.append(value)
return returnTxt
def get_playlist(self,Text,headStr,endStr):
circuit=""
origin=Text.find(headStr)
if origin>8:
end=Text.find(endStr,origin)
circuit=Text[origin:end]
return circuit
def removeHtml(self,txt):
soup = re.compile(r'<[^>]+>',re.S)
txt =soup.sub('', txt)
return txt.replace("&nbsp;"," ")
def get_webReadFile(self,urlStr):
headers = {
'Referer':urlStr,
'User-Agent': 'Mozilla/5.0 (Windows NT 5.1) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/49.0.2623.112 Safari/537.36',
'Host': 'www.ikmjw.com'
}
req = urllib.request.Request(url=urlStr, headers=headers)
html = urllib.request.urlopen(req).read().decode('utf-8')
return html
def get_list(self,html):
result={}
jRoot = json.loads(html)
if jRoot['code']!=0:
return result
jo = jRoot['data']
if len(jo)<1:
return result
vodList = jo['data']
if len(vodList)<1:
return result
videos=[]
img='_'
artist='_'
for vod in vodList:
if vod['type']!='lvideo':
continue
data=vod['data']
display=data['display']
title =display['name']
if len(title)==0:
continue
episode_link=display.get('episode_link')
asc_link=episode_link.get('asc_link')
KeyName='album_id'
if asc_link is None:
asc_link=episode_link.get('desc_link')
KeyName='album_id'
id=asc_link[0].get('album_id')
sslocal=asc_link[0]['scheme_url']
if sslocal!=None and sslocal.find('sslocal:')<0:
continue
video_cover_info=display.get('video_cover_info')
img=video_cover_info['url'] if video_cover_info is not None else '_'
try:
artist=display['actor']
except Exception:
artist=''
remarks=display['rating']
vod_id="{0}###{1}###{2}###{3}".format(title,id,artist,img)
videos.append({
"vod_id":vod_id,
"vod_name":title,
"vod_pic":img,
"vod_remarks":remarks
})
return videos
def get_list_user(self,html):
result={}
jRoot = json.loads(html)
if jRoot['code']!=0:
return result
jo = jRoot['data']
if len(jo)<1:
return result
vodList = jo['data']
if len(vodList)<1:
return result
videos=[]
img='_'
artist='_'
for vod in vodList:
if vod['type']!='user':
continue
data=vod['data']
img=data['avatar']
title =data['name']
log_pb=json.loads(data.get('log_pb'))
user_auth_info=json.loads(data.get('user_auth_info'))
remarks=user_auth_info['auth_info']
id=log_pb.get('search_result_id')
vod_id="{0}###{1}###{2}###{3}###{4}".format(title,id,artist,img,'user')
videos.append({
"vod_id":vod_id,
"vod_name":title,
"vod_pic":img,
"vod_remarks":remarks
})
return videos
def get_list_videoGroup_json(self,jsonTxt):
result={}
jRoot = json.loads(jsonTxt)
if jRoot['code']!=200:
return result
jo = jRoot['data']
vodList = jo['albumList']
if len(vodList)<1:
return result
videos=[]
img='_'
artist='_'
for vod in vodList:
url =vod['albumId']
title =vod['title']
imgList =vod.get('coverList')
if len(imgList)>0:
img=imgList[0]['url']
remarks=vod['subTitle']
artistList=vod.get('actorList')
if artistList is not None:
artistList=artistList if len(artistList)<5 else artistList[0:4]
artist='/'.join(artistList)
if len(title)==0:
continue
#标题###地址###演员###封面
vod_id="{0}###{1}###{2}###{3}".format(title,url,artist,img)
videos.append({
"vod_id":vod_id,
"vod_name":title,
"vod_pic":img,
"vod_remarks":remarks
})
return videos
def get_list_videoGroup_follow_json(self,jsonTxt):
videos=[]
jRoot = json.loads(jsonTxt)
if jRoot['code']!=0:
return videos
jo = jRoot['data']
vodList=jo['data']
if len(vodList)<1:
return videos
img='_'
artist=''
for vod in vodList:
url =vod.get('user_id')
title =vod['name']
img =vod.get('avatar_url')
remarks=vod['description']
artistList=vod.get('actorList')
artist=title
if len(title)==0:
continue
#标题###地址###演员###封面
vod_id="{0}###{1}###{2}###{3}###{4}".format(title,url,artist,img,'user')
videos.append({
"vod_id":vod_id,
"vod_name":title,
"vod_pic":img,
"vod_remarks":remarks
})
return videos
def get_lineList(self,Txt,mark,after):
circuit=[]
origin=Txt.find(mark)
while origin>8:
end=Txt.find(after,origin)
circuit.append(Txt[origin:end])
origin=Txt.find(mark,end)
return circuit
def get_EpisodesList(self,jsonList):
vodItems=[]
for value in jsonList:
vodItems.append(value['title']+"$"+'https://www.ixigua.com/{0}?logTag=55abe18cfb733871bb04'.format(value['episodeId']))
return vodItems
config = {
"player": {},
"filter": {}
}
header = {
"Cookie":"s_v_web_id=verify_lev3h43l_rrTPrFDG_ztWQ_4ugg_8WBA_yGVYsXlVyoBh; passport_csrf_token=80e0efe90bc8bd6681a896dd90cd08cc; passport_csrf_token_default=80e0efe90bc8bd6681a896dd90cd08cc; __ac_nonce=0643361890096533c765; __ac_signature=_02B4Z6wo00f01JPVVrAAAIDBcisHPfWA66CT91IAAEDK9840CE-PheNOCgA4VtrFG0-K.KkLmAR5KsI-Xx-6dBXxz.ABWU2OpEd22kF7biwGaVmGR7an4S1heLEU9xpv0ObRSHFHDslR7uL8fb; support_webp=true; support_avif=false; MONITOR_WEB_ID=45c3b6ab-7ad4-4805-b971-5962d1d6909a; ttwid=1%7CCueNR-HU9tGVF30WaiFCjXDxh0FUXoXsZr-cIb9Dogg%7C1681089268%7Cf0eeaa2016a602a277055494954f083e9f7fa8121c5dd1162db9195932fa167b; odin_tt=386a42a5740f9859d4670373fc8c70cf320ea5b227aed04bcc53fde26c233e8c952a8b0ba5f80fd3d46f9663fa595d8c; sid_guard=842b56710f55021912487890e7d5bef3%7C1681089337%7C3024001%7CMon%2C+15-May-2023+01%3A15%3A38+GMT; uid_tt=b7eb5b73cd72bed6d3c2e1e1e8aaa9f3; uid_tt_ss=b7eb5b73cd72bed6d3c2e1e1e8aaa9f3; sid_tt=842b56710f55021912487890e7d5bef3; sessionid=842b56710f55021912487890e7d5bef3; sessionid_ss=842b56710f55021912487890e7d5bef3; sid_ucp_v1=1.0.0-KGQ2YzBlMDFiMzIyMjY0YTIwMDg2MjZmZGQzMTE5MmFlYTYzY2EwMTMKFQjL2cnx9AIQucbNoQYYGCAMOAhABRoCaGwiIDg0MmI1NjcxMGY1NTAyMTkxMjQ4Nzg5MGU3ZDViZWYz; ssid_ucp_v1=1.0.0-KGQ2YzBlMDFiMzIyMjY0YTIwMDg2MjZmZGQzMTE5MmFlYTYzY2EwMTMKFQjL2cnx9AIQucbNoQYYGCAMOAhABRoCaGwiIDg0MmI1NjcxMGY1NTAyMTkxMjQ4Nzg5MGU3ZDViZWYz; csrf_session_id=c58adecac1d20d91d8c61e72ce0c6fdb; ixigua-a-s=3; msToken=St3ptsHkwBjPgGvRWhZfVdhHO_K16vTizxxna17draCvt4ekz6DQXO6c2Ctrp6gOnn9_Abm83-a9URQp5rKb-JIPs4mQPn2fpKlQRY6jLDBWUdLYTePIAACU6cY2fk40; tt_scid=nN3WPItw72gnB5PDiGcHveirXDZ8oDl5n.ihKN583mmZhoe.uLhFpy3JOL8wrsQO0ed1",
"Referer": 'https://www.ixigua.com/cinema/filter/dianshiju/',
'User-Agent':'User-Agent: Mozilla%2F5.0+(Windows+NT+10.0%3B+WOW64)+AppleWebKit%2F537.36+(KHTML%2C+like+Gecko)+Chrome%2F63.0.3239.132+Safari%2F537.36',
'Host': 'www.ixigua.com',
'Accept': 'application/json, text/plain, */*',
'x-secsdk-csrf-token': '0001000000017b593ba6251b18bd7bce2753042917bb36e534867b9606317584c00b0ae836c61754314b7365128e',
'tt-anti-token': 'oDr7A3PDDFq4pWzk-707faf92a9e3040f5c6ed4284d53b05b7091221852c0e9d32bca9fcfe5035225',
'content-type': 'application/json'
}
def localProxy(self,param):
return [200, "video/MP2T", action, ""]