import './util-ym.js'; import cheerio from 'assets://js/lib/cheerio.min.js'; import 'assets://js/lib/crypto-js.js' // import muban from 'https://gitcode.net/qq_32394351/dr_py/-/raw/master/js/模板.js'; // const key = 'drpy_zbk'; // eval(req('http://192.168.1.124:5705/libs/es6py.js').content); function init_test() { console.log("init_test_start"); console.log(RKEY); console.log(JSON.stringify(rule)); // clearItem(RULE_CK); // console.log(JSON.stringify(rule)); // let aa = base64Encode('编码测试一下') // log(aa); // let bb = base64Decode(aa); // log('bb:' + bb); // console.log(request('https://www.baidu.com',{withHeaders:true})); // console.log(request('https://www.baidu.com/favicon.ico', { toBase64: true })); // require('http://192.168.10.99:5705/txt/pluto/drT.js'); // console.log(typeof(drT)); // console.log(drT.renderText('{{fl.cate}},hi, {{fl}}哈哈.{{fl}}',{sort: 1,cate:'movie'},'fl')); console.log("init_test_end"); } let rule = {}; /** 已知问题记录 * 1.影魔的jinjia2引擎不支持 {{fl}}对象直接渲染 * Array.prototype.append = Array.prototype.push; 这种js执行后有毛病,for in 循环列表会把属性给打印出来 * 2.import es6py.js但是里面的函数没有被装载进来.比如drpy规则报错setResult2 is undefiend * 3.无法重复导入cheerio(怎么解决drpy和parseTag里都需要导入cheerio的问题) 无法在副文件导入cheerio (现在是全部放在drpy一个文件里了,凑合解决?) * 4.有个错误不知道哪儿来的 executeScript: com.quickjs.JSObject$Undefined cannot be cast to java.lang.String 在 点击选集播放打印init_test_end后面打印 * 5.需要实现 stringify 函数,比起JSON.stringify函数,它会原封不动保留中文不会编码unicode * todo: jsp:{pdfa,pdfh,pd},json:{pdfa,pdfh,pd},jq:{pdfa,pdfh,pd} * * 电脑看日志调试 adb tcpip 5555 adb connect 192.168.10.192 adb devices -l adb logcat -c adb logcat | grep -i QuickJS * **/ /*** 以下是内置变量和解析方法 **/ const MOBILE_UA = 'Mozilla/5.0 (Linux; Android 11; M2007J3SC Build/RKQ1.200826.002; wv) AppleWebKit/537.36 (KHTML, like Gecko) Version/4.0 Chrome/77.0.3865.120 MQQBrowser/6.2 TBS/045714 Mobile Safari/537.36'; const PC_UA = 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/95.0.4638.54 Safari/537.36'; const UA = 'Mozilla/5.0'; const UC_UA = 'Mozilla/5.0 (Linux; U; Android 9; zh-CN; MI 9 Build/PKQ1.181121.001) AppleWebKit/537.36 (KHTML, like Gecko) Version/4.0 Chrome/57.0.2987.108 UCBrowser/12.5.5.1035 Mobile Safari/537.36'; const IOS_UA = 'Mozilla/5.0 (iPhone; CPU iPhone OS 13_2_3 like Mac OS X) AppleWebKit/605.1.15 (KHTML, like Gecko) Version/13.0.3 Mobile/15E148 Safari/604.1'; const RULE_CK = 'cookie'; // 源cookie的key值 // const KEY = typeof(key)!=='undefined'&&key?key:'drpy_' + (rule.title || rule.host); // 源的唯一标识 const CATE_EXCLUDE = '首页|留言|APP|下载|资讯|新闻|动态'; const TAB_EXCLUDE = '猜你|喜欢|APP|下载|剧情|热播'; const OCR_RETRY = 3;//ocr验证重试次数 // const OCR_API = 'http://dm.mudery.com:10000';//ocr在线识别接口 // const OCR_API = 'http://192.168.3.239:5705/parse/ocr';//ocr在线识别接口 const OCR_API = 'http://cms.nokia.press/parse/ocr';//ocr在线识别接口 if (typeof (MY_URL) === 'undefined') { var MY_URL; // 全局注入变量,pd函数需要 } var RKEY; // 源的唯一标识 var fetch; var print; var log; var rule_fetch_params; var fetch_params; // 每个位置单独的 var oheaders; var _pdfh; var _pdfa; var _pd; // const DOM_CHECK_ATTR = ['url', 'src', 'href', 'data-original', 'data-src']; const DOM_CHECK_ATTR = /(url|src|href|data-original|data-src)$/; const SELECT_REGEX = /:eq|:lt|:gt|#/g; const SELECT_REGEX_A = /:eq|:lt|:gt/g; function setResult(d) { if (!Array.isArray(d)) { return [] } VODS = []; // print(d); d.forEach(function (it) { let obj = { vod_id: it.url || '', vod_name: it.title || '', vod_remarks: it.desc || '', vod_content: it.content || '', vod_pic: it.pic_url || it.img || '', }; let keys = Object.keys(it); if (keys.includes('tname')) { obj.type_name = it.tname || ''; } if (keys.includes('tid')) { obj.type_id = it.tid || ''; } if (keys.includes('year')) { obj.vod_year = it.year || ''; } if (keys.includes('actor')) { obj.vod_actor = it.actor || ''; } if (keys.includes('director')) { obj.vod_director = it.director || ''; } if (keys.includes('area')) { obj.vod_area = it.area || ''; } VODS.push(obj); }); return VODS } function setResult2(res) { VODS = res.list || []; return VODS } function setHomeResult(res) { if (!res || typeof (res) !== 'object') { return [] } return setResult(res.list); } // 猫了个咪 function rc(js) { if (js === 'maomi_aes.js') { var a = CryptoJS.enc.Utf8.parse("625222f9149e961d"); var t = CryptoJS.enc.Utf8.parse("5efdtf6060e2o330"); return { De: function (word) { word = CryptoJS.enc.Hex.parse(word) return CryptoJS.AES.decrypt(CryptoJS.enc.Base64.stringify(word), a, { iv: t, mode: CryptoJS.mode.CBC, padding: CryptoJS.pad.Pkcs7 }).toString(CryptoJS.enc.Utf8) }, En: function (word) { // print(a); // print(word); var Encrypted = CryptoJS.AES.encrypt(word, a, { iv: t, mode: CryptoJS.mode.CBC, padding: CryptoJS.pad.Pkcs7 }); return Encrypted.ciphertext.toString(); } }; } return {}; } // 千万不要用for in 推荐 forEach (for in 会打乱顺序) //猫函数 function maoss(jxurl, ref, key) { eval(getCryptoJS()); try { var getVideoInfo = function (text) { return CryptoJS.AES.decrypt(text, key, { iv: iv, padding: CryptoJS.pad.Pkcs7 }).toString(CryptoJS.enc.Utf8); }; var token_key = key == undefined ? 'dvyYRQlnPRCMdQSe' : key; if (ref) { var html = request(jxurl, { headers: { 'Referer': ref } }); } else { var html = request(jxurl); } // print(html); if (html.indexOf('&btwaf=') != -1) { html = request(jxurl + '&btwaf' + html.match(/&btwaf(.*?)"/)[1], { headers: { 'Referer': ref } }) } var token_iv = html.split('_token = "')[1].split('"')[0]; var key = CryptoJS.enc.Utf8.parse(token_key); var iv = CryptoJS.enc.Utf8.parse(token_iv); // log("iv:"+iv); // log(html); // print(key); // print(iv); eval(html.match(/var config = {[\s\S]*?}/)[0] + ''); // config.url = config.url.replace(/,/g,''); // print(config.url); if (!config.url.startsWith('http')) { //config.url = decodeURIComponent(AES(config.url, key, iv)); config.url = CryptoJS.AES.decrypt(config.url, key, { iv: iv, padding: CryptoJS.pad.Pkcs7 }).toString(CryptoJS.enc.Utf8) } return config.url; } catch (e) { return ''; } } let VODS = [];// 一级或者搜索需要的数据列表 let VOD = {};// 二级的单个数据 /** * 重写pd方法-增加自动urljoin(没法重写,改个名继续骗) * @param html * @param parse * @param uri * @returns {*} */ function pD(html, parse, uri) { let ret = pdfh(html, parse); if (typeof (uri) === 'undefined' || !uri) { uri = ''; } if (DOM_CHECK_ATTR.test(parse)) { if (/http/.test(ret)) { ret = ret.substr(ret.indexOf('http')); } else { ret = urljoin(MY_URL, ret) } } // MY_URL = getItem('MY_URL',MY_URL); // console.log(`规则${RKEY}打印MY_URL:${MY_URL},uri:${uri}`); return ret } const parseTags = { jsp: { pdfh: pdfh, pdfa: pdfa, pd: pD, }, json: { pdfh(html, parse) { if (!parse || !parse.trim()) { return ''; } if (typeof (html) === 'string') { html = JSON.parse(html); } parse = parse.trim(); if (!parse.startsWith('$.')) { parse = '$.' + parse; } parse = parse.split('||'); for (let ps of parse) { let ret = cheerio.jp(ps, html); if (Array.isArray(ret)) { ret = ret[0] || ''; } else { ret = ret || '' } if (ret && typeof (ret) !== 'string') { ret = ret.toString(); } if (ret) { return ret } } return ''; }, pdfa(html, parse) { if (!parse || !parse.trim()) { return ''; } if (typeof (html) === 'string') { html = JSON.parse(html); } parse = parse.trim() if (!parse.startsWith('$.')) { parse = '$.' + parse; } let ret = cheerio.jp(parse, html); if (Array.isArray(ret) && Array.isArray(ret[0]) && ret.length === 1) { return ret[0] || [] } return ret || [] }, pd(html, parse) { let ret = parseTags.json.pdfh(html, parse); if (ret) { return urljoin(MY_URL, ret); } return ret }, }, jq: { pdfh: pdfh, pdfa: pdfa, pd(html, parse, uri) { return parseTags.jq.pdfh(html, parse, MY_URL); }, }, getParse(p0) {//非js开头的情况自动获取解析标签 if (p0.startsWith('jsp:')) { return this.jsp } else if (p0.startsWith('json:')) { return this.json } else if (p0.startsWith('jq:')) { return this.jq } else { return this.jq } } }; const stringify = JSON.stringify; const jsp = parseTags.jsp; /*** 后台需要实现的java方法并注入到js中 ***/ /** * 读取本地文件->应用程序目录 * @param filePath * @returns {string} */ function readFile(filePath) { filePath = filePath || './uri.min.js'; var fd = os.open(filePath); var buffer = new ArrayBuffer(1024); var len = os.read(fd, buffer, 0, 1024); console.log(len); let text = String.fromCharCode.apply(null, new Uint8Array(buffer)); console.log(text); return text } /** * 处理返回的json数据 * @param html * @returns {*} */ function dealJson(html) { try { return html.match(/[\w|\W|\s|\S]*?(\{[\w|\W|\s|\S]*\})/).group[1]; } catch (e) { } try { html = JSON.parse(html); } catch (e) { } // console.log(typeof(html)); return html; } /** * 验证码识别逻辑,需要java实现(js没有bytes类型,无法调用后端的传递图片二进制获取验证码文本的接口) * @type {{api: string, classification: (function(*=): string)}} */ var OcrApi = { api: OCR_API, classification: function (img) { // img是byte类型,这里不方便搞啊 let code = ''; try { let html = request(this.api, { data: { img: img }, headers: { 'User-Agent': PC_UA }, 'method': 'POST' }); html = JSON.parse(html); code = html.url || ''; } catch (e) { } return code } }; /** * 验证码识别,暂未实现 * @param url 验证码图片链接 * @returns {string} 验证成功后的cookie */ function verifyCode(url) { let cnt = 0; let host = getHome(url); let cookie = ''; while (cnt < OCR_RETRY) { try { // let obj = {headers:headers,timeout:timeout}; let yzm_url = `${host}/index.php/verify/index.html`; console.log(`验证码链接:${yzm_url}`); let hhtml = request(yzm_url, { withHeaders: true, toBase64: true }); let json = JSON.parse(hhtml); if (!cookie) { cookie = json['set-cookie'] ? json['set-cookie'].split(';')[0] : ''; } // console.log(hhtml); console.log('cookie:' + cookie); let img = json.body; // console.log(img); let code = OcrApi.classification(img); console.log(`第${cnt + 1}次验证码识别结果:${code}`); let submit_url = `${host}/index.php/ajax/verify_check?type=search&verify=${code}`; console.log(submit_url); let html = request(submit_url, { headers: { Cookie: cookie, 'User-Agent': MOBILE_UA }, 'method': 'POST' }); // console.log(html); html = JSON.parse(html); if (html.msg === 'ok') { console.log(`第${cnt + 1}次验证码提交成功`); return cookie // 需要返回cookie } else if (html.msg !== 'ok' && cnt + 1 >= OCR_RETRY) { cookie = ''; // 需要清空返回cookie } } catch (e) { console.log(`第${cnt + 1}次验证码提交失败:${e.message}`); if (cnt + 1 >= OCR_RETRY) { cookie = ''; } } cnt += 1 } return cookie } /** * 存在数据库配置表里, key字段对应值value,没有就新增,有就更新,调用此方法会清除key对应的内存缓存 * @param k 键 * @param v 值 */ function setItem(k, v) { local.set(RKEY, k, v); console.log(`规则${RKEY}设置${k} => ${v}`) } /** * 获取数据库配置表对应的key字段的value,没有这个key就返回value默认传参.需要有缓存,第一次获取后会存在内存里 * @param k 键 * @param v 值 * @returns {*} */ function getItem(k, v) { return local.get(RKEY, k) || v; } /** * 删除数据库key对应的一条数据,并清除此key对应的内存缓存 * @param k */ function clearItem(k) { local.delete(RKEY, k); } /*** js自封装的方法 ***/ /** * 获取链接的host(带http协议的完整链接) * @param url 任意一个正常完整的Url,自动提取根 * @returns {string} */ function getHome(url) { if (!url) { return '' } let tmp = url.split('//'); url = tmp[0] + '//' + tmp[1].split('/')[0]; try { url = decodeURIComponent(url); } catch (e) { } return url } /** * get参数编译链接,类似python params字典自动拼接 * @param url 访问链接 * @param obj 参数字典 * @returns {*} */ function buildUrl(url, obj) { obj = obj || {}; if (url.indexOf('?') < 0) { url += '?' } let param_list = []; let keys = Object.keys(obj); keys.forEach(it => { param_list.push(it + '=' + obj[it]) }); let prs = param_list.join('&'); if (keys.length > 0 && !url.endsWith('?')) { url += '&' } url += prs; return url } /** * 远程依赖执行函数 * @param url 远程js地址 */ function require(url) { eval(request(url)); } /** * 海阔网页请求函数完整封装 * @param url 请求链接 * @param obj 请求对象 {headers:{},method:'',timeout:5000,body:'',withHeaders:false} * @returns {string|string|DocumentFragment|*} */ function request(url, obj) { if (typeof (obj) === 'undefined' || !obj || obj === {}) { if (!fetch_params || !fetch_params.headers) { let headers = { 'User-Agent': MOBILE_UA, }; if (rule.headers) { Object.assign(headers, rule.headers); } fetch_params.headers = headers; } if (!fetch_params.headers.Referer) { fetch_params.headers.Referer = getHome(url) } obj = fetch_params; } else { let headers = obj.headers || {}; let keys = Object.keys(headers).map(it => it.toLowerCase()); if (!keys.includes('user-agent')) { headers['User-Agent'] = MOBILE_UA; } if (!keys.includes('referer')) { headers['Referer'] = getHome(url); } obj.headers = headers; } console.log(JSON.stringify(obj.headers)); if (typeof (obj.headers.body) != 'undefined' && obj.headers.body && typeof (obj.headers.body) === 'string') { let data = {}; obj.headers.body.split('&').forEach(it => { data[it.split('=')[0]] = it.split('=')[1] }); obj.data = data; delete obj.headers.body } if (!url) { return obj.withHeaders ? '{}' : '' } if (obj.toBase64) { // 返回base64,用于请求图片 obj.buffer = 2; delete obj.toBase64 } console.log('request:' + url); let res = req(url, obj); let html = res.content || ''; // console.log(html); if (obj.withHeaders) { let htmlWithHeaders = res.headers; htmlWithHeaders.body = html; return JSON.stringify(htmlWithHeaders); } else { return html } } fetch = request; print = function (data) { data = data || ''; if (typeof (data) !== 'string') { try { data = JSON.stringify(data); } catch (e) { console.log('print:' + e.message) } } console.log(data); } log = console.log; /** * 检查宝塔验证并自动跳过获取正确源码 * @param html 之前获取的html * @param url 之前的来源url * @param obj 来源obj * @returns {string|DocumentFragment|*} */ function checkHtml(html, url, obj) { if (/\?btwaf=/.test(html)) { let btwaf = html.match(/btwaf(.*?)"/)[1]; url = url.split('#')[0] + '?btwaf' + btwaf; html = request(url, obj); } return html } /** * 带一次宝塔验证的源码获取 * @param url 请求链接 * @param obj 请求参数 * @returns {string|DocumentFragment} */ function getCode(url, obj) { let html = request(url, obj); html = checkHtml(html, url, obj); return html } /** * 源rule专用的请求方法,自动注入cookie * @param url 请求链接 * @returns {string|DocumentFragment} */ function getHtml(url) { let obj = {}; if (rule.headers) { obj.headers = rule.headers; } let cookie = getItem(RULE_CK, ''); if (cookie) { if (obj.headers && !Object.keys(obj.headers).map(it => it.toLowerCase()).includes('cookie')) { obj.headers['Cookie'] = cookie; } else if (!obj.headers) { obj.headers = { Cookie: cookie }; } } let html = getCode(url, obj); return html } /** * 首页分类解析,筛选暂未实现 * @param homeObj 首页传参对象 * @returns {string} */ function homeParse(homeObj) { fetch_params = JSON.parse(JSON.stringify(rule_fetch_params)); let classes = []; if (homeObj.class_name && homeObj.class_url) { let names = homeObj.class_name.split('&'); let urls = homeObj.class_url.split('&'); let cnt = Math.min(names.length, urls.length); for (let i = 0; i < cnt; i++) { classes.push({ 'type_id': urls[i], 'type_name': names[i] }); } } if (homeObj.class_parse) { let p = homeObj.class_parse.split(';'); if (p.length >= 4) { try { let html = getHtml(homeObj.MY_URL); if (html) { homeHtmlCache = html; let list = pdfa(html, p[0]); if (list && list.length > 0) { list.forEach((it, idex) => { try { let name = pdfh(it, p[1]); if (homeObj.cate_exclude && (new RegExp(homeObj.cate_exclude).test(name))) { return; } let url = pdfh(it, p[2]); if (p[3]) { let exp = new RegExp(p[3]); url = url.match(exp)[1]; } classes.push({ 'type_id': url.trim(), 'type_name': name.trim() }); } catch (e) { console.log(`分类列表定位第${idex}个元素正常报错:${e.message}`); } }); } } } catch (e) { console.log(e.message); } } } // 排除分类 classes = classes.filter(it => !homeObj.cate_exclude || !(new RegExp(homeObj.cate_exclude).test(it.type_name))); let resp = { 'class': classes }; if (homeObj.filter) { resp.filters = homeObj.filter; } console.log(JSON.stringify(resp)); return JSON.stringify(resp); } /** * 首页推荐列表解析 * @param homeVodObj * @returns {string} */ function homeVodParse(homeVodObj) { fetch_params = JSON.parse(JSON.stringify(rule_fetch_params)); let d = []; MY_URL = homeVodObj.homeUrl; // setItem('MY_URL',MY_URL); console.log(MY_URL); let p = homeVodObj.推荐; if (!p || typeof (p) !== 'string') { return '{}' } p = p.trim(); if (p.startsWith('js:')) { const TYPE = 'home'; var input = MY_URL; const HOST = rule.host; eval(p.replace('js:', '')); d = VODS; } else { p = p.split(';'); if (!homeVodObj.double && p.length < 5) { return '{}' } else if (homeVodObj.double && p.length < 6) { return '{}' } let _ps = parseTags.getParse(p[0]); _pdfa = _ps.pdfa; _pdfh = _ps.pdfh; _pd = _ps.pd; let is_json = p[0].startsWith('json:'); p[0] = p[0].replace(/^(jsp:|json:|jq:)/, ''); // print(p[0]); let html = homeHtmlCache || getHtml(MY_URL); homeHtmlCache = undefined; if (is_json) { html = dealJson(html); } try { console.log('double:' + homeVodObj.double); if (homeVodObj.double) { let items = _pdfa(html, p[0]); // console.log(items.length); for (let item of items) { // console.log(p[1]); let items2 = _pdfa(item, p[1]); // console.log(items2.length); for (let item2 of items2) { try { let title = _pdfh(item2, p[2]); let img = ''; try { img = _pd(item2, p[3]) } catch (e) { } let desc = _pdfh(item2, p[4]); let links = []; for (let p5 of p[5].split('+')) { let link = !homeVodObj.detailUrl ? _pd(item2, p5, MY_URL) : _pdfh(item2, p5); links.push(link); } let vod = { vod_name: title, vod_pic: img, vod_remarks: desc, vod_id: links.join('$') }; // print(vod); d.push(vod); } catch (e) { console.log('首页列表处理发生错误:' + e.message); } } } } else { let items = _pdfa(html, p[0]); for (let item of items) { try { let title = _pdfh(item, p[1]); let img = ''; try { img = _pd(item, p[2], MY_URL); } catch (e) { } let desc = _pdfh(item, p[3]); let links = []; for (let p5 of p[4].split('+')) { let link = !homeVodObj.detailUrl ? _pd(item, p5, MY_URL) : _pdfh(item, p5); links.push(link); } let vod = { vod_name: title, vod_pic: img, vod_remarks: desc, vod_id: links.join('$') }; d.push(vod); } catch (e) { } } } } catch (e) { } } // console.log(JSON.stringify(d)); return JSON.stringify({ list: d }) } /** * 一级分类页数据解析 * @param cateObj * @returns {string} */ function categoryParse(cateObj) { fetch_params = JSON.parse(JSON.stringify(rule_fetch_params)); let p = cateObj.一级; if (!p || typeof (p) !== 'string') { return '{}' } let d = []; // let url = cateObj.url.replaceAll('fyclass', cateObj.tid).replaceAll('fypage', cateObj.pg); let url = cateObj.url.replaceAll('fyclass', cateObj.tid); if (rule.filter_url) { if (!/fyfilter/.test(url)) { if (!url.endsWith('&') && !rule.filter_url.startsWith('&')) { url += '&' } url += rule.filter_url; } else { url = url.replace('fyfilter', rule.filter_url); } // console.log('filter:'+cateObj.filter); let fl = cateObj.filter ? cateObj.extend : {}; let new_url; new_url = cheerio.jinja2(url, { fl: fl }); // if (/object Object/.test(new_url)) { // new_url = drT.renderText(url, fl); // } url = new_url; } if (/fypage/.test(url)) { if (url.includes('(') && url.includes(')')) { let url_rep = url.match(/.*?\((.*)\)/)[1]; // console.log(url_rep); let cnt_page = url_rep.replaceAll('fypage', cateObj.pg); // console.log(cnt_page); let cnt_pg = eval(cnt_page); // console.log(cnt_pg); url = url.replaceAll(url_rep, cnt_pg).replaceAll('(', '').replaceAll(')', ''); } else { url = url.replaceAll('fypage', cateObj.pg); } } if (cateObj.pg === 1 && url.includes('[') && url.includes(']')) { url = url.split('[')[1].split(']')[0]; } MY_URL = url; // setItem('MY_URL',MY_URL); console.log(MY_URL); p = p.trim(); const MY_CATE = cateObj.tid; if (p.startsWith('js:')) { var MY_FL = cateObj.extend; const TYPE = 'cate'; var input = MY_URL; const MY_PAGE = cateObj.pg; var desc = ''; eval(p.trim().replace('js:', '')); d = VODS; } else { p = p.split(';'); if (p.length < 5) { return '{}' } let _ps = parseTags.getParse(p[0]); _pdfa = _ps.pdfa; _pdfh = _ps.pdfh; _pd = _ps.pd; let is_json = p[0].startsWith('json:'); p[0] = p[0].replace(/^(jsp:|json:|jq:)/, ''); try { let html = getHtml(MY_URL); if (html) { if (is_json) { html = dealJson(html); } let list = _pdfa(html, p[0]); list.forEach(it => { let links = p[4].split('+').map(p4 => { return !rule.detailUrl ? _pd(it, p4, MY_URL) : _pdfh(it, p4); }); let link = links.join('$'); let vod_id = rule.detailUrl ? MY_CATE + '$' + link : link; d.push({ 'vod_id': vod_id, 'vod_name': _pdfh(it, p[1]).replace(/\n|\t/g, '').trim(), 'vod_pic': _pd(it, p[2], MY_URL), 'vod_remarks': _pdfh(it, p[3]).replace(/\n|\t/g, '').trim(), }); }); } } catch (e) { console.log(e.message); } } // print(d); return d.length < 1 ? '{}' : JSON.stringify({ 'page': parseInt(cateObj.pg), 'pagecount': 999, 'limit': 20, 'total': 999, 'list': d, }); } /** * 搜索列表数据解析 * @param searchObj * @returns {string} */ function searchParse(searchObj) { fetch_params = JSON.parse(JSON.stringify(rule_fetch_params)); let d = []; if (!searchObj.searchUrl) { return '{}' } let p = searchObj.搜索 === '*' && rule.一级 ? rule.一级 : searchObj.搜索; if (!p || typeof (p) !== 'string') { return '{}' } p = p.trim(); let url = searchObj.searchUrl.replaceAll('**', searchObj.wd).replaceAll('fypage', searchObj.pg); MY_URL = url; console.log(MY_URL); // setItem('MY_URL',MY_URL); if (p.startsWith('js:')) { const TYPE = 'search'; const MY_PAGE = searchObj.pg; const KEY = searchObj.wd; var input = MY_URL; var detailUrl = rule.detailUrl || ''; eval(p.trim().replace('js:', '')); d = VODS; } else { p = p.split(';'); if (p.length < 5) { return '{}' } let _ps = parseTags.getParse(p[0]); _pdfa = _ps.pdfa; _pdfh = _ps.pdfh; _pd = _ps.pd; let is_json = p[0].startsWith('json:'); p[0] = p[0].replace(/^(jsp:|json:|jq:)/, ''); try { let html = getHtml(MY_URL); if (html) { if (/系统安全验证|输入验证码/.test(html)) { let cookie = verifyCode(MY_URL); if (cookie) { console.log(`本次成功过验证,cookie:${cookie}`); setItem(RULE_CK, cookie); } else { console.log(`本次自动过搜索验证失败,cookie:${cookie}`); } // obj.headers['Cookie'] = cookie; html = getHtml(MY_URL); } if (!html.includes(searchObj.wd)) { console.log('搜索结果源码未包含关键字,疑似搜索失败,正为您打印结果源码'); console.log(html); } if (is_json) { html = dealJson(html); } let list = _pdfa(html, p[0]); list.forEach(it => { let links = p[4].split('+').map(p4 => { return !rule.detailUrl ? _pd(it, p4, MY_URL) : _pdfh(it, p4) }); let link = links.join('$'); let ob = { 'vod_id': link, 'vod_name': _pdfh(it, p[1]).replace(/\n|\t/g, '').trim(), 'vod_pic': _pd(it, p[2], MY_URL), 'vod_remarks': _pdfh(it, p[3]).replace(/\n|\t/g, '').trim(), }; if (p.length > 5 && p[5]) { ob.vod_content = _pdfh(it, p[5]); } d.push(ob); }); } } catch (e) { return '{}' } } return JSON.stringify({ 'page': parseInt(searchObj.pg), 'pagecount': 10, 'limit': 20, 'total': 100, 'list': d, }); } /** * 二级详情页数据解析 * @param detailObj * @returns {string} */ function detailParse(detailObj) { fetch_params = JSON.parse(JSON.stringify(rule_fetch_params)); let vod = { vod_id: detailObj.orId, //"id", vod_name: "片名", vod_pic: "", type_name: "剧情", vod_year: "年份", vod_area: "地区", vod_remarks: "更新信息", vod_actor: "主演", vod_director: "导演", vod_content: "简介" }; let p = detailObj.二级; let url = detailObj.url; let detailUrl = detailObj.detailUrl; let fyclass = detailObj.fyclass; let tab_exclude = detailObj.tab_exclude; let html = detailObj.html || ''; MY_URL = url; console.log(MY_URL); // setItem('MY_URL',MY_URL); if (p === '*') { vod.vod_play_from = '道长在线'; vod.vod_remarks = detailUrl; vod.vod_actor = '没有二级,只有一级链接直接嗅探播放'; vod.vod_content = MY_URL; vod.vod_play_url = '嗅探播放$' + MY_URL; } else if (typeof (p) === 'string' && p.trim().startsWith('js:')) { const TYPE = 'detail'; var input = MY_URL; eval(p.trim().replace('js:', '')); vod = VOD; console.log(JSON.stringify(vod)); } else if (p && typeof (p) === 'object') { if (!html) { html = getHtml(MY_URL); } let _impJQP = true; let _ps; if (p.is_json) { _ps = parseTags.json; html = dealJson(html); _impJQP = false; } else if (p.is_jsp) { _ps = parseTags.jsp; } else if (p.is_jq) { _ps = parseTags.jq; } else { _ps = parseTags.jq; } if (_impJQP) { let c$ = cheerio.load(html); html = { rr: c$, ele: c$('html')[0] } } _pdfa = _ps.pdfa; _pdfh = _ps.pdfh; _pd = _ps.pd; if (p.title) { let p1 = p.title.split(';'); vod.vod_name = _pdfh(html, p1[0]).replace(/\n|\t/g, '').trim(); let type_name = p1.length > 1 ? _pdfh(html, p1[1]).replace(/\n|\t/g, '').replace(/ /g, '').trim() : ''; vod.type_name = type_name || vod.type_name; } if (p.desc) { try { let p1 = p.desc.split(';'); vod.vod_remarks = _pdfh(html, p1[0]).replace(/\n|\t/g, '').trim(); vod.vod_year = p1.length > 1 ? _pdfh(html, p1[1]).replace(/\n|\t/g, '').trim() : ''; vod.vod_area = p1.length > 2 ? _pdfh(html, p1[2]).replace(/\n|\t/g, '').trim() : ''; // vod.vod_actor = p1.length > 3 ? _pdfh(html, p1[3]).replaceAll('\n', ' ').trim():''; vod.vod_actor = p1.length > 3 ? _pdfh(html, p1[3]).replace(/\n|\t/g, '').trim() : ''; vod.vod_director = p1.length > 4 ? _pdfh(html, p1[4]).replace(/\n|\t/g, '').trim() : ''; } catch (e) { } } if (p.content) { try { let p1 = p.content.split(';'); vod.vod_content = _pdfh(html, p1[0]).replace(/\n|\t/g, '').trim(); } catch (e) { } } if (p.img) { try { let p1 = p.img.split(';'); vod.vod_pic = _pd(html, p1[0], MY_URL); } catch (e) { } } let vod_play_from = '$$$'; let playFrom = []; if (p.重定向 && p.重定向.startsWith('js:')) { html = eval(p.重定向.replace('js:', '')); if (_impJQP) { let c$ = cheerio.load(html); html = { rr: c$, ele: c$('html')[0] } } } // console.log(2); if (p.tabs) { let p_tab = p.tabs.split(';')[0]; console.log(p_tab); let vHeader = _pdfa(html, p_tab); console.log(vHeader.length); for (let v of vHeader) { let v_title = _pdfh(v, 'body&&Text'); console.log(v_title); if (tab_exclude && (new RegExp(tab_exclude)).test(v_title)) { continue; } playFrom.push(v_title); } console.log(JSON.stringify(playFrom)); } else { playFrom = ['道长在线'] } vod.vod_play_from = playFrom.join(vod_play_from); // console.log(3); let vod_play_url = '$$$'; let vod_tab_list = []; if (p.lists) { for (let i = 0; i < playFrom.length; i++) { let tab_name = playFrom[i]; let tab_ext = p.tabs.split(';').length > 1 ? p.tabs.split(';')[1] : ''; let p1 = p.lists.replaceAll('#idv', tab_name).replaceAll('#id', i); tab_ext = tab_ext.replaceAll('#idv', tab_name).replaceAll('#id', i); console.log(p1); // console.log(html); let vodList = []; try { vodList = _pdfa(html, p1); console.log('len(vodList):' + vodList.length); } catch (e) { // console.log(e.message); } let new_vod_list = []; let tabName = tab_ext ? _pdfh(html, tab_ext) : tab_name; console.log(tabName); // console.log('cheerio解析Text'); vodList.forEach(it => { // 请注意,这里要固定pdfh解析body&&Text,不需要下划线,没写错 // new_vod_list.push(pdfh(it,'body&&Text')+'$'+_pd(it,'a&&href',MY_URL)); // new_vod_list.push(cheerio.load(it).text() + '$' + _pd(it, 'a&&href', MY_URL)); new_vod_list.push(_pdfh(it, 'body&&Text') + '$' + _pd(it, 'a&&href', MY_URL)); }); let vlist = new_vod_list.join('#'); vod_tab_list.push(vlist); } } vod.vod_play_url = vod_tab_list.join(vod_play_url); } // print(vod); return JSON.stringify({ list: [vod] }) } /** * 选集播放点击事件解析 * @param playObj * @returns {string} */ function playParse(playObj) { fetch_params = JSON.parse(JSON.stringify(rule_fetch_params)); MY_URL = playObj.url; if (!/http/.test(MY_URL)) { try { MY_URL = base64Decode(MY_URL); } catch (e) { } } MY_URL = decodeURIComponent(MY_URL); var input = MY_URL;//注入给免嗅js let common_play = { parse: 1, url: input }; let lazy_play; if (!rule.play_parse || !rule.lazy) { lazy_play = common_play; } else if (rule.play_parse && rule.lazy && typeof (rule.lazy) === 'string') { try { let lazy_code = rule.lazy.replace('js:', '').trim(); print('开始执行js免嗅=>' + lazy_code); eval(lazy_code); lazy_play = typeof (input) === 'object' ? input : { parse: 1, jx: 1, url: input }; } catch (e) { print('js免嗅错误:' + e.message); lazy_play = common_play; } } else { lazy_play = common_play; } console.log(JSON.stringify(lazy_play)); return JSON.stringify(lazy_play); } /** * js源预处理特定返回对象中的函数 * @param ext */ function init(ext) { console.log('init'); try { // make shared jsContext happy if (typeof (globalThis.mubanJs) === 'undefined') { let mubanJs = request('https://gitcode.net/qq_32394351/dr_py/-/raw/master/js/模板.js', { 'User-Agent': MOBILE_UA }); mubanJs = mubanJs.replace('export default', '(function() {return muban;}()) // export default'); globalThis.mubanJs = mubanJs; } let muban = eval(globalThis.mubanJs); if (typeof ext == 'object') { rule = ext; if (rule.template) { rule = Object.assign(muban[rule.template], rule); } } else if (typeof ext == 'string') { if (ext.startsWith('http')) { let js = request(ext, { 'method': 'GET' }); if (js) { eval(js.replace('var rule', 'rule')); } } } else { eval(ext.replace('var rule', 'rule')); } /** 处理一下 rule规则关键字段没传递的情况 **/ let rule_cate_excludes = (rule.cate_exclude || '').split('|').filter(it => it.trim()); let rule_tab_excludes = (rule.tab_exclude || '').split('|').filter(it => it.trim()); rule_cate_excludes = rule_cate_excludes.concat(CATE_EXCLUDE.split('|').filter(it => it.trim())); rule_tab_excludes = rule_tab_excludes.concat(TAB_EXCLUDE.split('|').filter(it => it.trim())); rule.cate_exclude = rule_cate_excludes.join('|'); rule.tab_exclude = rule_tab_excludes.join('|'); rule.host = (rule.host || '').rstrip('/'); rule.url = rule.url || ''; rule.double = rule.double || false; rule.homeUrl = rule.homeUrl || ''; rule.detailUrl = rule.detailUrl || ''; rule.searchUrl = rule.searchUrl || ''; rule.homeUrl = rule.host && rule.homeUrl ? urljoin(rule.host, rule.homeUrl) : (rule.homeUrl || rule.host); rule.detailUrl = rule.host && rule.detailUrl ? urljoin(rule.host, rule.detailUrl) : rule.detailUrl; if (rule.url.includes('[') && rule.url.includes(']')) { let u1 = rule.url.split('[')[0] let u2 = rule.url.split('[')[1].split(']')[0] rule.url = rule.host && rule.url ? urljoin(rule.host, u1) + '[' + urljoin(rule.host, u2) + ']' : rule.url; } else { rule.url = rule.host && rule.url ? urljoin(rule.host, rule.url) : rule.url; } rule.searchUrl = rule.host && rule.searchUrl ? urljoin(rule.host, rule.searchUrl) : rule.searchUrl; rule.timeout = rule.timeout || 5000; rule.encoding = rule.编码 || rule.encoding || 'utf-8'; if (rule.headers && typeof (rule.headers) === 'object') { try { let header_keys = Object.keys(rule.headers); for (let k of header_keys) { if (k.toLowerCase() === 'user-agent') { let v = rule.headers[k]; console.log(v); if (['MOBILE_UA', 'PC_UA', 'UC_UA', 'IOS_UA', 'UA'].includes(v)) { rule.headers[k] = eval(v); } } } } catch (e) { console.log('处理headers发生错误:' + e.message); } } // print(rule.headers); rule_fetch_params = { 'headers': rule.headers || false, 'timeout': rule.timeout, 'encoding': rule.encoding }; oheaders = rule.headers || {}; RKEY = typeof (key) !== 'undefined' && key ? key : 'drpy_' + (rule.title || rule.host); init_test(); } catch (e) { console.log('init_test发生错误:' + e.message); } } let homeHtmlCache = undefined; /** * js源获取首页分类和筛选特定返回对象中的函数 * @param filter 筛选条件字典对象 * @returns {string} */ function home(filter) { console.log("home"); let homeObj = { filter: rule.filter || false, MY_URL: rule.homeUrl, class_name: rule.class_name || '', class_url: rule.class_url || '', class_parse: rule.class_parse || '', cate_exclude: rule.cate_exclude, }; return homeParse(homeObj); } /** * js源获取首页推荐数据列表特定返回对象中的函数 * @param params * @returns {string} */ function homeVod(params) { let homeVodObj = { 推荐: rule.推荐, double: rule.double, homeUrl: rule.homeUrl, detailUrl: rule.detailUrl }; return homeVodParse(homeVodObj) // return "{}"; } /** * js源获取分类页一级数据列表特定返回对象中的函数 * @param tid 分类id * @param pg 页数 * @param filter 当前选中的筛选条件 * @param extend 扩展 * @returns {string} */ function category(tid, pg, filter, extend) { let cateObj = { url: rule.url, 一级: rule.一级, tid: tid, pg: parseInt(pg), filter: filter, extend: extend }; // console.log(JSON.stringify(extend)); return categoryParse(cateObj) } /** * js源获取二级详情页数据特定返回对象中的函数 * @param vod_url 一级列表中的vod_id或者是带分类的自拼接 vod_id 如 fyclass$vod_id * @returns {string} */ function detail(vod_url) { let orId = vod_url; let fyclass = ''; if (vod_url.indexOf('$') > -1) { let tmp = vod_url.split('$'); fyclass = tmp[0]; vod_url = tmp[1]; } let detailUrl = vod_url; let url; if (!detailUrl.startsWith('http') && !detailUrl.includes('/')) { url = rule.detailUrl.replaceAll('fyid', detailUrl).replaceAll('fyclass', fyclass); } else if (detailUrl.includes('/')) { url = urljoin(rule.homeUrl, detailUrl); } else { url = detailUrl } let detailObj = { orId: orId, url: url, 二级: rule.二级, detailUrl: detailUrl, fyclass: fyclass, tab_exclude: rule.tab_exclude, } return detailParse(detailObj) } /** * js源选集按钮播放点击事件特定返回对象中的函数 * @param flag 线路名 * @param id 播放按钮的链接 * @param flags 全局配置的flags是否需要解析的标识列表 * @returns {string} */ function play(flag, id, flags) { let playObj = { url: id, flag: flag, flags: flags } return playParse(playObj); } /** * js源搜索返回的数据列表特定返回对象中的函数 * @param wd 搜索关键字 * @param quick 是否来自快速搜索 * @returns {string} */ function search(wd, quick) { let searchObj = { searchUrl: rule.searchUrl, 搜索: rule.搜索, wd: wd, //pg: pg, pg: 1, quick: quick, }; // console.log(JSON.stringify(searchObj)); return searchParse(searchObj) } function DRPY() {//导出函数 return { init: init, home: home, homeVod: homeVod, category: category, detail: detail, play: play, search: search, } } let pd = pD; // 导出函数对象 __JS_SPIDER__ = { init: init, home: home, homeVod: homeVod, category: category, detail: detail, play: play, search: search, DRPY: DRPY }