mirror of
https://github.com/qist/tvbox.git
synced 2025-02-02 10:14:50 +08:00
Delete lib directory
This commit is contained in:
parent
35873ec8bd
commit
f7721458fe
1
lib/cheerio.min.js
vendored
1
lib/cheerio.min.js
vendored
File diff suppressed because one or more lines are too long
6191
lib/crypto-js.js
6191
lib/crypto-js.js
File diff suppressed because it is too large
Load Diff
1
lib/dayjs.min.js
vendored
1
lib/dayjs.min.js
vendored
File diff suppressed because one or more lines are too long
189
lib/drT.js
189
lib/drT.js
@ -1,189 +0,0 @@
|
||||
// drT.js
|
||||
// 2022/09/30 write by hjdhnx
|
||||
// Licensed under the MIT license.
|
||||
|
||||
(function () {
|
||||
"use strict";
|
||||
|
||||
var drT = {
|
||||
name: "drT",
|
||||
version: "1.0.0",
|
||||
templateSettings: {
|
||||
evaluate: /\{\{([\s\S]+?(\}?)+)\}\}/g,
|
||||
interpolate: /\{\{([\s\S]+?)\}\}/g, // 变量渲染
|
||||
encode: /\{\{@([\s\S]+?)\}\}/g, // 变量自动url编码
|
||||
use: /\{\{#([\s\S]+?)\}\}/g,
|
||||
useParams: /(^|[^\w$])def(?:\.|\[[\'\"])([\w$\.]+)(?:[\'\"]\])?\s*\:\s*([\w$\.]+|\"[^\"]+\"|\'[^\']+\'|\{[^\}]+\})/g,
|
||||
define: /\{\{##\s*([\w\.$]+)\s*(\:|=)([\s\S]+?)#\}\}/g,
|
||||
defineParams:/^\s*([\w$]+):([\s\S]+)/,
|
||||
conditional: /\{\{\?(\?)?\s*([\s\S]*?)\s*\}\}/g, // ? if ?? else if ?? else
|
||||
iterate: /\{\{~\s*(?:\}\}|([\s\S]+?)\s*\:\s*([\w$]+)\s*(?:\:\s*([\w$]+))?\s*\}\})/g,
|
||||
varname: "fl",
|
||||
strip: true,
|
||||
append: true,
|
||||
selfcontained: false,
|
||||
doNotSkipEncoded: false
|
||||
},
|
||||
template: undefined, //fn, compile template
|
||||
compile: undefined, //fn, for express
|
||||
log: true
|
||||
}, _globals;
|
||||
|
||||
drT.encodeHTMLSource = function(doNotSkipEncoded) {
|
||||
var encodeHTMLRules = { "&": "&", "<": "<", ">": ">", '"': """, "'": "'", "/": "/" },
|
||||
matchHTML = doNotSkipEncoded ? /[&<>"'\/]/g : /&(?!#?\w+;)|<|>|"|'|\//g;
|
||||
return function(code) {
|
||||
return code ? code.toString().replace(matchHTML, function(m) {return encodeHTMLRules[m] || m;}) : "";
|
||||
};
|
||||
};
|
||||
|
||||
_globals = (function(){ return this || (0,eval)("this"); }());
|
||||
|
||||
/* istanbul ignore else */
|
||||
if (typeof module !== "undefined" && module.exports) {
|
||||
module.exports = drT;
|
||||
} else if (typeof define === "function" && define.amd) {
|
||||
define(function(){return drT;});
|
||||
} else {
|
||||
_globals.drT = drT;
|
||||
}
|
||||
|
||||
var startend = {
|
||||
append: { start: "'+(", end: ")+'", startencode: "'+encodeHTML(" },
|
||||
split: { start: "';out+=(", end: ");out+='", startencode: "';out+=encodeHTML(" }
|
||||
}, skip = /$^/;
|
||||
|
||||
function resolveDefs(c, block, def) {
|
||||
return ((typeof block === "string") ? block : block.toString())
|
||||
.replace(c.define || skip, function(m, code, assign, value) {
|
||||
if (code.indexOf("def.") === 0) {
|
||||
code = code.substring(4);
|
||||
}
|
||||
if (!(code in def)) {
|
||||
if (assign === ":") {
|
||||
if (c.defineParams) value.replace(c.defineParams, function(m, param, v) {
|
||||
def[code] = {arg: param, text: v};
|
||||
});
|
||||
if (!(code in def)) def[code]= value;
|
||||
} else {
|
||||
new Function("def", "def['"+code+"']=" + value)(def);
|
||||
}
|
||||
}
|
||||
return "";
|
||||
})
|
||||
.replace(c.use || skip, function(m, code) {
|
||||
if (c.useParams) code = code.replace(c.useParams, function(m, s, d, param) {
|
||||
if (def[d] && def[d].arg && param) {
|
||||
var rw = (d+":"+param).replace(/'|\\/g, "_");
|
||||
def.__exp = def.__exp || {};
|
||||
def.__exp[rw] = def[d].text.replace(new RegExp("(^|[^\\w$])" + def[d].arg + "([^\\w$])", "g"), "$1" + param + "$2");
|
||||
return s + "def.__exp['"+rw+"']";
|
||||
}
|
||||
});
|
||||
var v = new Function("def", "return " + code)(def);
|
||||
return v ? resolveDefs(c, v, def) : v;
|
||||
});
|
||||
}
|
||||
|
||||
function unescape(code) {
|
||||
return code.replace(/\\('|\\)/g, "$1").replace(/[\r\t\n]/g, " ");
|
||||
}
|
||||
|
||||
drT.template = function(tmpl, c, def) {
|
||||
c = c || drT.templateSettings;
|
||||
var cse = c.append ? startend.append : startend.split, needhtmlencode, sid = 0, indv,
|
||||
str = (c.use || c.define) ? resolveDefs(c, tmpl, def || {}) : tmpl;
|
||||
|
||||
// console.log(str);
|
||||
let beforeCode = '';
|
||||
if(str.match(c.interpolate || skip)){
|
||||
let inter_codes = str.match(c.interpolate || skip);
|
||||
let inter_dict = {};
|
||||
inter_codes.forEach(item=>{
|
||||
item.replace(c.interpolate || skip,function (m,code) {
|
||||
let varname = code.split('.')[0];
|
||||
if(!inter_dict.hasOwnProperty(varname)){
|
||||
let beginCode = `if(typeof(${varname})==='undefined'){${varname}={}}`;
|
||||
inter_dict[varname] = beginCode;
|
||||
}if(!inter_dict.hasOwnProperty(code)){
|
||||
let beginCode = `if(typeof(${code})==='undefined'){${code}=''};`;
|
||||
inter_dict[code] = beginCode;
|
||||
}
|
||||
});
|
||||
});
|
||||
let beginCode = Object.values(inter_dict).join('\n');
|
||||
// console.log(beginCode);
|
||||
beforeCode += beginCode;
|
||||
}
|
||||
str = beforeCode+("var out='" + (c.strip ? str.replace(/(^|\r|\n)\t* +| +\t*(\r|\n|$)/g," ")
|
||||
.replace(/\r|\n|\t|\/\*[\s\S]*?\*\//g,""): str)
|
||||
.replace(/'|\\/g, "\\$&")
|
||||
.replace(c.encode || skip, function(m, code) {
|
||||
needhtmlencode = true;
|
||||
return cse.startencode + unescape(code) + cse.end;
|
||||
})
|
||||
.replace(c.interpolate || skip, function(m, code) {
|
||||
let varname = code.split('.')[0];
|
||||
// console.log(varname === code);
|
||||
// console.log(`varname:${varname},code:${code}`);
|
||||
if(varname === code){
|
||||
let res = cse.start + `JSON.stringify(${unescape(code)})` + cse.end;
|
||||
// console.log(res);
|
||||
return res
|
||||
}
|
||||
return cse.start + unescape(code) + cse.end;
|
||||
})
|
||||
.replace(c.conditional || skip, function(m, elsecase, code) {
|
||||
return elsecase ?
|
||||
(code ? "';}else if(" + unescape(code) + "){out+='" : "';}else{out+='") :
|
||||
(code ? "';if(" + unescape(code) + "){out+='" : "';}out+='");
|
||||
})
|
||||
.replace(c.iterate || skip, function(m, iterate, vname, iname) {
|
||||
if (!iterate) return "';} } out+='";
|
||||
sid+=1; indv=iname || "i"+sid; iterate=unescape(iterate);
|
||||
return "';var arr"+sid+"="+iterate+";if(arr"+sid+"){var "+vname+","+indv+"=-1,l"+sid+"=arr"+sid+".length-1;while("+indv+"<l"+sid+"){"
|
||||
+vname+"=arr"+sid+"["+indv+"+=1];out+='";
|
||||
})
|
||||
.replace(c.evaluate || skip, function(m, code) {
|
||||
return "';" + unescape(code) + "out+='";
|
||||
})
|
||||
+ "';return out;")
|
||||
.replace(/\n/g, "\\n").replace(/\t/g, '\\t').replace(/\r/g, "\\r")
|
||||
.replace(/(\s|;|\}|^|\{)out\+='';/g, '$1').replace(/\+''/g, "");
|
||||
//.replace(/(\s|;|\}|^|\{)out\+=''\+/g,'$1out+=');
|
||||
|
||||
if (needhtmlencode) {
|
||||
// console.log('需要编码');
|
||||
// console.log(c.doNotSkipEncoded);
|
||||
if (!c.selfcontained && _globals && !_globals._encodeHTML) _globals._encodeHTML = drT.encodeHTMLSource(c.doNotSkipEncoded);
|
||||
str = "var encodeHTML = typeof _encodeHTML !== 'undefined' ? _encodeHTML : ("
|
||||
+ drT.encodeHTMLSource.toString() + "(" + (c.doNotSkipEncoded || '') + "));"
|
||||
+ str;
|
||||
// console.log(str);
|
||||
}else{
|
||||
// console.log('不需要编码');
|
||||
}
|
||||
// console.log(c.varname);
|
||||
// console.log(str);
|
||||
try {
|
||||
return new Function(c.varname, str);
|
||||
} catch (e) {
|
||||
/* istanbul ignore else */
|
||||
// console.log(e.message);
|
||||
if (typeof console !== "undefined") console.log("Could not create a template function: " + str);
|
||||
throw e;
|
||||
}
|
||||
};
|
||||
|
||||
drT.compile = function(tmpl, def) {
|
||||
return drT.template(tmpl, null, def);
|
||||
};
|
||||
drT.renderText = function (tmpl,dict,varname){
|
||||
varname = varname||'';
|
||||
if(varname){
|
||||
drT.templateSettings.varname = varname;
|
||||
}
|
||||
dict = dict||{};
|
||||
return drT.compile(tmpl)(dict);
|
||||
};
|
||||
}());
|
1741
lib/drpy.js
1741
lib/drpy.js
File diff suppressed because it is too large
Load Diff
1
lib/drpy.min.js
vendored
1
lib/drpy.min.js
vendored
File diff suppressed because one or more lines are too long
@ -1,4 +0,0 @@
|
||||
import './util.ym.js'
|
||||
import dr from './drpy.min.js'
|
||||
|
||||
__JS_SPIDER__ = dr.DRPY()
|
5
lib/underscore-esm-min.js
vendored
5
lib/underscore-esm-min.js
vendored
File diff suppressed because one or more lines are too long
1
lib/uri.min.js
vendored
1
lib/uri.min.js
vendored
File diff suppressed because one or more lines are too long
300
lib/util.js
300
lib/util.js
@ -1,300 +0,0 @@
|
||||
import 'assets://js/lib/uri.min.js'
|
||||
import cheerio from 'assets://js/lib/cheerio.min.js';
|
||||
import 'assets://js/lib/crypto-js.js'
|
||||
import 'assets://js/lib/dayjs.min.js'
|
||||
import _ from 'assets://js/lib/underscore-esm-min.js'
|
||||
|
||||
var charStr = 'abacdefghjklmnopqrstuvwxyzABCDEFGHJKLMNOPQRSTUVWXYZ0123456789';
|
||||
export function randIndex(min, max, i) {
|
||||
let index = Math.floor(Math.random() * (max - min + 1) + min),
|
||||
numStart = charStr.length - 10;
|
||||
if (i == 0 && index >= numStart) {
|
||||
index = randIndex(min, max, i);
|
||||
}
|
||||
return index;
|
||||
}
|
||||
|
||||
export function randomStr(len) {
|
||||
let min = 0, max = charStr.length - 1, _str = '';
|
||||
len = len || 15;
|
||||
for (var i = 0, index; i < len; i++) {
|
||||
index = randIndex(min, max, i);
|
||||
_str += charStr[index];
|
||||
}
|
||||
return _str;
|
||||
}
|
||||
if (typeof Object.assign != 'function') {
|
||||
Object.assign = function () {
|
||||
var target = arguments[0];
|
||||
for (var i = 1; i < arguments.length; i++) {
|
||||
var source = arguments[i];
|
||||
for (var key in source) {
|
||||
if (Object.prototype.hasOwnProperty.call(source, key)) {
|
||||
target[key] = source[key];
|
||||
}
|
||||
}
|
||||
}
|
||||
return target;
|
||||
};
|
||||
}
|
||||
if (!String.prototype.includes) {
|
||||
String.prototype.includes = function (search, start) {
|
||||
if (typeof start !== 'number') {
|
||||
start = 0;
|
||||
}
|
||||
|
||||
if (start + search.length > this.length) {
|
||||
return false;
|
||||
} else {
|
||||
return this.indexOf(search, start) !== -1;
|
||||
}
|
||||
};
|
||||
}
|
||||
if (!Array.prototype.includes) {
|
||||
Object.defineProperty(Array.prototype, 'includes', {
|
||||
value: function (searchElement, fromIndex) {
|
||||
|
||||
if (this == null) {//this是空或者未定义,抛出错误
|
||||
throw new TypeError('"this" is null or not defined');
|
||||
}
|
||||
|
||||
var o = Object(this);//将this转变成对象
|
||||
var len = o.length >>> 0;//无符号右移0位,获取对象length属性,如果未定义就会变成0
|
||||
|
||||
if (len === 0) {//length为0直接返回false未找到目标值
|
||||
return false;
|
||||
}
|
||||
|
||||
var n = fromIndex | 0;//查找起始索引
|
||||
var k = Math.max(n >= 0 ? n : len - Math.abs(n), 0);//计算正确起始索引,因为有可能是负值
|
||||
|
||||
while (k < len) {//从起始索引处开始循环
|
||||
if (o[k] === searchElement) {//如果某一位置与寻找目标相等,返回true,找到了
|
||||
return true;
|
||||
}
|
||||
k++;
|
||||
}
|
||||
return false;//未找到,返回false
|
||||
}
|
||||
});
|
||||
}
|
||||
if (typeof String.prototype.startsWith != 'function') {
|
||||
String.prototype.startsWith = function (prefix) {
|
||||
return this.slice(0, prefix.length) === prefix;
|
||||
};
|
||||
}
|
||||
if (typeof String.prototype.endsWith != 'function') {
|
||||
String.prototype.endsWith = function (suffix) {
|
||||
return this.indexOf(suffix, this.length - suffix.length) !== -1;
|
||||
};
|
||||
}
|
||||
Object.prototype.myValues = function (obj) {
|
||||
if (obj == null) {
|
||||
throw new TypeError("Cannot convert undefined or null to object");
|
||||
}
|
||||
var res = []
|
||||
for (var k in obj) {
|
||||
if (obj.hasOwnProperty(k)) {//需判断是否是本身的属性
|
||||
res.push(obj[k]);
|
||||
}
|
||||
}
|
||||
return res;
|
||||
}
|
||||
if (typeof Object.prototype.values != 'function') {
|
||||
Object.prototype.values = function (obj) {
|
||||
if (obj == null) {
|
||||
throw new TypeError("Cannot convert undefined or null to object");
|
||||
}
|
||||
var res = []
|
||||
for (var k in obj) {
|
||||
if (obj.hasOwnProperty(k)) {//需判断是否是本身的属性
|
||||
res.push(obj[k]);
|
||||
}
|
||||
}
|
||||
return res;
|
||||
}
|
||||
}
|
||||
if (typeof Array.prototype.join != 'function') {
|
||||
Array.prototype.join = function (emoji) {
|
||||
// emoji = emoji||',';
|
||||
emoji = emoji || '';
|
||||
let self = this;
|
||||
let str = "";
|
||||
let i = 0;
|
||||
if (!Array.isArray(self)) { throw String(self) + 'is not Array' }
|
||||
if (self.length === 0) { return '' }
|
||||
if (self.length === 1) { return String(self[0]) }
|
||||
i = 1;
|
||||
str = this[0];
|
||||
for (; i < self.length; i++) {
|
||||
str += String(emoji) + String(self[i]);
|
||||
}
|
||||
return str;
|
||||
};
|
||||
}
|
||||
|
||||
String.prototype.rstrip = function (chars) {
|
||||
let regex = new RegExp(chars + "$");
|
||||
return this.replace(regex, "");
|
||||
};
|
||||
|
||||
Array.prototype.append = Array.prototype.push;
|
||||
String.prototype.strip = String.prototype.trim;
|
||||
|
||||
export function 是否正版(vipUrl) {
|
||||
let flag = new RegExp('qq\.com|iqiyi\.com|youku\.com|mgtv\.com|bilibili\.com|sohu\.com|ixigua\.com|pptv\.com|miguvideo\.com|le\.com|1905\.com|fun\.tv');
|
||||
return flag.test(vipUrl);
|
||||
}
|
||||
|
||||
export function urlDeal(vipUrl) {
|
||||
if (!vipUrl) {
|
||||
return ''
|
||||
}
|
||||
if (!是否正版(vipUrl)) {
|
||||
return vipUrl
|
||||
}
|
||||
if (!/miguvideo/.test(vipUrl)) {
|
||||
vipUrl = vipUrl.split('#')[0].split('?')[0];
|
||||
}
|
||||
return vipUrl
|
||||
}
|
||||
|
||||
export function urlencode(str) {
|
||||
str = (str + '').toString();
|
||||
return encodeURIComponent(str).replace(/!/g, '%21').replace(/'/g, '%27').replace(/\(/g, '%28').
|
||||
replace(/\)/g, '%29').replace(/\*/g, '%2A').replace(/%20/g, '+');
|
||||
}
|
||||
|
||||
export function base64Encode(text) {
|
||||
return CryptoJS.enc.Base64.stringify(CryptoJS.enc.Utf8.parse(text));
|
||||
}
|
||||
|
||||
export function base64Decode(text) {
|
||||
return CryptoJS.enc.Utf8.stringify(CryptoJS.enc.Base64.parse(text));
|
||||
}
|
||||
|
||||
export function urljoin(base, url) {
|
||||
base = base || '';
|
||||
url = url || '';
|
||||
let baseU = new Uri(base.trim().rstrip('/'));
|
||||
url = url.trim().rstrip('/');
|
||||
let u = undefined;
|
||||
if (url.startsWith('http://') || url.startsWith('https://')) {
|
||||
u = new Uri(url);
|
||||
} else if (url.startsWith('://')) {
|
||||
u = new Uri(baseU.protocol() + url);
|
||||
} else if (url.startsWith('//')) {
|
||||
u = new Uri(baseU.protocol() + ':' + url);
|
||||
} else {
|
||||
u = new Uri(baseU.protocol() + '://' + baseU.host() + (baseU.port() ? ':' + baseU.port() : '') + '/' + url);
|
||||
}
|
||||
if ((!u.path() || u.path().trim().length === 0) && baseU.path())
|
||||
u.path(baseU.path());
|
||||
if (!u.query() && baseU.query())
|
||||
u.query(baseU.query());
|
||||
return u.toString();
|
||||
}
|
||||
|
||||
export function md5(src) {
|
||||
return CryptoJS.MD5(src).toString();
|
||||
}
|
||||
|
||||
const DOM_CHECK_ATTR = /(url|src|href|data-original|data-src)$/;
|
||||
const SELECT_REGEX = /:eq|:lt|:gt|#/g;
|
||||
const SELECT_REGEX_A = /:eq|:lt|:gt/g;
|
||||
|
||||
export function pdfh(html, parse, base_url) {
|
||||
if (!parse || !parse.trim()) {
|
||||
return ''
|
||||
}
|
||||
let eleFind = typeof html === 'object';
|
||||
let option = undefined;
|
||||
if (eleFind && parse.startsWith('body&&')) {
|
||||
parse = parse.substr(6);
|
||||
if (parse.indexOf('&&') < 0) {
|
||||
option = parse.trim();
|
||||
parse = '*=*';
|
||||
}
|
||||
}
|
||||
if (parse.indexOf('&&') > -1) {
|
||||
let sp = parse.split('&&');
|
||||
option = sp[sp.length - 1];
|
||||
sp.splice(sp.length - 1);
|
||||
if (sp.length > 1) {
|
||||
for (let i in sp) {
|
||||
if (!SELECT_REGEX.test(sp[i])) {
|
||||
sp[i] = sp[i] + ':eq(0)';
|
||||
}
|
||||
}
|
||||
} else {
|
||||
if (!SELECT_REGEX.test(sp[0])) {
|
||||
sp[0] = sp[0] + ':eq(0)';
|
||||
}
|
||||
}
|
||||
parse = sp.join(' ');
|
||||
}
|
||||
let result = '';
|
||||
const $ = eleFind ? html.rr : cheerio.load(html);
|
||||
let ret = eleFind ? ((parse === '*=*' || $(html.ele).is(parse)) ? html.ele : $(html.ele).find(parse)) : $(parse);
|
||||
if (option) {
|
||||
if (option === 'Text') {
|
||||
result = $(ret).text();
|
||||
}
|
||||
else if (option === 'Html') {
|
||||
result = $(ret).html();
|
||||
}
|
||||
else {
|
||||
result = $(ret).attr(option);
|
||||
}
|
||||
if (result && base_url && DOM_CHECK_ATTR.test(option)) {
|
||||
if (/http/.test(result)) {
|
||||
result = result.substr(result.indexOf('http'));
|
||||
} else {
|
||||
result = urljoin(base_url, result)
|
||||
}
|
||||
}
|
||||
} else {
|
||||
result = $(ret).toString();
|
||||
}
|
||||
return result;
|
||||
}
|
||||
|
||||
export function pdfa(html, parse) {
|
||||
if (!parse || !parse.trim()) {
|
||||
return [];
|
||||
}
|
||||
let eleFind = typeof html === 'object';
|
||||
if (parse.indexOf('&&') > -1) {
|
||||
let sp = parse.split('&&');
|
||||
for (let i in sp) {
|
||||
if (!SELECT_REGEX_A.test(sp[i]) && i < sp.length - 1) {
|
||||
sp[i] = sp[i] + ':eq(0)';
|
||||
}
|
||||
}
|
||||
parse = sp.join(' ');
|
||||
}
|
||||
const $ = eleFind ? html.rr : cheerio.load(html);
|
||||
let ret = eleFind ? ($(html.ele).is(parse) ? html.ele : $(html.ele).find(parse)) : $(parse);
|
||||
let result = [];
|
||||
if (ret) {
|
||||
ret.each(function (idx, ele) {
|
||||
result.push({ rr: $, ele: ele });
|
||||
});
|
||||
}
|
||||
return result;
|
||||
}
|
||||
|
||||
globalThis.randIndex = randIndex;
|
||||
globalThis.randomStr = randomStr;
|
||||
globalThis.urljoin = urljoin;
|
||||
globalThis.joinUrl = urljoin;
|
||||
globalThis.urljoin2 = urljoin;
|
||||
globalThis.是否正版 = 是否正版;
|
||||
globalThis.urlDeal = urlDeal;
|
||||
globalThis.urlencode = urlencode;
|
||||
globalThis.encodeUrl = urlencode;
|
||||
globalThis.base64Encode = base64Encode;
|
||||
globalThis.base64Decode = base64Decode;
|
||||
globalThis.pdfa = pdfa;
|
||||
globalThis.pdfh = pdfh;
|
||||
globalThis.md5 = md5;
|
158
lib/util.ym.js
158
lib/util.ym.js
@ -1,158 +0,0 @@
|
||||
import 'assets://js/lib/uri.min.js'
|
||||
import cheerio from 'assets://js/lib/cheerio.min.js';
|
||||
import 'assets://js/lib/crypto-js.js'
|
||||
|
||||
var charStr = 'abacdefghjklmnopqrstuvwxyzABCDEFGHJKLMNOPQRSTUVWXYZ0123456789';
|
||||
export function randIndex(min, max, i) {
|
||||
let index = Math.floor(Math.random() * (max - min + 1) + min),
|
||||
numStart = charStr.length - 10;
|
||||
if (i == 0 && index >= numStart) {
|
||||
index = randIndex(min, max, i);
|
||||
}
|
||||
return index;
|
||||
}
|
||||
|
||||
export function randomStr(len) {
|
||||
let min = 0, max = charStr.length - 1, _str = '';
|
||||
len = len || 15;
|
||||
for (var i = 0, index; i < len; i++) {
|
||||
index = randIndex(min, max, i);
|
||||
_str += charStr[index];
|
||||
}
|
||||
return _str;
|
||||
}
|
||||
|
||||
export function urljoin(base, url) {
|
||||
base = base || '';
|
||||
url = url || '';
|
||||
let baseU = new Uri(base.trim().rstrip('/'));
|
||||
url = url.trim().rstrip('/');
|
||||
let u = undefined;
|
||||
if (url.startsWith('http://') || url.startsWith('https://')) {
|
||||
u = new Uri(url);
|
||||
} else if (url.startsWith('://')) {
|
||||
u = new Uri(baseU.protocol() + url);
|
||||
} else if (url.startsWith('//')) {
|
||||
u = new Uri(baseU.protocol() + ':' + url);
|
||||
} else {
|
||||
u = new Uri(baseU.protocol() + '://' + baseU.host() + (baseU.port() ? ':' + baseU.port() : '') + '/' + url);
|
||||
}
|
||||
if ((!u.path() || u.path().trim().length === 0) && baseU.path())
|
||||
u.path(baseU.path());
|
||||
if (!u.query() && baseU.query())
|
||||
u.query(baseU.query());
|
||||
return u.toString();
|
||||
}
|
||||
|
||||
const DOM_CHECK_ATTR = /(url|src|href|data-original|data-src)$/;
|
||||
const SELECT_REGEX = /:eq|:lt|:gt|#/g;
|
||||
const SELECT_REGEX_A = /:eq|:lt|:gt/g;
|
||||
|
||||
export function pdfh(html, parse, base_url) {
|
||||
if (!parse || !parse.trim()) {
|
||||
return ''
|
||||
}
|
||||
let eleFind = typeof html === 'object';
|
||||
let option = undefined;
|
||||
if (eleFind && parse.startsWith('body&&')) {
|
||||
parse = parse.substr(6);
|
||||
if (parse.indexOf('&&') < 0) {
|
||||
option = parse.trim();
|
||||
parse = '*=*';
|
||||
}
|
||||
}
|
||||
if (parse.indexOf('&&') > -1) {
|
||||
let sp = parse.split('&&');
|
||||
option = sp[sp.length - 1];
|
||||
sp.splice(sp.length - 1);
|
||||
if (sp.length > 1) {
|
||||
for (let i in sp) {
|
||||
if (!SELECT_REGEX.test(sp[i])) {
|
||||
sp[i] = sp[i] + ':eq(0)';
|
||||
}
|
||||
}
|
||||
} else {
|
||||
if (!SELECT_REGEX.test(sp[0])) {
|
||||
sp[0] = sp[0] + ':eq(0)';
|
||||
}
|
||||
}
|
||||
parse = sp.join(' ');
|
||||
}
|
||||
let result = '';
|
||||
const $ = eleFind ? html.rr : cheerio.load(html);
|
||||
let ret = eleFind ? ((parse === '*=*' || $(html.ele).is(parse)) ? html.ele : $(html.ele).find(parse)) : $(parse);
|
||||
if (option) {
|
||||
if (option === 'Text') {
|
||||
result = $(ret).text();
|
||||
}
|
||||
else if (option === 'Html') {
|
||||
result = $(ret).html();
|
||||
}
|
||||
else {
|
||||
result = $(ret).attr(option);
|
||||
}
|
||||
if (result && base_url && DOM_CHECK_ATTR.test(option)) {
|
||||
if (/http/.test(result)) {
|
||||
result = result.substr(result.indexOf('http'));
|
||||
} else {
|
||||
result = urljoin(base_url, result)
|
||||
}
|
||||
}
|
||||
} else {
|
||||
result = $(ret).toString();
|
||||
}
|
||||
return result;
|
||||
}
|
||||
|
||||
export function pdfa(html, parse) {
|
||||
if (!parse || !parse.trim()) {
|
||||
return [];
|
||||
}
|
||||
let eleFind = typeof html === 'object';
|
||||
if (parse.indexOf('&&') > -1) {
|
||||
let sp = parse.split('&&');
|
||||
for (let i in sp) {
|
||||
if (!SELECT_REGEX_A.test(sp[i]) && i < sp.length - 1) {
|
||||
sp[i] = sp[i] + ':eq(0)';
|
||||
}
|
||||
}
|
||||
parse = sp.join(' ');
|
||||
}
|
||||
const $ = eleFind ? html.rr : cheerio.load(html);
|
||||
let ret = eleFind ? ($(html.ele).is(parse) ? html.ele : $(html.ele).find(parse)) : $(parse);
|
||||
let result = [];
|
||||
if (ret) {
|
||||
ret.each(function (idx, ele) {
|
||||
result.push({ rr: $, ele: ele });
|
||||
});
|
||||
}
|
||||
return result;
|
||||
}
|
||||
|
||||
const defaultParser = {
|
||||
pdfh:pdfh,
|
||||
pdfa:pdfa,
|
||||
pd(html,parse,uri){
|
||||
let ret = this.pdfh(html,parse);
|
||||
if(typeof(uri)==='undefined'||!uri){
|
||||
uri = '';
|
||||
}
|
||||
if(DOM_CHECK_ATTR.test(parse)){
|
||||
if(/http/.test(ret)){
|
||||
ret = ret.substr(ret.indexOf('http'));
|
||||
}else{
|
||||
ret = urljoin(MY_URL,ret)
|
||||
}
|
||||
}
|
||||
return ret
|
||||
},
|
||||
};
|
||||
|
||||
globalThis.randIndex = randIndex;
|
||||
globalThis.randomStr = randomStr;
|
||||
globalThis.urljoin = urljoin;
|
||||
globalThis.joinUrl = urljoin;
|
||||
globalThis.defaultParser = defaultParser;
|
||||
globalThis.pdfa = defaultParser.pdfa;
|
||||
globalThis.pdfh = defaultParser.pdfh;
|
||||
globalThis.pd = defaultParser.pd;
|
Loading…
x
Reference in New Issue
Block a user