6/18/ds/调试助手/drpy.js

1448 lines
46 KiB
JavaScript
Raw Normal View History

2024-07-12 09:44:07 +03:00
import './lib/util.js';
import cheerio from 'assets://js/lib/cheerio.min.js';
import 'assets://js/lib/crypto-js.js'
// import muban from 'https://gitcode.net/qq_32394351/dr_py/-/raw/master/js/模板.js';
// const key = 'drpy_zbk';
// eval(req('http://192.168.1.124:5705/libs/es6py.js').content);
function init_test() {
console.log("init_test_start");
console.log(RKEY);
console.log(JSON.stringify(rule));
// clearItem(RULE_CK);
// console.log(JSON.stringify(rule));
// let aa = base64Encode('编码测试一下')
// log(aa);
// let bb = base64Decode(aa);
// log('bb:' + bb);
// console.log(request('https://www.baidu.com',{withHeaders:true}));
// console.log(request('https://www.baidu.com/favicon.ico', { toBase64: true }));
// require('http://192.168.10.99:5705/txt/pluto/drT.js');
// console.log(typeof(drT));
// console.log(drT.renderText('{{fl.cate}},hi, {{fl}}哈哈.{{fl}}',{sort: 1,cate:'movie'},'fl'));
console.log("init_test_end");
}
let rule = {};
/**
* 1.影魔的jinjia2引擎不支持 {{fl}}对象直接渲染
* Array.prototype.append = Array.prototype.push; 这种js执行后有毛病,for in 循环列表会把属性给打印出来
* 2.import es6py.js但是里面的函数没有被装载进来.比如drpy规则报错setResult2 is undefiend
* 3.无法重复导入cheerio(怎么解决drpy和parseTag里都需要导入cheerio的问题) 无法在副文件导入cheerio (现在是全部放在drpy一个文件里了,凑合解决?)
* 4.有个错误不知道哪儿来的 executeScript: com.quickjs.JSObject$Undefined cannot be cast to java.lang.String 点击选集播放打印init_test_end后面打印
* 5.需要实现 stringify 函数,比起JSON.stringify函数,它会原封不动保留中文不会编码unicode
* todo: jsp:{pdfa,pdfh,pd},json:{pdfa,pdfh,pd},jq:{pdfa,pdfh,pd}
* * 电脑看日志调试
adb tcpip 5555
adb connect 192.168.10.192
adb devices -l
adb logcat -c
adb logcat | grep -i QuickJS
* **/
/*** 以下是内置变量和解析方法 **/
const MOBILE_UA = 'Mozilla/5.0 (Linux; Android 11; M2007J3SC Build/RKQ1.200826.002; wv) AppleWebKit/537.36 (KHTML, like Gecko) Version/4.0 Chrome/77.0.3865.120 MQQBrowser/6.2 TBS/045714 Mobile Safari/537.36';
const PC_UA = 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/95.0.4638.54 Safari/537.36';
const UA = 'Mozilla/5.0';
const UC_UA = 'Mozilla/5.0 (Linux; U; Android 9; zh-CN; MI 9 Build/PKQ1.181121.001) AppleWebKit/537.36 (KHTML, like Gecko) Version/4.0 Chrome/57.0.2987.108 UCBrowser/12.5.5.1035 Mobile Safari/537.36';
const IOS_UA = 'Mozilla/5.0 (iPhone; CPU iPhone OS 13_2_3 like Mac OS X) AppleWebKit/605.1.15 (KHTML, like Gecko) Version/13.0.3 Mobile/15E148 Safari/604.1';
const RULE_CK = 'cookie'; // 源cookie的key值
// const KEY = typeof(key)!=='undefined'&&key?key:'drpy_' + (rule.title || rule.host); // 源的唯一标识
const CATE_EXCLUDE = '首页|留言|APP|下载|资讯|新闻|动态';
const TAB_EXCLUDE = '猜你|喜欢|APP|下载|剧情|热播';
const OCR_RETRY = 3;//ocr验证重试次数
// const OCR_API = 'http://dm.mudery.com:10000';//ocr在线识别接口
// const OCR_API = 'http://192.168.3.239:5705/parse/ocr';//ocr在线识别接口
const OCR_API = 'http://cms.nokia.press/parse/ocr';//ocr在线识别接口
if (typeof (MY_URL) === 'undefined') {
var MY_URL; // 全局注入变量,pd函数需要
}
var RKEY; // 源的唯一标识
var fetch;
var print;
var log;
var rule_fetch_params;
var fetch_params; // 每个位置单独的
var oheaders;
var _pdfh;
var _pdfa;
var _pd;
// const DOM_CHECK_ATTR = ['url', 'src', 'href', 'data-original', 'data-src'];
const DOM_CHECK_ATTR = /(url|src|href|data-original|data-src)$/;
const SELECT_REGEX = /:eq|:lt|:gt|#/g;
const SELECT_REGEX_A = /:eq|:lt|:gt/g;
function setResult(d) {
if (!Array.isArray(d)) {
return []
}
VODS = [];
// print(d);
d.forEach(function (it) {
let obj = {
vod_id: it.url || '',
vod_name: it.title || '',
vod_remarks: it.desc || '',
vod_content: it.content || '',
vod_pic: it.pic_url || it.img || '',
};
let keys = Object.keys(it);
if (keys.includes('tname')) {
obj.type_name = it.tname || '';
}
if (keys.includes('tid')) {
obj.type_id = it.tid || '';
}
if (keys.includes('year')) {
obj.vod_year = it.year || '';
}
if (keys.includes('actor')) {
obj.vod_actor = it.actor || '';
}
if (keys.includes('director')) {
obj.vod_director = it.director || '';
}
if (keys.includes('area')) {
obj.vod_area = it.area || '';
}
VODS.push(obj);
});
return VODS
}
function setResult2(res) {
VODS = res.list || [];
return VODS
}
function setHomeResult(res) {
if (!res || typeof (res) !== 'object') {
return []
}
return setResult(res.list);
}
// 猫了个咪
function rc(js) {
if (js === 'maomi_aes.js') {
var a = CryptoJS.enc.Utf8.parse("625222f9149e961d");
var t = CryptoJS.enc.Utf8.parse("5efdtf6060e2o330");
return {
De: function (word) {
word = CryptoJS.enc.Hex.parse(word)
return CryptoJS.AES.decrypt(CryptoJS.enc.Base64.stringify(word), a, {
iv: t,
mode: CryptoJS.mode.CBC,
padding: CryptoJS.pad.Pkcs7
}).toString(CryptoJS.enc.Utf8)
},
En: function (word) {
// print(a);
// print(word);
var Encrypted = CryptoJS.AES.encrypt(word, a, {
iv: t,
mode: CryptoJS.mode.CBC,
padding: CryptoJS.pad.Pkcs7
});
return Encrypted.ciphertext.toString();
}
};
}
return {};
}
// 千万不要用for in 推荐 forEach (for in 会打乱顺序)
//猫函数
function maoss(jxurl, ref, key) {
eval(getCryptoJS());
try {
var getVideoInfo = function (text) {
return CryptoJS.AES.decrypt(text, key, { iv: iv, padding: CryptoJS.pad.Pkcs7 }).toString(CryptoJS.enc.Utf8);
};
var token_key = key == undefined ? 'dvyYRQlnPRCMdQSe' : key;
if (ref) {
var html = request(jxurl, {
headers: {
'Referer': ref
}
});
} else {
var html = request(jxurl);
}
// print(html);
if (html.indexOf('&btwaf=') != -1) {
html = request(jxurl + '&btwaf' + html.match(/&btwaf(.*?)"/)[1], {
headers: {
'Referer': ref
}
})
}
var token_iv = html.split('_token = "')[1].split('"')[0];
var key = CryptoJS.enc.Utf8.parse(token_key);
var iv = CryptoJS.enc.Utf8.parse(token_iv);
// log("iv:"+iv);
// log(html);
// print(key);
// print(iv);
eval(html.match(/var config = {[\s\S]*?}/)[0] + '');
// config.url = config.url.replace(/,/g,'');
// print(config.url);
if (!config.url.startsWith('http')) {
//config.url = decodeURIComponent(AES(config.url, key, iv));
config.url = CryptoJS.AES.decrypt(config.url, key, {
iv: iv,
padding: CryptoJS.pad.Pkcs7
}).toString(CryptoJS.enc.Utf8)
}
return config.url;
} catch (e) {
return '';
}
}
let VODS = [];// 一级或者搜索需要的数据列表
let VOD = {};// 二级的单个数据
/**
* 重写pd方法-增加自动urljoin(没法重写,改个名继续骗)
* @param html
* @param parse
* @param uri
* @returns {*}
*/
function pD(html, parse, uri) {
let ret = pdfh(html, parse);
if (typeof (uri) === 'undefined' || !uri) {
uri = '';
}
if (DOM_CHECK_ATTR.test(parse)) {
if (/http/.test(ret)) {
ret = ret.substr(ret.indexOf('http'));
} else {
ret = urljoin(MY_URL, ret)
}
}
// MY_URL = getItem('MY_URL',MY_URL);
// console.log(`规则${RKEY}打印MY_URL:${MY_URL},uri:${uri}`);
return ret
}
const parseTags = {
jsp: {
pdfh: pdfh,
pdfa: pdfa,
pd: pD,
},
json: {
pdfh(html, parse) {
if (!parse || !parse.trim()) {
return '';
}
if (typeof (html) === 'string') {
html = JSON.parse(html);
}
parse = parse.trim();
if (!parse.startsWith('$.')) {
parse = '$.' + parse;
}
parse = parse.split('||');
for (let ps of parse) {
let ret = cheerio.jp(ps, html);
if (Array.isArray(ret)) {
ret = ret[0] || '';
} else {
ret = ret || ''
}
if (ret && typeof (ret) !== 'string') {
ret = ret.toString();
}
if (ret) {
return ret
}
}
return '';
},
pdfa(html, parse) {
if (!parse || !parse.trim()) {
return '';
}
if (typeof (html) === 'string') {
html = JSON.parse(html);
}
parse = parse.trim()
if (!parse.startsWith('$.')) {
parse = '$.' + parse;
}
let ret = cheerio.jp(parse, html);
if (Array.isArray(ret) && Array.isArray(ret[0]) && ret.length === 1) {
return ret[0] || []
}
return ret || []
},
pd(html, parse) {
let ret = parseTags.json.pdfh(html, parse);
if (ret) {
return urljoin(MY_URL, ret);
}
return ret
},
},
jq: {
pdfh: pdfh,
pdfa: pdfa,
pd(html, parse, uri) {
return parseTags.jq.pdfh(html, parse, MY_URL);
},
},
getParse(p0) {//非js开头的情况自动获取解析标签
if (p0.startsWith('jsp:')) {
return this.jsp
} else if (p0.startsWith('json:')) {
return this.json
} else if (p0.startsWith('jq:')) {
return this.jq
} else {
return this.jq
}
}
};
const stringify = JSON.stringify;
const jsp = parseTags.jsp;
/*** 后台需要实现的java方法并注入到js中 ***/
/**
* 读取本地文件->应用程序目录
* @param filePath
* @returns {string}
*/
function readFile(filePath) {
filePath = filePath || './uri.min.js';
var fd = os.open(filePath);
var buffer = new ArrayBuffer(1024);
var len = os.read(fd, buffer, 0, 1024);
console.log(len);
let text = String.fromCharCode.apply(null, new Uint8Array(buffer));
console.log(text);
return text
}
/**
* 处理返回的json数据
* @param html
* @returns {*}
*/
function dealJson(html) {
try {
return html.match(/[\w|\W|\s|\S]*?(\{[\w|\W|\s|\S]*\})/).group[1];
} catch (e) {
}
try {
html = JSON.parse(html);
} catch (e) { }
// console.log(typeof(html));
return html;
}
/**
* 验证码识别逻辑,需要java实现(js没有bytes类型,无法调用后端的传递图片二进制获取验证码文本的接口)
* @type {{api: string, classification: (function(*=): string)}}
*/
var OcrApi = {
api: OCR_API,
classification: function (img) { // img是byte类型,这里不方便搞啊
let code = '';
try {
let html = request(this.api, { data: { img: img }, headers: { 'User-Agent': PC_UA }, 'method': 'POST' });
html = JSON.parse(html);
code = html.url || '';
} catch (e) { }
return code
}
};
/**
* 验证码识别,暂未实现
* @param url 验证码图片链接
* @returns {string} 验证成功后的cookie
*/
function verifyCode(url) {
let cnt = 0;
let host = getHome(url);
let cookie = '';
while (cnt < OCR_RETRY) {
try {
// let obj = {headers:headers,timeout:timeout};
let yzm_url = `${host}/index.php/verify/index.html`;
console.log(`验证码链接:${yzm_url}`);
let hhtml = request(yzm_url, { withHeaders: true, toBase64: true });
let json = JSON.parse(hhtml);
if (!cookie) {
cookie = json['set-cookie'] ? json['set-cookie'].split(';')[0] : '';
}
// console.log(hhtml);
console.log('cookie:' + cookie);
let img = json.body;
// console.log(img);
let code = OcrApi.classification(img);
console.log(`${cnt + 1}次验证码识别结果:${code}`);
let submit_url = `${host}/index.php/ajax/verify_check?type=search&verify=${code}`;
console.log(submit_url);
let html = request(submit_url, { headers: { Cookie: cookie, 'User-Agent': MOBILE_UA }, 'method': 'POST' });
// console.log(html);
html = JSON.parse(html);
if (html.msg === 'ok') {
console.log(`${cnt + 1}次验证码提交成功`);
return cookie // 需要返回cookie
} else if (html.msg !== 'ok' && cnt + 1 >= OCR_RETRY) {
cookie = ''; // 需要清空返回cookie
}
} catch (e) {
console.log(`${cnt + 1}次验证码提交失败:${e.message}`);
if (cnt + 1 >= OCR_RETRY) {
cookie = '';
}
}
cnt += 1
}
return cookie
}
/**
* 存在数据库配置表里, key字段对应值value,没有就新增,有就更新,调用此方法会清除key对应的内存缓存
* @param k
* @param v
*/
function setItem(k, v) {
local.set(RKEY, k, v);
console.log(`规则${RKEY}设置${k} => ${v}`)
}
/**
* 获取数据库配置表对应的key字段的value没有这个key就返回value默认传参.需要有缓存,第一次获取后会存在内存里
* @param k
* @param v
* @returns {*}
*/
function getItem(k, v) {
return local.get(RKEY, k) || v;
}
/**
* 删除数据库key对应的一条数据,并清除此key对应的内存缓存
* @param k
*/
function clearItem(k) {
local.delete(RKEY, k);
}
/*** js自封装的方法 ***/
/**
* 获取链接的host(带http协议的完整链接)
* @param url 任意一个正常完整的Url,自动提取根
* @returns {string}
*/
function getHome(url) {
if (!url) {
return ''
}
let tmp = url.split('//');
url = tmp[0] + '//' + tmp[1].split('/')[0];
try {
url = decodeURIComponent(url);
} catch (e) { }
return url
}
/**
* get参数编译链接,类似python params字典自动拼接
* @param url 访问链接
* @param obj 参数字典
* @returns {*}
*/
function buildUrl(url, obj) {
obj = obj || {};
if (url.indexOf('?') < 0) {
url += '?'
}
let param_list = [];
let keys = Object.keys(obj);
keys.forEach(it => {
param_list.push(it + '=' + obj[it])
});
let prs = param_list.join('&');
if (keys.length > 0 && !url.endsWith('?')) {
url += '&'
}
url += prs;
return url
}
/**
* 远程依赖执行函数
* @param url 远程js地址
*/
function require(url) {
eval(request(url));
}
/**
* 海阔网页请求函数完整封装
* @param url 请求链接
* @param obj 请求对象 {headers:{},method:'',timeout:5000,body:'',withHeaders:false}
* @returns {string|string|DocumentFragment|*}
*/
function request(url, obj) {
if (typeof (obj) === 'undefined' || !obj || obj === {}) {
if (!fetch_params || !fetch_params.headers) {
let headers = {
'User-Agent': MOBILE_UA,
};
if (rule.headers) {
Object.assign(headers, rule.headers);
}
fetch_params.headers = headers;
}
if (!fetch_params.headers.Referer) {
fetch_params.headers.Referer = getHome(url)
}
obj = fetch_params;
} else {
let headers = obj.headers || {};
let keys = Object.keys(headers).map(it => it.toLowerCase());
if (!keys.includes('user-agent')) {
headers['User-Agent'] = MOBILE_UA;
} if (!keys.includes('referer')) {
headers['Referer'] = getHome(url);
}
obj.headers = headers;
}
console.log(JSON.stringify(obj.headers));
if (typeof (obj.headers.body) != 'undefined' && obj.headers.body && typeof (obj.headers.body) === 'string') {
let data = {};
obj.headers.body.split('&').forEach(it => {
data[it.split('=')[0]] = it.split('=')[1]
});
obj.data = data;
delete obj.headers.body
}
if (!url) {
return obj.withHeaders ? '{}' : ''
}
if (obj.toBase64) { // 返回base64,用于请求图片
obj.buffer = 2;
delete obj.toBase64
}
console.log('request:' + url);
let res = req(url, obj);
let html = res.content || '';
// console.log(html);
if (obj.withHeaders) {
let htmlWithHeaders = res.headers;
htmlWithHeaders.body = html;
return JSON.stringify(htmlWithHeaders);
} else {
return html
}
}
fetch = request;
print = function (data) {
data = data || '';
if (typeof (data) !== 'string') {
try {
data = JSON.stringify(data);
} catch (e) {
console.log('print:' + e.message)
}
}
console.log(data);
}
log = console.log;
/**
* 检查宝塔验证并自动跳过获取正确源码
* @param html 之前获取的html
* @param url 之前的来源url
* @param obj 来源obj
* @returns {string|DocumentFragment|*}
*/
function checkHtml(html, url, obj) {
if (/\?btwaf=/.test(html)) {
let btwaf = html.match(/btwaf(.*?)"/)[1];
url = url.split('#')[0] + '?btwaf' + btwaf;
html = request(url, obj);
}
return html
}
/**
* 带一次宝塔验证的源码获取
* @param url 请求链接
* @param obj 请求参数
* @returns {string|DocumentFragment}
*/
function getCode(url, obj) {
let html = request(url, obj);
html = checkHtml(html, url, obj);
return html
}
/**
* 源rule专用的请求方法,自动注入cookie
* @param url 请求链接
* @returns {string|DocumentFragment}
*/
function getHtml(url) {
let obj = {};
if (rule.headers) {
obj.headers = rule.headers;
}
let cookie = getItem(RULE_CK, '');
if (cookie) {
if (obj.headers && !Object.keys(obj.headers).map(it => it.toLowerCase()).includes('cookie')) {
obj.headers['Cookie'] = cookie;
} else if (!obj.headers) {
obj.headers = { Cookie: cookie };
}
}
let html = getCode(url, obj);
return html
}
/**
* 首页分类解析筛选暂未实现
* @param homeObj 首页传参对象
* @returns {string}
*/
function homeParse(homeObj) {
fetch_params = JSON.parse(JSON.stringify(rule_fetch_params));
let classes = [];
if (homeObj.class_name && homeObj.class_url) {
let names = homeObj.class_name.split('&');
let urls = homeObj.class_url.split('&');
let cnt = Math.min(names.length, urls.length);
for (let i = 0; i < cnt; i++) {
classes.push({
'type_id': urls[i],
'type_name': names[i]
});
}
}
if (homeObj.class_parse) {
let p = homeObj.class_parse.split(';');
if (p.length >= 4) {
try {
let html = getHtml(homeObj.MY_URL);
if (html) {
homeHtmlCache = html;
let list = pdfa(html, p[0]);
if (list && list.length > 0) {
list.forEach((it, idex) => {
try {
let name = pdfh(it, p[1]);
if (homeObj.cate_exclude && (new RegExp(homeObj.cate_exclude).test(name))) {
return;
}
let url = pdfh(it, p[2]);
if (p[3]) {
let exp = new RegExp(p[3]);
url = url.match(exp)[1];
}
classes.push({
'type_id': url.trim(),
'type_name': name.trim()
});
} catch (e) {
console.log(`分类列表定位第${idex}个元素正常报错:${e.message}`);
}
});
}
}
} catch (e) {
console.log(e.message);
}
}
}
// 排除分类
classes = classes.filter(it => !homeObj.cate_exclude || !(new RegExp(homeObj.cate_exclude).test(it.type_name)));
let resp = {
'class': classes
};
if (homeObj.filter) {
resp.filters = homeObj.filter;
}
console.log(JSON.stringify(resp));
return JSON.stringify(resp);
}
/**
* 首页推荐列表解析
* @param homeVodObj
* @returns {string}
*/
function homeVodParse(homeVodObj) {
fetch_params = JSON.parse(JSON.stringify(rule_fetch_params));
let d = [];
MY_URL = homeVodObj.homeUrl;
// setItem('MY_URL',MY_URL);
console.log(MY_URL);
let p = homeVodObj.推荐;
if (!p || typeof (p) !== 'string') {
return '{}'
}
p = p.trim();
if (p.startsWith('js:')) {
const TYPE = 'home';
var input = MY_URL;
const HOST = rule.host;
eval(p.replace('js:', ''));
d = VODS;
} else {
p = p.split(';');
if (!homeVodObj.double && p.length < 5) {
return '{}'
} else if (homeVodObj.double && p.length < 6) {
return '{}'
}
let _ps = parseTags.getParse(p[0]);
_pdfa = _ps.pdfa;
_pdfh = _ps.pdfh;
_pd = _ps.pd;
let is_json = p[0].startsWith('json:');
p[0] = p[0].replace(/^(jsp:|json:|jq:)/, '');
// print(p[0]);
let html = homeHtmlCache || getHtml(MY_URL);
homeHtmlCache = undefined;
if (is_json) {
html = dealJson(html);
}
try {
console.log('double:' + homeVodObj.double);
if (homeVodObj.double) {
let items = _pdfa(html, p[0]);
// console.log(items.length);
for (let item of items) {
// console.log(p[1]);
let items2 = _pdfa(item, p[1]);
// console.log(items2.length);
for (let item2 of items2) {
try {
let title = _pdfh(item2, p[2]);
let img = '';
try {
img = _pd(item2, p[3])
} catch (e) {
}
let desc = _pdfh(item2, p[4]);
let links = [];
for (let p5 of p[5].split('+')) {
let link = !homeVodObj.detailUrl ? _pd(item2, p5, MY_URL) : _pdfh(item2, p5);
links.push(link);
}
let vod = {
vod_name: title,
vod_pic: img,
vod_remarks: desc,
vod_id: links.join('$')
};
// print(vod);
d.push(vod);
} catch (e) {
console.log('首页列表处理发生错误:' + e.message);
}
}
}
} else {
let items = _pdfa(html, p[0]);
for (let item of items) {
try {
let title = _pdfh(item, p[1]);
let img = '';
try {
img = _pd(item, p[2], MY_URL);
} catch (e) {
}
let desc = _pdfh(item, p[3]);
let links = [];
for (let p5 of p[4].split('+')) {
let link = !homeVodObj.detailUrl ? _pd(item, p5, MY_URL) : _pdfh(item, p5);
links.push(link);
}
let vod = {
vod_name: title,
vod_pic: img,
vod_remarks: desc,
vod_id: links.join('$')
};
d.push(vod);
} catch (e) {
}
}
}
} catch (e) {
}
}
// console.log(JSON.stringify(d));
return JSON.stringify({
list: d
})
}
/**
* 一级分类页数据解析
* @param cateObj
* @returns {string}
*/
function categoryParse(cateObj) {
fetch_params = JSON.parse(JSON.stringify(rule_fetch_params));
let p = cateObj.一级;
if (!p || typeof (p) !== 'string') {
return '{}'
}
let d = [];
// let url = cateObj.url.replaceAll('fyclass', cateObj.tid).replaceAll('fypage', cateObj.pg);
let url = cateObj.url.replaceAll('fyclass', cateObj.tid);
if (rule.filter_url) {
if (!/fyfilter/.test(url)) {
if (!url.endsWith('&') && !rule.filter_url.startsWith('&')) {
url += '&'
}
url += rule.filter_url;
} else {
url = url.replace('fyfilter', rule.filter_url);
}
// console.log('filter:'+cateObj.filter);
let fl = cateObj.filter ? cateObj.extend : {};
let new_url;
new_url = cheerio.jinja2(url, { fl: fl });
// if (/object Object/.test(new_url)) {
// new_url = drT.renderText(url, fl);
// }
url = new_url;
}
if (/fypage/.test(url)) {
if (url.includes('(') && url.includes(')')) {
let url_rep = url.match(/.*?\((.*)\)/)[1];
// console.log(url_rep);
let cnt_page = url_rep.replaceAll('fypage', cateObj.pg);
// console.log(cnt_page);
let cnt_pg = eval(cnt_page);
// console.log(cnt_pg);
url = url.replaceAll(url_rep, cnt_pg).replaceAll('(', '').replaceAll(')', '');
} else {
url = url.replaceAll('fypage', cateObj.pg);
}
}
if (cateObj.pg === 1 && url.includes('[') && url.includes(']')) {
url = url.split('[')[1].split(']')[0];
}
MY_URL = url;
// setItem('MY_URL',MY_URL);
console.log(MY_URL);
p = p.trim();
const MY_CATE = cateObj.tid;
if (p.startsWith('js:')) {
var MY_FL = cateObj.extend;
const TYPE = 'cate';
var input = MY_URL;
const MY_PAGE = cateObj.pg;
var desc = '';
eval(p.trim().replace('js:', ''));
d = VODS;
} else {
p = p.split(';');
if (p.length < 5) {
return '{}'
}
let _ps = parseTags.getParse(p[0]);
_pdfa = _ps.pdfa;
_pdfh = _ps.pdfh;
_pd = _ps.pd;
let is_json = p[0].startsWith('json:');
p[0] = p[0].replace(/^(jsp:|json:|jq:)/, '');
try {
let html = getHtml(MY_URL);
if (html) {
if (is_json) {
html = dealJson(html);
}
let list = _pdfa(html, p[0]);
list.forEach(it => {
let links = p[4].split('+').map(p4 => {
return !rule.detailUrl ? _pd(it, p4, MY_URL) : _pdfh(it, p4);
});
let link = links.join('$');
let vod_id = rule.detailUrl ? MY_CATE + '$' + link : link;
d.push({
'vod_id': vod_id,
'vod_name': _pdfh(it, p[1]).replace(/\n|\t/g, '').trim(),
'vod_pic': _pd(it, p[2], MY_URL),
'vod_remarks': _pdfh(it, p[3]).replace(/\n|\t/g, '').trim(),
});
});
}
} catch (e) {
console.log(e.message);
}
}
// print(d);
return d.length < 1 ? '{}' : JSON.stringify({
'page': parseInt(cateObj.pg),
'pagecount': 999,
'limit': 20,
'total': 999,
'list': d,
});
}
/**
* 搜索列表数据解析
* @param searchObj
* @returns {string}
*/
function searchParse(searchObj) {
fetch_params = JSON.parse(JSON.stringify(rule_fetch_params));
let d = [];
if (!searchObj.searchUrl) {
return '{}'
}
let p = searchObj.搜索 === '*' && rule.一级 ? rule.一级 : searchObj.搜索;
if (!p || typeof (p) !== 'string') {
return '{}'
}
p = p.trim();
let url = searchObj.searchUrl.replaceAll('**', searchObj.wd).replaceAll('fypage', searchObj.pg);
MY_URL = url;
console.log(MY_URL);
// setItem('MY_URL',MY_URL);
if (p.startsWith('js:')) {
const TYPE = 'search';
const MY_PAGE = searchObj.pg;
const KEY = searchObj.wd;
var input = MY_URL;
var detailUrl = rule.detailUrl || '';
eval(p.trim().replace('js:', ''));
d = VODS;
} else {
p = p.split(';');
if (p.length < 5) {
return '{}'
}
let _ps = parseTags.getParse(p[0]);
_pdfa = _ps.pdfa;
_pdfh = _ps.pdfh;
_pd = _ps.pd;
let is_json = p[0].startsWith('json:');
p[0] = p[0].replace(/^(jsp:|json:|jq:)/, '');
try {
let html = getHtml(MY_URL);
if (html) {
if (/系统安全验证|输入验证码/.test(html)) {
let cookie = verifyCode(MY_URL);
if (cookie) {
console.log(`本次成功过验证,cookie:${cookie}`);
setItem(RULE_CK, cookie);
} else {
console.log(`本次自动过搜索验证失败,cookie:${cookie}`);
}
// obj.headers['Cookie'] = cookie;
html = getHtml(MY_URL);
}
if (!html.includes(searchObj.wd)) {
console.log('搜索结果源码未包含关键字,疑似搜索失败,正为您打印结果源码');
console.log(html);
}
if (is_json) {
html = dealJson(html);
}
let list = _pdfa(html, p[0]);
list.forEach(it => {
let links = p[4].split('+').map(p4 => {
return !rule.detailUrl ? _pd(it, p4, MY_URL) : _pdfh(it, p4)
});
let link = links.join('$');
let ob = {
'vod_id': link,
'vod_name': _pdfh(it, p[1]).replace(/\n|\t/g, '').trim(),
'vod_pic': _pd(it, p[2], MY_URL),
'vod_remarks': _pdfh(it, p[3]).replace(/\n|\t/g, '').trim(),
};
if (p.length > 5 && p[5]) {
ob.vod_content = _pdfh(it, p[5]);
}
d.push(ob);
});
}
} catch (e) {
return '{}'
}
}
return JSON.stringify({
'page': parseInt(searchObj.pg),
'pagecount': 10,
'limit': 20,
'total': 100,
'list': d,
});
}
/**
* 二级详情页数据解析
* @param detailObj
* @returns {string}
*/
function detailParse(detailObj) {
fetch_params = JSON.parse(JSON.stringify(rule_fetch_params));
let vod = {
vod_id: detailObj.orId, //"id",
vod_name: "片名",
vod_pic: "",
type_name: "剧情",
vod_year: "年份",
vod_area: "地区",
vod_remarks: "更新信息",
vod_actor: "主演",
vod_director: "导演",
vod_content: "简介"
};
let p = detailObj.二级;
let url = detailObj.url;
let detailUrl = detailObj.detailUrl;
let fyclass = detailObj.fyclass;
let tab_exclude = detailObj.tab_exclude;
let html = detailObj.html || '';
MY_URL = url;
console.log(MY_URL);
// setItem('MY_URL',MY_URL);
if (p === '*') {
vod.vod_play_from = '道长在线';
vod.vod_remarks = detailUrl;
vod.vod_actor = '没有二级,只有一级链接直接嗅探播放';
vod.vod_content = MY_URL;
vod.vod_play_url = '嗅探播放$' + MY_URL;
} else if (typeof (p) === 'string' && p.trim().startsWith('js:')) {
const TYPE = 'detail';
var input = MY_URL;
eval(p.trim().replace('js:', ''));
vod = VOD;
console.log(JSON.stringify(vod));
} else if (p && typeof (p) === 'object') {
if (!html) {
html = getHtml(MY_URL);
}
let _impJQP = true;
let _ps;
if (p.is_json) {
_ps = parseTags.json;
html = dealJson(html);
_impJQP = false;
} else if (p.is_jsp) {
_ps = parseTags.jsp;
} else if (p.is_jq) {
_ps = parseTags.jq;
} else {
_ps = parseTags.jq;
}
if (_impJQP) {
let c$ = cheerio.load(html);
html = { rr: c$, ele: c$('html')[0] }
}
_pdfa = _ps.pdfa;
_pdfh = _ps.pdfh;
_pd = _ps.pd;
if (p.title) {
let p1 = p.title.split(';');
vod.vod_name = _pdfh(html, p1[0]).replace(/\n|\t/g, '').trim();
let type_name = p1.length > 1 ? _pdfh(html, p1[1]).replace(/\n|\t/g, '').replace(/ /g, '').trim() : '';
vod.type_name = type_name || vod.type_name;
}
if (p.desc) {
try {
let p1 = p.desc.split(';');
vod.vod_remarks = _pdfh(html, p1[0]).replace(/\n|\t/g, '').trim();
vod.vod_year = p1.length > 1 ? _pdfh(html, p1[1]).replace(/\n|\t/g, '').trim() : '';
vod.vod_area = p1.length > 2 ? _pdfh(html, p1[2]).replace(/\n|\t/g, '').trim() : '';
// vod.vod_actor = p1.length > 3 ? _pdfh(html, p1[3]).replaceAll('\n', ' ').trim():'';
vod.vod_actor = p1.length > 3 ? _pdfh(html, p1[3]).replace(/\n|\t/g, '').trim() : '';
vod.vod_director = p1.length > 4 ? _pdfh(html, p1[4]).replace(/\n|\t/g, '').trim() : '';
}
catch (e) {
}
}
if (p.content) {
try {
let p1 = p.content.split(';');
vod.vod_content = _pdfh(html, p1[0]).replace(/\n|\t/g, '').trim();
}
catch (e) { }
}
if (p.img) {
try {
let p1 = p.img.split(';');
vod.vod_pic = _pd(html, p1[0], MY_URL);
}
catch (e) { }
}
let vod_play_from = '$$$';
let playFrom = [];
if (p.重定向 && p.重定向.startsWith('js:')) {
html = eval(p.重定向.replace('js:', ''));
if (_impJQP) {
let c$ = cheerio.load(html);
html = { rr: c$, ele: c$('html')[0] }
}
}
// console.log(2);
if (p.tabs) {
let p_tab = p.tabs.split(';')[0];
console.log(p_tab);
let vHeader = _pdfa(html, p_tab);
console.log(vHeader.length);
for (let v of vHeader) {
let v_title = _pdfh(v, 'body&&Text');
console.log(v_title);
if (tab_exclude && (new RegExp(tab_exclude)).test(v_title)) {
continue;
}
playFrom.push(v_title);
}
console.log(JSON.stringify(playFrom));
} else {
playFrom = ['道长在线']
}
vod.vod_play_from = playFrom.join(vod_play_from);
// console.log(3);
let vod_play_url = '$$$';
let vod_tab_list = [];
if (p.lists) {
for (let i = 0; i < playFrom.length; i++) {
let tab_name = playFrom[i];
let tab_ext = p.tabs.split(';').length > 1 ? p.tabs.split(';')[1] : '';
let p1 = p.lists.replaceAll('#idv', tab_name).replaceAll('#id', i);
tab_ext = tab_ext.replaceAll('#idv', tab_name).replaceAll('#id', i);
console.log(p1);
// console.log(html);
let vodList = [];
try {
vodList = _pdfa(html, p1);
console.log('len(vodList):' + vodList.length);
} catch (e) {
// console.log(e.message);
}
let new_vod_list = [];
let tabName = tab_ext ? _pdfh(html, tab_ext) : tab_name;
console.log(tabName);
// console.log('cheerio解析Text');
vodList.forEach(it => {
// 请注意,这里要固定pdfh解析body&&Text,不需要下划线,没写错
// new_vod_list.push(pdfh(it,'body&&Text')+'$'+_pd(it,'a&&href',MY_URL));
// new_vod_list.push(cheerio.load(it).text() + '$' + _pd(it, 'a&&href', MY_URL));
new_vod_list.push(_pdfh(it, 'body&&Text') + '$' + _pd(it, 'a&&href', MY_URL));
});
let vlist = new_vod_list.join('#');
vod_tab_list.push(vlist);
}
}
vod.vod_play_url = vod_tab_list.join(vod_play_url);
}
// print(vod);
return JSON.stringify({
list: [vod]
})
}
/**
* 选集播放点击事件解析
* @param playObj
* @returns {string}
*/
function playParse(playObj) {
fetch_params = JSON.parse(JSON.stringify(rule_fetch_params));
MY_URL = playObj.url;
if (!/http/.test(MY_URL)) {
try {
MY_URL = base64Decode(MY_URL);
} catch (e) { }
}
MY_URL = decodeURIComponent(MY_URL);
var input = MY_URL;//注入给免嗅js
let common_play = {
parse: 1,
url: input
};
let lazy_play;
if (!rule.play_parse || !rule.lazy) {
lazy_play = common_play;
} else if (rule.play_parse && rule.lazy && typeof (rule.lazy) === 'string') {
try {
let lazy_code = rule.lazy.replace('js:', '').trim();
print('开始执行js免嗅=>' + lazy_code);
eval(lazy_code);
lazy_play = typeof (input) === 'object' ? input : {
parse: 1,
jx: 1,
url: input
};
} catch (e) {
print('js免嗅错误:' + e.message);
lazy_play = common_play;
}
} else {
lazy_play = common_play;
}
console.log(JSON.stringify(lazy_play));
return JSON.stringify(lazy_play);
}
/**
* js源预处理特定返回对象中的函数
* @param ext
*/
function init(ext) {
console.log('init');
try {
// make shared jsContext happy
if (typeof (globalThis.mubanJs) === 'undefined') {
let mubanJs = request('https://gitcode.net/qq_32394351/dr_py/-/raw/master/js/模板.js', { 'User-Agent': MOBILE_UA });
mubanJs = mubanJs.replace('export default', '(function() {return muban;}()) // export default');
globalThis.mubanJs = mubanJs;
}
let muban = eval(globalThis.mubanJs);
if (typeof ext == 'object') {
rule = ext;
if (rule.template) {
rule = Object.assign(muban[rule.template], rule);
}
} else if (typeof ext == 'string') {
if (ext.startsWith('http')) {
let js = request(ext, { 'method': 'GET' });
if (js) {
eval(js.replace('var rule', 'rule'));
}
}
} else {
eval(ext.replace('var rule', 'rule'));
}
/** 处理一下 rule规则关键字段没传递的情况 **/
let rule_cate_excludes = (rule.cate_exclude || '').split('|').filter(it => it.trim());
let rule_tab_excludes = (rule.tab_exclude || '').split('|').filter(it => it.trim());
rule_cate_excludes = rule_cate_excludes.concat(CATE_EXCLUDE.split('|').filter(it => it.trim()));
rule_tab_excludes = rule_tab_excludes.concat(TAB_EXCLUDE.split('|').filter(it => it.trim()));
rule.cate_exclude = rule_cate_excludes.join('|');
rule.tab_exclude = rule_tab_excludes.join('|');
rule.host = (rule.host || '').rstrip('/');
rule.url = rule.url || '';
rule.double = rule.double || false;
rule.homeUrl = rule.homeUrl || '';
rule.detailUrl = rule.detailUrl || '';
rule.searchUrl = rule.searchUrl || '';
rule.homeUrl = rule.host && rule.homeUrl ? urljoin(rule.host, rule.homeUrl) : (rule.homeUrl || rule.host);
rule.detailUrl = rule.host && rule.detailUrl ? urljoin(rule.host, rule.detailUrl) : rule.detailUrl;
if (rule.url.includes('[') && rule.url.includes(']')) {
let u1 = rule.url.split('[')[0]
let u2 = rule.url.split('[')[1].split(']')[0]
rule.url = rule.host && rule.url ? urljoin(rule.host, u1) + '[' + urljoin(rule.host, u2) + ']' : rule.url;
} else {
rule.url = rule.host && rule.url ? urljoin(rule.host, rule.url) : rule.url;
}
rule.searchUrl = rule.host && rule.searchUrl ? urljoin(rule.host, rule.searchUrl) : rule.searchUrl;
rule.timeout = rule.timeout || 5000;
rule.encoding = rule.编码 || rule.encoding || 'utf-8';
if (rule.headers && typeof (rule.headers) === 'object') {
try {
let header_keys = Object.keys(rule.headers);
for (let k of header_keys) {
if (k.toLowerCase() === 'user-agent') {
let v = rule.headers[k];
console.log(v);
if (['MOBILE_UA', 'PC_UA', 'UC_UA', 'IOS_UA', 'UA'].includes(v)) {
rule.headers[k] = eval(v);
}
}
}
} catch (e) {
console.log('处理headers发生错误:' + e.message);
}
}
// print(rule.headers);
rule_fetch_params = { 'headers': rule.headers || false, 'timeout': rule.timeout, 'encoding': rule.encoding };
oheaders = rule.headers || {};
RKEY = typeof (key) !== 'undefined' && key ? key : 'drpy_' + (rule.title || rule.host);
init_test();
} catch (e) {
console.log('init_test发生错误:' + e.message);
}
}
let homeHtmlCache = undefined;
/**
* js源获取首页分类和筛选特定返回对象中的函数
* @param filter 筛选条件字典对象
* @returns {string}
*/
function home(filter) {
console.log("home");
let homeObj = {
filter: rule.filter || false,
MY_URL: rule.homeUrl,
class_name: rule.class_name || '',
class_url: rule.class_url || '',
class_parse: rule.class_parse || '',
cate_exclude: rule.cate_exclude,
};
return homeParse(homeObj);
}
/**
* js源获取首页推荐数据列表特定返回对象中的函数
* @param params
* @returns {string}
*/
function homeVod(params) {
let homeVodObj = {
推荐: rule.推荐,
double: rule.double,
homeUrl: rule.homeUrl,
detailUrl: rule.detailUrl
};
return homeVodParse(homeVodObj)
// return "{}";
}
/**
* js源获取分类页一级数据列表特定返回对象中的函数
* @param tid 分类id
* @param pg 页数
* @param filter 当前选中的筛选条件
* @param extend 扩展
* @returns {string}
*/
function category(tid, pg, filter, extend) {
let cateObj = {
url: rule.url,
一级: rule.一级,
tid: tid,
pg: parseInt(pg),
filter: filter,
extend: extend
};
// console.log(JSON.stringify(extend));
return categoryParse(cateObj)
}
/**
* js源获取二级详情页数据特定返回对象中的函数
* @param vod_url 一级列表中的vod_id或者是带分类的自拼接 vod_id fyclass$vod_id
* @returns {string}
*/
function detail(vod_url) {
let orId = vod_url;
let fyclass = '';
if (vod_url.indexOf('$') > -1) {
let tmp = vod_url.split('$');
fyclass = tmp[0];
vod_url = tmp[1];
}
let detailUrl = vod_url;
let url;
if (!detailUrl.startsWith('http') && !detailUrl.includes('/')) {
url = rule.detailUrl.replaceAll('fyid', detailUrl).replaceAll('fyclass', fyclass);
} else if (detailUrl.includes('/')) {
url = urljoin(rule.homeUrl, detailUrl);
} else {
url = detailUrl
}
let detailObj = {
orId: orId,
url: url,
二级: rule.二级,
detailUrl: detailUrl,
fyclass: fyclass,
tab_exclude: rule.tab_exclude,
}
return detailParse(detailObj)
}
/**
* js源选集按钮播放点击事件特定返回对象中的函数
* @param flag 线路名
* @param id 播放按钮的链接
* @param flags 全局配置的flags是否需要解析的标识列表
* @returns {string}
*/
function play(flag, id, flags) {
let playObj = {
url: id,
flag: flag,
flags: flags
}
return playParse(playObj);
}
/**
* js源搜索返回的数据列表特定返回对象中的函数
* @param wd 搜索关键字
* @param quick 是否来自快速搜索
* @returns {string}
*/
function search(wd, quick) {
let searchObj = {
searchUrl: rule.searchUrl,
搜索: rule.搜索,
wd: wd,
//pg: pg,
pg: 1,
quick: quick,
};
// console.log(JSON.stringify(searchObj));
return searchParse(searchObj)
}
function DRPY() {//导出函数
return {
init: init,
home: home,
homeVod: homeVod,
category: category,
detail: detail,
play: play,
search: search,
}
}
let pd = pD;
// 导出函数对象
__JS_SPIDER__ = {
init: init,
home: home,
homeVod: homeVod,
category: category,
detail: detail,
play: play,
search: search,
DRPY: DRPY
}