2247 lines
74 KiB
JavaScript
2247 lines
74 KiB
JavaScript
import cheerio from './cheerio.min.js';
|
||
import './crypto-js.js';
|
||
import 模板 from"./模板.js"
|
||
import {gbkTool} from './gbk.js'
|
||
|
||
// import cheerio from "https://ghproxy.net/https://raw.githubusercontent.com/hjdhnx/dr_py/main/libs/cheerio.min.js";
|
||
// import "https://ghproxy.net/https://raw.githubusercontent.com/hjdhnx/dr_py/main/libs/crypto-js.js";
|
||
// import 模板 from"https://ghproxy.net/https://raw.githubusercontent.com/hjdhnx/dr_py/main/js/模板.js";
|
||
// import {gbkTool} from 'https://ghproxy.net/https://raw.githubusercontent.com/hjdhnx/dr_py/main/libs/gbk.js'
|
||
|
||
/**
 * Debug helper: prints the runtime version, the current rule key and the
 * serialized rule object between start/end markers.
 */
function init_test() {
    console.log("init_test_start");
    console.log(`当前版本号:${VERSION}`);
    console.log(RKEY);
    const serializedRule = JSON.stringify(rule);
    console.log(serializedRule);
    console.log("init_test_end");
}
|
||
|
||
/**
 * Runs the rule's optional pre-processing snippet (`rule.预处理`).
 *
 * The snippet is evaluated with a direct `eval`, so it can see this function's
 * locals and the module scope; per the original notes it is expected to
 * adjust things such as `rule_fetch_params.headers.Cookie`.
 * Errors raised by the snippet are logged and swallowed.
 */
function pre() {
    // Nothing to do unless the rule carries a non-blank string snippet.
    if (typeof rule.预处理 !== 'string' || !rule.预处理.trim()) {
        return;
    }
    let code = rule.预处理.trim();
    console.log("执行预处理代码:" + code);
    if (code.startsWith('js:')) {
        // Strip the first "js:" marker only.
        code = code.replace('js:', '');
    }
    try {
        eval(code);
    } catch (e) {
        console.log('预处理执行失败:' + e.message);
    }
}
|
||
|
||
// The currently loaded rule; starts out empty.
let rule = {};
// Engine flavour: "drpy2.1" when the host injects a `pdfl` function, otherwise "drpy2".
let vercode = typeof pdfl === 'function' ? 'drpy2.1' : 'drpy2';
const VERSION = `${vercode} 3.9.43beta1 20230607`;
|
||
/** 已知问题记录
|
||
* 1.影魔的jinja2引擎不支持 {{fl}}对象直接渲染 (有能力解决的话尽量解决下,支持对象直接渲染字符串转义,如果加了|safe就不转义)[影魔牛逼,最新的文件发现这问题已经解决了]
|
||
* Array.prototype.append = Array.prototype.push; 这种js执行后有毛病,for in 循环列表会把属性给打印出来 (这个大毛病需要重点排除一下)
|
||
* 2.import es6py.js但是里面的函数没有被装载进来.比如drpy规则报错setResult2 is undefined(合并文件了可以不管了)
|
||
* 3.无法重复导入cheerio(怎么解决drpy和parseTag里都需要导入cheerio的问题) 无法在副文件导入cheerio (现在是全部放在drpy一个文件里了,凑合解决?)
|
||
* 4.有个错误不知道哪儿来的 executeScript: com.quickjs.JSObject$Undefined cannot be cast to java.lang.String 在 点击选集播放打印init_test_end后面打印(貌似不影响使用)
|
||
* 5.需要实现 stringify 函数,比起JSON.stringify函数,它会原封不动保留中文不会编码unicode
|
||
* 6.base64Encode,base64Decode,md5函数还没有实现 (抄影魔代码实现了)
|
||
* 7.eval(getCryptoJS());还没有实现 (可以空实现了,以后遇到能忽略)
|
||
* done: jsp:{pdfa,pdfh,pd},json:{pdfa,pdfh,pd},jq:{pdfa,pdfh,pd}
|
||
* 8.req函数不支持传递字符串的data参数 {'content-type':'text/plain'} 类型数据,因此无法直接调用alist的ocr接口
|
||
* * 电脑看日志调试
|
||
adb tcpip 5555
|
||
adb connect 192.168.10.192
|
||
adb devices -l
|
||
adb logcat -c
|
||
adb logcat | grep -i QuickJS
|
||
adb logcat -c -b events
|
||
adb logcat -c -b main -b events -b radio -b system
|
||
adb logcat > 2.log DRPY:E | grep -i QuickJS
|
||
* **/
|
||
|
||
|
||
/*** Built-in variables and parsing helpers ***/

// User-Agent presets.
const MOBILE_UA = 'Mozilla/5.0 (Linux; Android 11; M2007J3SC Build/RKQ1.200826.002; wv) AppleWebKit/537.36 (KHTML, like Gecko) Version/4.0 Chrome/77.0.3865.120 MQQBrowser/6.2 TBS/045714 Mobile Safari/537.36';
const PC_UA = 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/95.0.4638.54 Safari/537.36';
const UA = 'Mozilla/5.0';
const UC_UA = 'Mozilla/5.0 (Linux; U; Android 9; zh-CN; MI 9 Build/PKQ1.181121.001) AppleWebKit/537.36 (KHTML, like Gecko) Version/4.0 Chrome/57.0.2987.108 UCBrowser/12.5.5.1035 Mobile Safari/537.36';
const IOS_UA = 'Mozilla/5.0 (iPhone; CPU iPhone OS 13_2_3 like Mac OS X) AppleWebKit/605.1.15 (KHTML, like Gecko) Version/13.0.3 Mobile/15E148 Safari/604.1';

// Storage key under which a rule's cookie is kept.
const RULE_CK = 'cookie';
// const KEY = typeof(key)!=='undefined'&&key?key:'drpy_' + (rule.title || rule.host); // unique id of the source

// Default "|"-separated exclusion patterns for category names and tab names.
const CATE_EXCLUDE = '首页|留言|APP|下载|资讯|新闻|动态';
const TAB_EXCLUDE = '猜你|喜欢|下载|剧情|热播';

// Number of attempts made when solving a captcha through OCR.
const OCR_RETRY = 3;
// Previously used OCR endpoints, kept for reference:
// const OCR_API = 'http://dm.mudery.com:10000';
// const OCR_API = 'http://192.168.3.239:5705/parse/ocr';
// const OCR_API = 'http://cms.nokia.press/parse/ocr';
// const OCR_API = 'http://cms.nokia.press:5707/parse/ocr';
// Online OCR recognition endpoint.
const OCR_API = 'http://drpy.nokia.press:8028/ocr/drpy/text';

// Globally injected current-page URL; the pd helpers resolve relative links against it.
// (`var` is hoisted, so a plain declaration is equivalent to the guarded one.)
var MY_URL;
// Shared mutable state, assigned elsewhere in this file or by the host.
var HOST,
    RKEY, // unique id of the current source
    fetch,
    print,
    log,
    rule_fetch_params,
    fetch_params, // per-call copy of the request parameters
    oheaders;
// var play_url; // injected on the detail page for js mode 0 (declared there as an empty string instead)
// Parser functions selected for the rule currently being processed.
var _pdfh,
    _pdfa,
    _pd;

// const DOM_CHECK_ATTR = ['url', 'src', 'href', 'data-original', 'data-src'];
// Selector expressions ending in one of these attribute names yield links.
const DOM_CHECK_ATTR = /(url|src|href|-original|-src|-play|-url)$/;
// Selectors matching this pattern do not get an automatic :eq index appended.
const NOADD_INDEX = /:eq|:lt|:gt|:first|:last|^body$|^#/;
// Attributes whose values should be passed through urljoin automatically.
const URLJOIN_ATTR = /(url|src|href|-original|-src|-play|-url)$/;
const SELECT_REGEX = /:eq|:lt|:gt|#/g;
const SELECT_REGEX_A = /:eq|:lt|:gt/g;
|
||
|
||
/**
 * es6py extensions: polyfills and helpers for older JS engines.
 */
// Object.assign fallback: copies own enumerable properties of every source
// argument onto the first argument and returns it.
if (typeof Object.assign != 'function') {
    Object.assign = function () {
        const target = arguments[0];
        const sources = Array.prototype.slice.call(arguments, 1);
        sources.forEach(function (source) {
            for (const key in source) {
                if (!Object.prototype.hasOwnProperty.call(source, key)) {
                    continue;
                }
                target[key] = source[key];
            }
        });
        return target;
    };
}
|
||
// String.prototype.includes fallback for engines that lack it.
if (!String.prototype.includes) {
    String.prototype.includes = function (search, start) {
        // Any non-number start position is treated as 0.
        const from = typeof start === 'number' ? start : 0;
        // The needle cannot fit in what remains of the string.
        if (from + search.length > this.length) {
            return false;
        }
        return this.indexOf(search, from) !== -1;
    };
}
|
||
|
||
// Array.prototype.includes fallback (strict-equality search, so NaN is never found).
if (!Array.prototype.includes) {
    Object.defineProperty(Array.prototype, 'includes', {
        value: function (searchElement, fromIndex) {
            if (this == null) {
                // Called on null/undefined.
                throw new TypeError('"this" is null or not defined');
            }
            const list = Object(this);
            // Unsigned shift coerces a missing/invalid length to 0.
            const size = list.length >>> 0;
            if (size === 0) {
                return false;
            }
            const offset = fromIndex | 0;
            // A negative offset counts back from the end, clamped at 0.
            const begin = Math.max(offset >= 0 ? offset : size - Math.abs(offset), 0);
            for (let pos = begin; pos < size; pos++) {
                if (list[pos] === searchElement) {
                    return true;
                }
            }
            return false;
        }
    });
}
|
||
// String.prototype.startsWith fallback: compares the leading characters with the prefix.
if (typeof String.prototype.startsWith != 'function') {
    String.prototype.startsWith = function (prefix) {
        const head = this.substring(0, prefix.length);
        return head === prefix;
    };
}
|
||
// String.prototype.endsWith fallback: searches for the suffix starting at the
// only offset where it could end the string.
if (typeof String.prototype.endsWith != 'function') {
    String.prototype.endsWith = function (suffix) {
        const offset = this.length - suffix.length;
        return this.indexOf(suffix, offset) !== -1;
    };
}
|
||
/**
 * Object.prototype.myValues(obj): returns the own enumerable property values
 * of `obj` as an array.
 *
 * Installed with Object.defineProperty as a NON-enumerable property. A plain
 * assignment to Object.prototype would make "myValues" appear in every
 * `for...in` loop over any object.
 *
 * @param obj object whose values are collected
 * @returns {Array} values of obj's own enumerable properties
 * @throws {TypeError} when obj is null or undefined
 */
Object.defineProperty(Object.prototype, 'myValues', {
    value: function (obj) {
        if (obj == null) {
            throw new TypeError("Cannot convert undefined or null to object");
        }
        var res = [];
        for (var k in obj) {
            // Own properties only; call through the prototype so objects
            // created with Object.create(null) work too.
            if (Object.prototype.hasOwnProperty.call(obj, k)) {
                res.push(obj[k]);
            }
        }
        return res;
    },
    // writable/configurable keep the semantics of the former plain assignment
    // (objects may still define their own "myValues" key).
    writable: true,
    configurable: true,
    enumerable: false
});
|
||
/**
 * Object.prototype.values(obj): instance-level helper returning the own
 * enumerable property values of `obj`.
 *
 * Standard engines only provide the static Object.values, so this guard is
 * normally true and the helper is installed. It is defined NON-enumerable so
 * that "values" does not show up in `for...in` loops over unrelated objects.
 *
 * @param obj object whose values are collected
 * @returns {Array} values of obj's own enumerable properties
 * @throws {TypeError} when obj is null or undefined
 */
if (typeof Object.prototype.values != 'function') {
    Object.defineProperty(Object.prototype, 'values', {
        value: function (obj) {
            if (obj == null) {
                throw new TypeError("Cannot convert undefined or null to object");
            }
            var res = [];
            for (var k in obj) {
                // Own properties only; safe for prototype-less objects as well.
                if (Object.prototype.hasOwnProperty.call(obj, k)) {
                    res.push(obj[k]);
                }
            }
            return res;
        },
        // Keep plain-assignment semantics apart from enumerability.
        writable: true,
        configurable: true,
        enumerable: false
    });
}
|
||
// Array.prototype.join fallback. Unlike the native method, the default
// separator here is the empty string rather than ",".
if (typeof Array.prototype.join != 'function') {
    Array.prototype.join = function (emoji) {
        // emoji = emoji||',';
        emoji = emoji || '';
        const items = this;
        if (!Array.isArray(items)) {
            throw String(items)+'is not Array'
        }
        if (items.length === 0) {
            return '';
        }
        if (items.length === 1) {
            return String(items[0]);
        }
        // The first element seeds the accumulator as-is; later ones are stringified.
        let joined = items[0];
        for (let idx = 1; idx < items.length; idx++) {
            joined += String(emoji) + String(items[idx]);
        }
        return joined;
    };
}
|
||
|
||
/**
 * Removes one trailing occurrence of `chars` from the string.
 * `chars` is inserted into a regular expression unescaped, so regex
 * metacharacters in it keep their special meaning.
 */
String.prototype.rstrip = function (chars) {
    const trailing = new RegExp(`${chars}$`);
    return this.replace(trailing, "");
};
|
||
|
||
// Python-style aliases: Array#append -> push, String#strip -> trim.
// Defined NON-enumerable: a plain assignment makes "append" show up as a key
// in every `for...in` loop over an array (see the known-issues note at the
// top of this file). writable/configurable keep them replaceable as before.
Object.defineProperty(Array.prototype, 'append', {
    value: Array.prototype.push,
    writable: true,
    configurable: true,
    enumerable: false
});
Object.defineProperty(String.prototype, 'strip', {
    value: String.prototype.trim,
    writable: true,
    configurable: true,
    enumerable: false
});
|
||
/**
 * Tells whether a URL contains one of the listed licensed video-site domains.
 *
 * The pattern is a regex literal so the dots are matched literally. The former
 * `new RegExp('qq\.com|...')` lost its backslashes inside the string literal,
 * which made every "." match any character (e.g. "qq-com" was accepted).
 *
 * @param vipUrl URL to inspect
 * @returns {boolean} true when the URL contains one of the listed domains
 */
function 是否正版(vipUrl){
    const flag = /qq\.com|iqiyi\.com|youku\.com|mgtv\.com|bilibili\.com|sohu\.com|ixigua\.com|pptv\.com|miguvideo\.com|le\.com|1905\.com|fun\.tv/;
    return flag.test(vipUrl);
}
|
||
/**
 * Normalizes a play URL: URLs recognised by 是否正版 have their "#fragment" and
 * "?query" removed, except miguvideo URLs, which are kept whole. All other
 * URLs are returned unchanged; a falsy input yields ''.
 *
 * @param vipUrl URL to normalize
 * @returns {string}
 */
function urlDeal(vipUrl) {
    if (!vipUrl) {
        return '';
    }
    const keepAsIs = !是否正版(vipUrl) || /miguvideo/.test(vipUrl);
    if (keepAsIs) {
        return vipUrl;
    }
    const withoutFragment = vipUrl.split('#')[0];
    return withoutFragment.split('?')[0];
}
|
||
/**
 * Converts a list of scraped items ({url, title, desc, content, pic_url|img, ...})
 * into vod records, stores the list in the shared VODS variable and returns it.
 * Optional fields (tname, tid, year, actor, director, area) are copied only
 * when the key is present on the item. A non-array input yields [] and leaves
 * VODS untouched.
 *
 * @param d array of scraped items
 * @returns {Array} the new VODS list
 */
function setResult(d) {
    if (!Array.isArray(d)) {
        return [];
    }
    // [source key on the item, target key on the vod record], in output order.
    const optionalFields = [
        ['tname', 'type_name'],
        ['tid', 'type_id'],
        ['year', 'vod_year'],
        ['actor', 'vod_actor'],
        ['director', 'vod_director'],
        ['area', 'vod_area'],
    ];
    VODS = [];
    d.forEach(function (it) {
        const record = {
            vod_id: it.url || '',
            vod_name: it.title || '',
            vod_remarks: it.desc || '',
            vod_content: it.content || '',
            vod_pic: it.pic_url || it.img || '',
        };
        const present = Object.keys(it);
        optionalFields.forEach(function (pair) {
            if (present.includes(pair[0])) {
                record[pair[1]] = it[pair[0]] || '';
            }
        });
        VODS.push(record);
    });
    return VODS;
}
|
||
/**
 * Stores `res.list` (or [] when it is missing/falsy) in the shared VODS
 * variable and returns it.
 *
 * @param res object carrying a `list` property
 * @returns {Array}
 */
function setResult2(res) {
    const list = res.list || [];
    VODS = list;
    return list;
}
|
||
/**
 * Home-page variant of setResult: feeds `res.list` to setResult.
 * Anything that is not a non-null object yields [].
 *
 * @param res object carrying a `list` array
 * @returns {Array}
 */
function setHomeResult(res) {
    const usable = res && typeof res === 'object';
    return usable ? setResult(res.list) : [];
}
|
||
/**
 * Returns a built-in helper module by file name.
 *
 * Only 'maomi_aes.js' is known: it yields {De, En}, an AES-CBC/PKCS7
 * decrypt/encrypt pair using a fixed key and IV. `De` takes hex ciphertext
 * and returns UTF-8 text; `En` returns hex ciphertext. Any other name yields {}.
 *
 * @param js helper file name
 * @returns {Object}
 */
function rc(js) {
    if (js !== 'maomi_aes.js') {
        return {};
    }
    var a = CryptoJS.enc.Utf8.parse("625222f9149e961d");
    var t = CryptoJS.enc.Utf8.parse("5efdtf6060e2o330");
    // Cipher options shared by both directions (a fresh object per call).
    var cipherOptions = function () {
        return {
            iv: t,
            mode: CryptoJS.mode.CBC,
            padding: CryptoJS.pad.Pkcs7
        };
    };
    return {
        De: function (word) {
            // Hex input is re-encoded as Base64 before being handed to decrypt.
            var hexWords = CryptoJS.enc.Hex.parse(word);
            var base64Text = CryptoJS.enc.Base64.stringify(hexWords);
            return CryptoJS.AES.decrypt(base64Text, a, cipherOptions()).toString(CryptoJS.enc.Utf8);
        },
        En: function (word) {
            var encrypted = CryptoJS.AES.encrypt(word, a, cipherOptions());
            return encrypted.ciphertext.toString();
        }
    };
}
|
||
|
||
// Never use for...in here; prefer forEach (for...in can disturb ordering).
/**
 * Resolves the real play URL from a parser page.
 *
 * Fetches `jxurl` (with `ref` as Referer when given), follows one "&btwaf="
 * challenge if present, reads the `_token` value as AES IV, evaluates the
 * page's `var config = {...}` snippet and, when `config.url` does not start
 * with "http", AES-decrypts it. Any failure yields ''.
 *
 * NOTE(review): the result depends on `config`, declared by the eval'd
 * snippet, being visible in this function scope — confirm the host evaluates
 * this file in a mode where eval'd `var` declarations leak out.
 *
 * @param jxurl parser page URL
 * @param ref   optional Referer
 * @param key   optional AES key text; defaults to 'dvyYRQlnPRCMdQSe'
 * @returns {string} resolved URL, or '' on error
 */
function maoss(jxurl, ref, key) {
    fetch_params = JSON.parse(JSON.stringify(rule_fetch_params));
    eval(getCryptoJS());
    try {
        // Unused in this function; kept because eval'd code can reach it.
        var getVideoInfo = function (text) {
            return CryptoJS.AES.decrypt(text, key, {iv: iv, padding: CryptoJS.pad.Pkcs7}).toString(CryptoJS.enc.Utf8);
        };
        var token_key = key == undefined ? 'dvyYRQlnPRCMdQSe' : key;
        var html = ref ? request(jxurl, {headers: {'Referer': ref}}) : request(jxurl);
        if (html.indexOf('&btwaf=') > -1) {
            // Anti-bot challenge: retry once with the btwaf token appended.
            html = request(jxurl + '&btwaf' + html.match(/&btwaf(.*?)"/)[1], {
                headers: {'Referer': ref}
            });
        }
        var token_iv = html.split('_token = "')[1].split('"')[0];
        // From here on `key` holds the parsed key words, not the key text.
        var key = CryptoJS.enc.Utf8.parse(token_key);
        var iv = CryptoJS.enc.Utf8.parse(token_iv);
        eval(html.match(/var config = {[\s\S]*?}/)[0] + '');
        if (!config.url.startsWith('http')) {
            config.url = CryptoJS.AES.decrypt(config.url, key, {
                iv: iv,
                padding: CryptoJS.pad.Pkcs7
            }).toString(CryptoJS.enc.Utf8);
        }
        return config.url;
    } catch (e) {
        return '';
    }
}
|
||
|
||
/**
 * Form-style URL encoding: encodeURIComponent, plus percent-encoding of
 * ! ' ( ) * and "+" in place of "%20".
 *
 * @param str value to encode (coerced to string)
 * @returns {string}
 */
function urlencode (str) {
    const text = (str + '').toString();
    // Characters that encodeURIComponent leaves untouched.
    const extraEscapes = {'!': '%21', "'": '%27', '(': '%28', ')': '%29', '*': '%2A'};
    return encodeURIComponent(text)
        .replace(/[!'()*]/g, (ch) => extraEscapes[ch])
        .replace(/%20/g, '+');
}
|
||
|
||
/**
 * Base64-encodes a UTF-8 string using CryptoJS.
 *
 * @param text plain text
 * @returns {string} Base64 text
 */
function base64Encode(text) {
    const utf8Words = CryptoJS.enc.Utf8.parse(text);
    return CryptoJS.enc.Base64.stringify(utf8Words);
}
|
||
|
||
/**
 * Decodes Base64 text into a UTF-8 string using CryptoJS.
 *
 * @param text Base64 text
 * @returns {string} decoded text
 */
function base64Decode(text) {
    const rawWords = CryptoJS.enc.Base64.parse(text);
    return CryptoJS.enc.Utf8.stringify(rawWords);
}
|
||
|
||
/**
 * Returns the string form of CryptoJS.MD5(text).
 *
 * @param text input text
 * @returns {string}
 */
function md5(text) {
    const digest = CryptoJS.MD5(text);
    return digest.toString();
}
|
||
|
||
/**
 * Encodes a string with the given charset.
 * Only encodings whose name starts with "gb" are handled (via gbkTool); any
 * other encoding returns the input unchanged.
 *
 * @param input    text to encode
 * @param encoding charset name, defaults to 'gbk'
 * @returns {*} encoded text, or the input as-is
 */
function encodeStr(input, encoding) {
    const charset = encoding || 'gbk';
    if (!charset.startsWith('gb')) {
        return input;
    }
    return gbkTool().encode(input);
}
|
||
|
||
/**
 * Decodes a string from the given charset.
 * Only encodings whose name starts with "gb" are handled (via gbkTool); any
 * other encoding returns the input unchanged.
 *
 * @param input    text to decode
 * @param encoding charset name, defaults to 'gbk'
 * @returns {*} decoded text, or the input as-is
 */
function decodeStr(input, encoding) {
    const charset = encoding || 'gbk';
    if (!charset.startsWith('gb')) {
        return input;
    }
    return gbkTool().decode(input);
}
|
||
|
||
/**
 * Compatibility stub for rules that call `eval(getCryptoJS())`.
 * It only returns a snippet that logs a "loaded" message; the remote download
 * of crypto-hiker.js is disabled.
 *
 * @returns {string} JavaScript source to evaluate
 */
function getCryptoJS() {
    // return request('https://ghproxy.net/https://raw.githubusercontent.com/hjdhnx/dr_py/main/libs/crypto-hiker.js');
    const loadedNotice = 'console.log("CryptoJS已装载");';
    return loadedNotice;
}
|
||
|
||
/**
 * Forces ascending order on an episode-like list.
 *
 * Looks at two neighbouring entries around the middle of the list, extracts
 * the first run of digits from each, and reverses the list IN PLACE when the
 * earlier entry carries the larger number. Lists with fewer than two
 * comparable entries are returned untouched.
 *
 * @param lists  list to normalize (mutated when reversed)
 * @param key    optional property name to read from each sampled entry
 * @param option optional function applied to each sampled value
 * @returns {*} the same list instance
 */
function forceOrder(lists, key, option) {
    const midIndex = Math.floor(lists.length / 2);
    const nextIndex = Math.min(lists.length - 1, midIndex + 1);
    if (midIndex >= nextIndex) {
        return lists;
    }
    let earlier = lists[midIndex];
    let later = lists[nextIndex];
    if (key) {
        // Best effort: a failing property read leaves the samples as they are.
        try {
            earlier = earlier[key];
            later = later[key];
        } catch (e) {}
    }
    if (option && typeof option === 'function') {
        try {
            earlier = option(earlier);
            later = option(later);
        } catch (e) {}
    }
    const earlierDigits = (earlier + '').match(/(\d+)/);
    const laterDigits = (later + '').match(/(\d+)/);
    if (earlierDigits && laterDigits && Number(earlierDigits[1]) > Number(laterDigits[1])) {
        lists.reverse();
    }
    return lists;
}
|
||
|
||
// Result holders that rule scripts fill in.
let VODS = [];  // list data for category (level-1) pages and search
let VOD = {};   // the single record of a detail (level-2) page
let TABS = [];  // custom line names of a detail page, e.g. TABS=['道长在线','道长在线2']
let LISTS = []; // custom episode lists per line, e.g. LISTS=[['第1集$http://1.mp4','第2集$http://2.mp4'],['第3集$http://1.mp4','第4集$http://2.mp4']]

// Expose the URL encoder globally under both names.
globalThis.encodeUrl = urlencode;
globalThis.urlencode = urlencode;
|
||
|
||
|
||
|
||
/**
 * Joins a (possibly relative) URL onto a base URL by delegating to joinUrl.
 * Falsy arguments are replaced with '' before the call.
 *
 * @param fromPath URL of the current page (base)
 * @param nowPath  URL relative to the current page
 * @returns {*} whatever joinUrl returns
 */
function urljoin(fromPath, nowPath) {
    const base = fromPath || '';
    const relative = nowPath || '';
    return joinUrl(base, relative);
}

// Alias kept for rules that call urljoin2.
var urljoin2 = urljoin;
|
||
|
||
// Built-in pdfh / pdfa / pd, captured before the wrappers below reuse the names' roles.
const defaultParser = {pdfh, pdfa, pd};
|
||
|
||
|
||
/**
 * Enhanced pdfh: can also pull the image link out of a style attribute.
 *
 * A non-string `html` is first converted to text through `html.rr(html.ele)`.
 * When the last segment of the expression mentions "style" and the result
 * contains "url(", the text inside the first url(...) is returned.
 *
 * @param html  source text, or an element wrapper exposing rr/ele
 * @param parse parse expression
 * @returns {string|*}
 */
function pdfh2(html, parse) {
    let source = html;
    if (typeof html !== 'string') {
        try {
            source = html.rr(html.ele).toString();
        } catch (e) {
            print('html对象转文本发生了错误:' + e.message);
        }
    }
    let result = defaultParser.pdfh(source, parse);
    // The option is whatever follows the last "&&" (or the last space when there is no "&&").
    const separator = parse.includes('&&') ? '&&' : ' ';
    const option = parse.split(separator).slice(-1)[0];
    const wantsStyleUrl = /style/.test(option.toLowerCase()) && /url\(/.test(result);
    if (wantsStyleUrl) {
        try {
            result = result.match(/url\((.*?)\)/)[1];
        } catch (e) {}
    }
    return result;
}
|
||
|
||
/**
 * Enhanced pdfa: accepts jq-style element wrappers as well as text.
 * A non-string `html` is converted to text through `html.rr(html.ele)` before
 * the built-in pdfa is called; a failed conversion is logged and the original
 * value is passed on.
 *
 * @param html  source text, or an element wrapper exposing rr/ele
 * @param parse parse expression
 * @returns {*} result of the built-in pdfa
 */
function pdfa2(html, parse) {
    let source = html;
    if (typeof html !== 'string') {
        try {
            source = html.rr(html.ele).toString();
        } catch (e) {
            print('html对象转文本发生了错误:' + e.message);
        }
    }
    return defaultParser.pdfa(source, parse);
}
|
||
|
||
/**
 * Enhanced pd: pdfh2 plus automatic URL joining.
 *
 * When the expression ends in a link-like attribute (DOM_CHECK_ATTR), a value
 * containing "http" is cut down to start at that "http"; otherwise it is
 * joined onto MY_URL.
 *
 * @param html  source text or element wrapper
 * @param parse parse expression
 * @param uri   accepted for interface compatibility; the join base is MY_URL
 * @returns {*}
 */
function pd2(html, parse, uri) {
    const value = pdfh2(html, parse);
    if (!uri) {
        uri = '';
    }
    if (!DOM_CHECK_ATTR.test(parse)) {
        return value;
    }
    if (/http/.test(value)) {
        return value.slice(value.indexOf('http'));
    }
    return urljoin(MY_URL, value);
}
|
||
|
||
/**
 * Parser families selectable through a rule's expression prefix:
 *   jsp  - the enhanced wrappers pdfh2 / pdfa2 / pd2
 *   json - JSONPath lookups via cheerio.jp
 *   jq   - the built-in pdfh / pdfa / pd behind blank-input guards
 * getParse picks the family for an expression.
 */
const parseTags = {
    jsp: {
        pdfh: pdfh2,
        pdfa: pdfa2,
        pd: pd2,
    },
    json: {
        /**
         * First truthy JSONPath hit as a string, trying "||"-separated
         * alternatives in order; '' when nothing matches.
         */
        pdfh(html, parse) {
            if (!parse || !parse.trim()) {
                return '';
            }
            // Text input is parsed as JSON first.
            const doc = typeof html === 'string' ? JSON.parse(html) : html;
            let expr = parse.trim();
            if (!expr.startsWith('$.')) {
                expr = '$.' + expr;
            }
            for (const candidate of expr.split('||')) {
                const found = cheerio.jp(candidate, doc);
                let value = (Array.isArray(found) ? found[0] : found) || '';
                if (value && typeof value !== 'string') {
                    value = value.toString();
                }
                if (value) {
                    return value;
                }
            }
            return '';
        },
        /**
         * JSONPath list lookup. A result that is a single nested array is
         * unwrapped; a blank expression yields ''.
         */
        pdfa(html, parse) {
            if (!parse || !parse.trim()) {
                return '';
            }
            const doc = typeof html === 'string' ? JSON.parse(html) : html;
            let expr = parse.trim();
            if (!expr.startsWith('$.')) {
                expr = '$.' + expr;
            }
            const found = cheerio.jp(expr, doc);
            const isWrappedList = Array.isArray(found) && Array.isArray(found[0]) && found.length === 1;
            if (isWrappedList) {
                return found[0] || [];
            }
            return found || [];
        },
        /** pdfh whose non-empty result is joined onto MY_URL. */
        pd(html, parse) {
            const value = parseTags.json.pdfh(html, parse);
            return value ? urljoin(MY_URL, value) : value;
        },
    },
    jq: {
        /** Built-in pdfh; '' for blank html or expression. */
        pdfh(html, parse) {
            if (!html || !parse || !parse.trim()) {
                return '';
            }
            return defaultParser.pdfh(html, parse.trim());
        },
        /** Built-in pdfa; [] for blank html or expression. Logs the match count. */
        pdfa(html, parse) {
            if (!html || !parse || !parse.trim()) {
                return [];
            }
            parse = parse.trim();
            const result = defaultParser.pdfa(html, parse);
            print(`pdfa解析${parse}=>${result.length}`);
            return result;
        },
        /** Built-in pd; the base URL defaults to MY_URL. */
        pd(html, parse, base_url) {
            if (!html || !parse || !parse.trim()) {
                return '';
            }
            return defaultParser.pd(html, parse.trim(), base_url || MY_URL);
        },
    },
    /**
     * Picks the parser family from the expression prefix ("jsp:" / "json:");
     * "jq:" and everything else map to jq.
     */
    getParse(p0) {
        if (p0.startsWith('jsp:')) {
            return this.jsp;
        }
        if (p0.startsWith('json:')) {
            return this.json;
        }
        return this.jq;
    }
};
|
||
|
||
// Short aliases made available to rule scripts.
const stringify = JSON.stringify;
const {jsp, jq} = parseTags;
|
||
|
||
/*** 后台需要实现的java方法并注入到js中 ***/
|
||
|
||
/**
 * Reads up to the first 1024 bytes of a local file (relative to the
 * application directory) and returns them as text, one character per byte.
 *
 * Compared with the previous version, only the bytes actually read are
 * decoded (the unused tail of the buffer used to come back as NUL
 * characters), and the descriptor is closed afterwards.
 *
 * NOTE(review): relies on a QuickJS-style `os` object (open/read/close) being
 * in scope — confirm that the host provides it.
 *
 * @param filePath path of the file, defaults to './uri.min.js'
 * @returns {string} file content ('' when nothing could be read)
 */
function readFile(filePath){
    filePath = filePath||'./uri.min.js';
    var fd = os.open(filePath);
    try {
        var buffer = new ArrayBuffer(1024);
        var len = os.read(fd, buffer, 0, 1024);
        console.log(len);
        // A negative or zero result means error/EOF: decode nothing.
        var byteCount = len > 0 ? len : 0;
        let text = String.fromCharCode.apply(null, new Uint8Array(buffer, 0, byteCount));
        console.log(text);
        return text
    } finally {
        // Release the descriptor when one was obtained and close is available.
        if (typeof fd === 'number' && fd >= 0 && typeof os.close === 'function') {
            os.close(fd);
        }
    }
}
|
||
|
||
/**
 * Turns a response body into parsed JSON when possible.
 *
 * Text not already wrapped in {...} or [...] (for example a JSONP payload) is
 * reduced to its outermost {...} part first. If parsing fails, the (possibly
 * trimmed/reduced) text is returned instead.
 *
 * @param html response text
 * @returns {*} parsed value, or the text when it is not valid JSON
 */
function dealJson(html) {
    try {
        html = html.trim();
        const looksLikeObject = html.startsWith('{') && html.endsWith('}');
        const looksLikeArray = html.startsWith('[') && html.endsWith(']');
        if (!looksLikeObject && !looksLikeArray) {
            // Keep only what sits between the first "{" and the last "}" of a line.
            html = '{' + html.match(/.*?\{(.*)\}/m)[1] + '}';
        }
    } catch (e) {
    }
    try {
        return JSON.parse(html);
    } catch (e) {
        return html;
    }
}
|
||
|
||
/**
 * Captcha recognition client.
 *
 * `classification(img)` POSTs the image payload to OCR_API and returns the
 * response text as the recognised code; on any error it logs the problem and
 * returns ''.
 * @type {{api: string, classification: (function(*=): string)}}
 */
var OcrApi = {
    api: OCR_API,
    classification: function (img) {
        try {
            log('通过drpy_ocr验证码接口过验证...');
            const options = {
                data: {img: img},
                headers: {'User-Agent': PC_UA},
                'method': 'POST'
            };
            // Third argument marks the call as an OCR request (see request()).
            const reply = request(OCR_API, options, true);
            return reply || '';
        } catch (e) {
            log(`OCR识别验证码发生错误:${e.message}`);
            return '';
        }
    }
};
|
||
/**
 * Solves a site's search captcha and returns the cookie bound to it.
 *
 * Up to OCR_RETRY attempts: download the captcha image (Base64, with response
 * headers), remember the first Set-Cookie value, have OcrApi read the image,
 * then submit the code. Returns the cookie as soon as the site answers
 * msg === 'ok'; returns '' when the final attempt fails.
 *
 * @param url any URL of the target site (only its home part is used)
 * @returns {string} cookie of the verified session, or ''
 */
function verifyCode(url) {
    const host = getHome(url);
    let cookie = '';
    for (let cnt = 0; cnt < OCR_RETRY; cnt += 1) {
        const attempt = cnt + 1;
        try {
            const yzm_url = `${host}/index.php/verify/index.html`;
            console.log(`验证码链接:${yzm_url}`);
            const json = JSON.parse(request(yzm_url, {withHeaders: true, toBase64: true}, true));
            if (!cookie) {
                // The header name's casing varies, so look it up case-insensitively.
                const setCk = Object.keys(json).find((name) => name.toLowerCase() === 'set-cookie');
                cookie = setCk ? json[setCk].split(';')[0] : '';
            }
            console.log('cookie:' + cookie);
            const code = OcrApi.classification(json.body);
            console.log(`第${attempt}次验证码识别结果:${code}`);
            const submit_url = `${host}/index.php/ajax/verify_check?type=search&verify=${code}`;
            console.log(submit_url);
            const answer = JSON.parse(request(submit_url, {
                headers: {Cookie: cookie, 'User-Agent': MOBILE_UA},
                'method': 'POST'
            }));
            if (answer.msg === 'ok') {
                console.log(`第${attempt}次验证码提交成功`);
                return cookie;
            }
            if (attempt >= OCR_RETRY) {
                // Out of attempts: do not hand back an unverified cookie.
                cookie = '';
            }
        } catch (e) {
            console.log(`第${attempt}次验证码提交失败:${e.message}`);
            if (attempt >= OCR_RETRY) {
                cookie = '';
            }
        }
    }
    return cookie;
}
|
||
|
||
/**
 * Stores a value for the current rule through the host's `local` store
 * (namespaced by RKEY) and logs the assignment.
 *
 * @param k key
 * @param v value
 */
function setItem(k, v) {
    local.set(RKEY, k, v);
    const message = `规则${RKEY}设置${k} => ${v}`;
    console.log(message);
}
|
||
|
||
/**
 * Reads a value of the current rule from the host's `local` store
 * (namespaced by RKEY). A falsy stored value yields the fallback `v`.
 *
 * @param k key
 * @param v fallback value
 * @returns {*}
 */
function getItem(k, v) {
    const stored = local.get(RKEY, k);
    return stored || v;
}
|
||
|
||
/**
 * Deletes the entry stored under `k` for the current rule (namespaced by
 * RKEY) from the host's `local` store.
 *
 * @param k key to remove
 */
function clearItem(k) {
    const namespace = RKEY;
    local.delete(namespace, k);
}
|
||
|
||
/*** js自封装的方法 ***/
|
||
|
||
/**
 * Extracts the site root (scheme + "//" + host) from a full URL and
 * URI-decodes it when possible. A falsy input yields ''.
 *
 * @param url any complete URL containing "//"
 * @returns {string}
 */
function getHome(url) {
    if (!url) {
        return '';
    }
    const [scheme, afterSlashes] = url.split('//');
    let home = scheme + '//' + afterSlashes.split('/')[0];
    try {
        home = decodeURIComponent(home);
    } catch (e) {
        // Malformed escapes: keep the undecoded form.
    }
    return home;
}
|
||
|
||
/**
 * Appends query parameters to a URL, similar to Python's `params` dict.
 * A "?" is added when the URL has none; keys and values are concatenated
 * as-is (no encoding is applied).
 *
 * @param url base URL
 * @param obj parameter map
 * @returns {*} URL with the parameters appended
 */
function buildUrl(url, obj) {
    const params = obj || {};
    const names = Object.keys(params);
    const query = names.map((name) => name + '=' + params[name]).join('&');
    let target = url.indexOf('?') < 0 ? url + '?' : url;
    // An existing query needs "&" before the new pairs.
    if (names.length > 0 && !target.endsWith('?')) {
        target += '&';
    }
    return target + query;
}
|
||
|
||
/**
|
||
* 远程依赖执行函数
|
||
* @param url 远程js地址
|
||
*/
|
||
function require(url){
|
||
eval(request(url));
|
||
}
|
||
/**
 * Full wrapper around the host's `req` HTTP call.
 *
 * Without `obj`, the shared `fetch_params` are used (created from
 * MOBILE_UA + rule.headers when missing). With `obj`, missing User-Agent and
 * Referer headers are filled in on the caller's object. The object handed to
 * `req` is mutated in place, as before.
 *
 * Fixes over the previous version:
 *  - a string body no longer gets "charset=undefined" in its Content-Type
 *    when rule.encoding is not set;
 *  - `withHeaders` no longer throws when the response carries no headers;
 *  - an existing Content-Type header is detected regardless of letter case;
 *  - the always-false `obj==={}` comparison is gone (no behavior change).
 *
 * @param url      request URL; a falsy URL returns '' ('{}' with withHeaders)
 * @param obj      request options {headers:{},method:'',timeout:5000,body:'',withHeaders:false,toBase64:false}
 * @param ocr_flag marks an OCR request: the rule's charset is then not forced into Content-Type
 * @returns {string} response body, or a JSON string of headers plus `body` when withHeaders is set
 */
function request(url,obj,ocr_flag){
    ocr_flag = ocr_flag||false;
    // Case-insensitive check for an existing Content-Type header.
    const hasContentType = (headers) => Object.keys(headers).some(name => name.toLowerCase() === 'content-type');
    if(!obj){
        if(!fetch_params||!fetch_params.headers){
            let headers = {
                'User-Agent':MOBILE_UA,
            };
            if(rule.headers){
                Object.assign(headers,rule.headers);
            }
            if(!fetch_params){
                fetch_params = {};
            }
            fetch_params.headers = headers;
        }
        if(!fetch_params.headers.Referer){
            fetch_params.headers.Referer = getHome(url)
        }
        obj = fetch_params;
    }else{
        let headers = obj.headers||{};
        let keys = Object.keys(headers).map(it=>it.toLowerCase());
        if(!keys.includes('user-agent')){
            headers['User-Agent'] = MOBILE_UA;
        }
        if(!keys.includes('referer')){
            headers['Referer'] = getHome(url);
        }
        obj.headers = headers;
    }
    if(rule.encoding&&rule.encoding!=='utf-8'&&!ocr_flag){
        if(!hasContentType(obj.headers)){ // an explicitly supplied header wins
            obj.headers["Content-Type"] = 'text/html; charset='+rule.encoding;
        }
    }
    if(obj.body&&typeof(obj.body)==='string'){
        // A string body is posted as a form unless the caller set a Content-Type.
        if(!hasContentType(obj.headers)){
            // Only mention a charset when the rule actually defines one.
            const charset = rule.encoding ? '; charset='+rule.encoding : '';
            obj.headers["Content-Type"] = 'application/x-www-form-urlencoded'+charset;
        }
    }else if(obj.body&&typeof(obj.body)==='object'){
        // Object bodies travel in `data`.
        obj.data = obj.body;
        delete obj.body
    }
    if(!url){
        return obj.withHeaders?'{}':''
    }
    if(obj.toBase64){ // ask for a Base64 body, used for images
        obj.buffer = 2;
        delete obj.toBase64
    }
    console.log(JSON.stringify(obj.headers));
    console.log('request:'+url+`|method:${obj.method||'GET'}|body:${obj.body||''}`);
    let res = req(url, obj)||{};
    let html = res.content||'';
    if(obj.withHeaders){
        // Response headers with the body attached under "body".
        let htmlWithHeaders = res.headers||{};
        htmlWithHeaders.body = html;
        return JSON.stringify(htmlWithHeaders);
    }else{
        return html
    }
}
|
||
|
||
/**
 * Shortcut for a POST request.
 *
 * Sets `method` to 'POST' on the given options object (the caller's object is
 * modified, as before) and delegates to request(). The options may now be
 * omitted; previously `post(url)` threw a TypeError.
 *
 * @param url request URL
 * @param obj request options, optional
 * @returns {string|DocumentFragment|*} whatever request() returns
 */
function post(url,obj){
    obj = obj||{};
    obj.method = 'POST';
    return request(url,obj);
}
|
||
|
||
// `fetch` is an alias of request for rule scripts.
fetch = request;

/**
 * Console logger used by rules.
 * Falsy values print as ''. Objects with at least one key are printed as
 * JSON (if serialization fails, "<type>:<length>" is printed instead);
 * objects without keys print "null object"; everything else prints as-is.
 */
print = function (data) {
    data = data || '';
    if (typeof data != 'object') {
        console.log(data);
        return;
    }
    if (Object.keys(data).length < 1) {
        console.log('null object');
        return;
    }
    try {
        data = JSON.stringify(data);
        console.log(data);
    } catch (e) {
        // e.g. circular structures
        console.log(typeof(data) + ':' + data.length);
    }
}

// `log` is an alias of print.
log = print;
|
||
/**
 * Detects a "?btwaf=" challenge in a fetched page and, when present,
 * refetches the URL (fragment removed) with the btwaf token appended.
 *
 * @param html previously fetched page text
 * @param url  URL the page came from
 * @param obj  request options used for the refetch
 * @returns {string|DocumentFragment|*} the original text, or the refetched page
 */
function checkHtml(html, url, obj) {
    if (!/\?btwaf=/.test(html)) {
        return html;
    }
    // Everything after "btwaf" up to the closing quote, e.g. "=12345".
    const btwaf = html.match(/btwaf(.*?)"/)[1];
    const retryUrl = url.split('#')[0] + '?btwaf' + btwaf;
    print('宝塔验证访问链接:' + retryUrl);
    return request(retryUrl, obj);
}
|
||
|
||
/**
 * Fetches a page and passes the result through checkHtml once, so a btwaf
 * challenge is followed a single time.
 *
 * @param url request URL
 * @param obj request options
 * @returns {string|DocumentFragment}
 */
function getCode(url, obj) {
    const firstAnswer = request(url, obj);
    return checkHtml(firstAnswer, url, obj);
}
|
||
|
||
/**
 * Request helper for rules: uses rule.headers and injects the stored
 * verification cookie (getItem(RULE_CK)) when one exists.
 *
 * The cookie is written to the "Cookie" header when the headers have no
 * cookie at all, or when an existing "cookie"/"Cookie" value differs from the
 * stored one. rule.headers is used by reference, so the update is visible on
 * the rule as well.
 *
 * @param url request URL
 * @returns {string|DocumentFragment}
 */
function getHtml(url) {
    const obj = {};
    if (rule.headers) {
        obj.headers = rule.headers;
    }
    const cookie = getItem(RULE_CK, '');
    if (cookie) {
        const headers = obj.headers;
        if (!headers) {
            obj.headers = {Cookie: cookie};
            log('历史无headers,更新过验证后的含cookie的headers');
        } else if (!Object.keys(headers).map((name) => name.toLowerCase()).includes('cookie')) {
            log('历史无cookie,新增过验证后的cookie');
            headers['Cookie'] = cookie;
        } else if (headers.cookie && headers.cookie !== cookie) {
            headers['Cookie'] = cookie;
            log('历史有小写过期的cookie,更新过验证后的cookie');
        } else if (headers.Cookie && headers.Cookie !== cookie) {
            headers['Cookie'] = cookie;
            log('历史有大写过期的cookie,更新过验证后的cookie');
        }
    }
    return getCode(url, obj);
}
|
||
|
||
/**
 * Builds the home-page category list.
 *
 * Categories come from two sources, in this order:
 *  1. static `class_name` / `class_url` ("&"-separated, paired by position);
 *  2. `class_parse` ("list;name;url[;regex]"), evaluated against the page at
 *     homeObj.MY_URL with the parser family chosen from the first segment.
 * Names matching `cate_exclude` are dropped. The fetched page is kept in
 * homeHtmlCache for later reuse.
 *
 * @param homeObj home-page arguments (class_name, class_url, class_parse, cate_exclude, filter, MY_URL)
 * @returns {string} JSON string {class: [...], filters?: ...}
 */
function homeParse(homeObj) {
    fetch_params = JSON.parse(JSON.stringify(rule_fetch_params));
    let classes = [];

    // 1. Static categories.
    if (homeObj.class_name && homeObj.class_url) {
        const names = homeObj.class_name.split('&');
        const urls = homeObj.class_url.split('&');
        const pairCount = Math.min(names.length, urls.length);
        for (let idx = 0; idx < pairCount; idx++) {
            classes.push({'type_id': urls[idx], 'type_name': names[idx]});
        }
    }

    // 2. Categories scraped from the home page.
    if (homeObj.class_parse) {
        const p = homeObj.class_parse.split(';');
        const _ps = parseTags.getParse(p[0]);
        _pdfa = _ps.pdfa;
        _pdfh = _ps.pdfh;
        _pd = _ps.pd;
        MY_URL = rule.url;
        if (p.length >= 3) { // the trailing regex segment is optional
            try {
                const html = getHtml(homeObj.MY_URL);
                if (html) {
                    homeHtmlCache = html;
                    const list = _pdfa(html, p[0]);
                    if (list && list.length > 0) {
                        list.forEach((it, idex) => {
                            try {
                                const name = _pdfh(it, p[1]);
                                if (homeObj.cate_exclude && (new RegExp(homeObj.cate_exclude).test(name))) {
                                    return;
                                }
                                let url = _pd(it, p[2]);
                                if (p.length > 3 && p[3]) {
                                    // Keep only the first capture group of the id pattern.
                                    url = url.match(new RegExp(p[3]))[1];
                                }
                                classes.push({'type_id': url.trim(), 'type_name': name.trim()});
                            } catch (e) {
                                console.log(`分类列表定位第${idex}个元素正常报错:${e.message}`);
                            }
                        });
                    }
                }
            } catch (e) {
                console.log(e.message);
            }
        }
    }

    // Drop excluded categories (also applies to the static ones).
    classes = classes.filter((it) => {
        if (!homeObj.cate_exclude) {
            return true;
        }
        return !(new RegExp(homeObj.cate_exclude).test(it.type_name));
    });

    const resp = {'class': classes};
    if (homeObj.filter) {
        resp.filters = homeObj.filter;
    }
    const payload = JSON.stringify(resp);
    console.log(payload);
    return payload;
}
|
||
|
||
/**
 * Resolves one field of a recommend/search expression, inheriting from the
 * level-1 expression when the field is "*".
 *
 * @param p   recommend/search expression split on ";"
 * @param pn  index of the field in `p`
 * @param pp  level-1 expression split on ";"
 * @param ppn index of the inherited field in `pp`
 * @returns {*} pp[ppn] when p[pn] is "*" and pp is long enough, else p[pn]; '' on error
 */
function getPP(p, pn, pp, ppn) {
    try {
        const inherits = p[pn] === '*' && pp.length > ppn;
        if (inherits) {
            return pp[ppn];
        }
        return p[pn];
    } catch (e) {
        return '';
    }
}
|
||
|
||
/**
 * Parse the home-page recommendation list.
 *
 * homeVodObj.推荐 is either 'js:...' code (evaluated; it must leave its result
 * in the global VODS) or a ';'-separated selector rule. A segment written as
 * '*' is inherited from the matching segment of rule.一级 (see getPP).
 *
 * NOTE: the 'js:' branch runs rule-supplied code through eval. Local names in
 * this function (input, TYPE, d, p, ...) are visible to that code, so they
 * must not be renamed.
 *
 * @param homeVodObj {推荐, double, homeUrl, detailUrl}
 * @returns {string} JSON string {"list": [...]} or '{}' when no usable rule exists
 */
function homeVodParse(homeVodObj){
    fetch_params = JSON.parse(JSON.stringify(rule_fetch_params));
    let d = [];
    MY_URL = homeVodObj.homeUrl;
    console.log(MY_URL);
    let t1 = (new Date()).getTime();
    let p = homeVodObj.推荐;
    print('p:'+p);
    if(p==='*' && rule.一级){
        // '*' reuses the category-list rule, which is parsed in single-level mode.
        p = rule.一级;
        homeVodObj.double = false;
    }
    if(!p||typeof(p)!=='string'){
        return '{}'
    }
    p = p.trim();
    // rule.一级 may be missing when only 推荐 is configured; inherit nothing then
    // instead of throwing on undefined.split.
    let pp = typeof(rule.一级)==='string' ? rule.一级.split(';') : [];
    if(p.startsWith('js:')){
        const TYPE = 'home';
        var input = MY_URL;
        HOST = rule.host;
        eval(p.replace('js:',''));
        d = VODS;
    }else {
        p = p.split(';');
        // Single-level rules need 5 segments, two-level rules need 6.
        if (!homeVodObj.double && p.length < 5) {
            return '{}'
        } else if (homeVodObj.double && p.length < 6) {
            return '{}'
        }
        let p0 = getPP(p,0,pp,0)
        let _ps = parseTags.getParse(p0);
        _pdfa = _ps.pdfa;
        _pdfh = _ps.pdfh;
        _pd = _ps.pd;
        let is_json = p0.startsWith('json:');
        p0 = p0.replace(/^(jsp:|json:|jq:)/,'');
        // Reuse the page fetched by homeParse when available, then drop the cache.
        let html = homeHtmlCache || getHtml(MY_URL);
        homeHtmlCache = undefined;
        if(is_json){
            html = dealJson(html);
        }
        try {
            console.log('double:' + homeVodObj.double);
            if (homeVodObj.double) {
                // Two-level layout: p0 selects the groups, p1 the items inside each group.
                let items = _pdfa(html, p0);
                let p1 = getPP(p,1,pp,0);
                let p2 = getPP(p,2,pp,1);
                let p3 = getPP(p,3,pp,2);
                let p4 = getPP(p,4,pp,3);
                let p5 = getPP(p,5,pp,4);
                let p6 = getPP(p,6,pp,5);
                for (let item of items) {
                    let items2 = _pdfa(item, p1);
                    for (let item2 of items2) {
                        try {
                            let title = _pdfh(item2, p2);
                            // Picture and remark are optional: failures leave them empty.
                            let img = '';
                            try {
                                img = _pd(item2, p3);
                            } catch (e) {}
                            let desc = '';
                            try {
                                desc = _pdfh(item2, p4);
                            }catch (e) {}
                            let links = [];
                            // Several link selectors may be combined with '+'.
                            for (let _p5 of p5.split('+')) {
                                let link = !homeVodObj.detailUrl ? _pd(item2, _p5, MY_URL) : _pdfh(item2, _p5);
                                links.push(link);
                            }
                            let content;
                            if(p.length > 6 && p[6]){
                                content = _pdfh(item2, p6);
                            } else{
                                content = '';
                            }
                            let vid = links.join('$');
                            if(rule.二级==='*'){
                                // No detail rule: carry title and picture inside the id.
                                vid = vid+'@@'+title+'@@'+img;
                            }
                            let vod = {
                                vod_name: title,
                                vod_pic: img,
                                vod_remarks: desc,
                                vod_content: content,
                                vod_id: vid
                            };
                            d.push(vod);
                        } catch (e) {
                            console.log('首页列表双层定位处理发生错误:'+e.message);
                        }
                    }
                }
            } else {
                let items = _pdfa(html, p0);
                let p1 = getPP(p,1,pp,1);
                let p2 = getPP(p,2,pp,2);
                let p3 = getPP(p,3,pp,3);
                let p4 = getPP(p,4,pp,4);
                let p5 = getPP(p,5,pp,5);
                for (let item of items) {
                    try {
                        let title = _pdfh(item, p1);
                        let img = '';
                        try {
                            img = _pd(item, p2, MY_URL);
                        } catch (e) {}
                        let desc = '';
                        try {
                            desc = _pdfh(item, p3);
                        }catch (e) {}
                        let links = [];
                        for (let _p5 of p4.split('+')) {
                            let link = !homeVodObj.detailUrl ? _pd(item, _p5, MY_URL) : _pdfh(item, _p5);
                            links.push(link);
                        }
                        let content;
                        if(p.length > 5 && p[5]){
                            content = _pdfh(item, p5);
                        }else{
                            content = ''
                        }
                        let vid = links.join('$');
                        if(rule.二级==='*'){
                            vid = vid+'@@'+title+'@@'+img;
                        }
                        let vod = {
                            vod_name: title,
                            vod_pic: img,
                            vod_remarks: desc,
                            vod_content: content,
                            vod_id: vid
                        };
                        d.push(vod);
                    } catch (e) {
                        console.log('首页列表单层定位处理发生错误:'+e.message);
                    }
                }
            }
        } catch (e) {
            // Still best-effort, but no longer silent: report why the list is empty.
            console.log('首页推荐列表解析发生错误:'+e.message);
        }
    }
    let t2 = (new Date()).getTime();
    console.log('加载首页推荐耗时:'+(t2-t1)+'毫秒');
    if(rule.图片来源){
        // Append the configured suffix to absolute picture URLs.
        d.forEach(it=>{
            if(it.vod_pic&&it.vod_pic.startsWith('http')){
                it.vod_pic = it.vod_pic + rule.图片来源;
            }
        });
    }
    if(d.length>0){
        print(d.slice(0,2));
    }
    return JSON.stringify({
        list:d
    })
}
|
||
|
||
/**
 * Parse one page of a category (first-level) listing.
 *
 * Builds the page URL from cateObj.url (placeholders fyclass, fyfilter,
 * fypage; an optional "[first-page-url]" suffix; an optional "(expr)" page
 * arithmetic), fetches it and extracts the items with cateObj.一级, which is
 * either 'js:...' code (result expected in the global VODS) or a
 * ';'-separated selector rule with at least 5 segments.
 *
 * NOTE: rule-supplied code is run through eval; the local names visible to it
 * (cateObj, MY_CATE, MY_FL, MY_PAGE, TYPE, input, desc, d, ...) must stay as they are.
 *
 * @param cateObj {url, 一级, tid, pg, filter, extend}
 * @returns {string} JSON string with page/pagecount/limit/total/list, or '{}'
 */
function categoryParse(cateObj) {
    fetch_params = JSON.parse(JSON.stringify(rule_fetch_params));
    let p = cateObj.一级;
    if(!p||typeof(p)!=='string'){
        return '{}'
    }
    let d = [];
    let url = cateObj.url.replaceAll('fyclass', cateObj.tid);
    // "normal-url[first-page-url]": page 1 uses the bracketed part, later pages the prefix.
    if(cateObj.pg === 1 && url.includes('[')&&url.includes(']')){
        url = url.split('[')[1].split(']')[0];
    }else if(cateObj.pg > 1 && url.includes('[')&&url.includes(']')){
        url = url.split('[')[0];
    }
    if(rule.filter_url){
        if(!/fyfilter/.test(url)){
            if(!url.endsWith('&')&&!rule.filter_url.startsWith('&')){
                url+='&'
            }
            url+=rule.filter_url;
        }else{
            url = url.replace('fyfilter', rule.filter_url);
        }
        // Fall back to an empty selection when filtering is on but no extend was passed,
        // so the template always receives an object.
        let fl = cateObj.filter && cateObj.extend ? cateObj.extend : {};
        // Merge the per-category default filters underneath the user's selection.
        if(rule.filter_def && typeof(rule.filter_def)==='object'){
            try {
                if(Object.keys(rule.filter_def).length>0 && rule.filter_def.hasOwnProperty(cateObj.tid)){
                    let self_fl_def = rule.filter_def[cateObj.tid];
                    if(self_fl_def && typeof(self_fl_def)==='object'){
                        // Copy first so the rule's defaults are never mutated.
                        let fl_def = JSON.parse(JSON.stringify(self_fl_def));
                        fl = Object.assign(fl_def,fl);
                    }
                }
            }catch (e) {
                print('合并不同分类对应的默认筛选出错:'+e.message);
            }
        }
        url = cheerio.jinja2(url,{fl:fl});
    }
    if(/fypage/.test(url)){
        // "(expr)" lets the rule compute the page value, e.g. ((fypage-1)*20).
        // Only treat it as an expression when a real "(...)" group is found;
        // stray parentheses fall through to the plain substitution.
        let url_rep_match = url.includes('(')&&url.includes(')') ? url.match(/.*?\((.*)\)/) : null;
        if(url_rep_match){
            let url_rep = url_rep_match[1];
            let cnt_page = url_rep.replaceAll('fypage', cateObj.pg);
            let cnt_pg = eval(cnt_page);
            url = url.replaceAll(url_rep,cnt_pg).replaceAll('(','').replaceAll(')','');
        }else{
            url = url.replaceAll('fypage',cateObj.pg);
        }
    }

    MY_URL = url;
    console.log(MY_URL);
    p = p.trim();
    const MY_CATE = cateObj.tid;
    if(p.startsWith('js:')){
        var MY_FL = cateObj.extend;
        const TYPE = 'cate';
        var input = MY_URL;
        const MY_PAGE = cateObj.pg;
        var desc = '';
        eval(p.trim().replace('js:',''));
        d = VODS;
    }else {
        p = p.split(';');
        if (p.length < 5) {
            return '{}'
        }
        let _ps = parseTags.getParse(p[0]);
        _pdfa = _ps.pdfa;
        _pdfh = _ps.pdfh;
        _pd = _ps.pd;
        let is_json = p[0].startsWith('json:');
        p[0] = p[0].replace(/^(jsp:|json:|jq:)/,'');
        try {
            let html = getHtml(MY_URL);
            if (html) {
                if(is_json){
                    html = dealJson(html);
                }
                let list = _pdfa(html, p[0]);
                list.forEach(it => {
                    // Several link selectors may be combined with '+'.
                    let links = p[4].split('+').map(p4=>{
                        return !rule.detailUrl?_pd(it, p4,MY_URL):_pdfh(it, p4);
                    });
                    let link = links.join('$');
                    // With a detailUrl template the category travels inside the id.
                    let vod_id = rule.detailUrl?MY_CATE+'$'+link:link;

                    let vod_name = _pdfh(it, p[1]).replace(/\n|\t/g,'').trim();
                    let vod_pic = _pd(it, p[2],MY_URL);

                    if(rule.二级==='*'){
                        vod_id = vod_id+'@@'+vod_name+'@@'+vod_pic;
                    }
                    d.push({
                        'vod_id': vod_id,
                        'vod_name': vod_name,
                        'vod_pic': vod_pic,
                        'vod_remarks': _pdfh(it, p[3]).replace(/\n|\t/g,'').trim(),
                    });
                });
            }
        } catch (e) {
            console.log(e.message);
        }
    }
    if(rule.图片来源){
        d.forEach(it=>{
            if(it.vod_pic&&it.vod_pic.startsWith('http')){
                it.vod_pic = it.vod_pic + rule.图片来源;
            }
        });
    }
    if(d.length>0){
        print(d.slice(0,2));
    }
    let pagecount = 0;
    if(rule.pagecount && typeof(rule.pagecount) === 'object' && rule.pagecount.hasOwnProperty(MY_CATE)){
        print(`MY_CATE:${MY_CATE},pagecount:${JSON.stringify(rule.pagecount)}`);
        pagecount = parseInt(rule.pagecount[MY_CATE], 10);
    }
    // Placeholder entry returned for empty pages (its text says it guards against endless requests).
    let nodata = {
        list:[{vod_name:'无数据,防无限请求',vod_id:'no_data',vod_remarks:'不要点,会崩的',vod_pic:'https://ghproxy.net/https://raw.githubusercontent.com/hjdhnx/dr_py/main/404.jpg'}],
        total:1,pagecount:1,page:1,limit:1
    };
    let vod = d.length<1?JSON.stringify(nodata):JSON.stringify({
        'page': parseInt(cateObj.pg, 10),
        'pagecount': pagecount||999,
        'limit': 20,
        'total': 999,
        'list': d,
    });
    return vod
}
|
||
|
||
/**
 * Parse a search result page.
 *
 * searchObj.搜索 is either '*' (reuse rule.一级), 'js:...' code (result expected
 * in the global VODS) or a ';'-separated selector rule with at least 5
 * segments, where a '*' segment is inherited from rule.一级. The search URL
 * may carry a request method after ';' (post / postjson) and a request body
 * after '#'.
 *
 * NOTE: the 'js:' branch runs rule-supplied code through eval; the local
 * names visible to it (TYPE, MY_PAGE, KEY, input, detailUrl, d, ...) must stay as they are.
 *
 * @param searchObj {searchUrl, 搜索, wd, pg, quick}
 * @returns {string} JSON string with page/pagecount/limit/total/list, or '{}'
 */
function searchParse(searchObj) {
    fetch_params = JSON.parse(JSON.stringify(rule_fetch_params));
    let d = [];
    if(!searchObj.searchUrl){
        return '{}'
    }
    let p = searchObj.搜索==='*'&&rule.一级 ? rule.一级 : searchObj.搜索;
    if(!p||typeof(p)!=='string'){
        return '{}'
    }
    p = p.trim();
    // rule.一级 may be missing when only 搜索 is configured; inherit nothing then
    // instead of throwing on undefined.split.
    let pp = typeof(rule.一级)==='string' ? rule.一级.split(';') : [];
    let url = searchObj.searchUrl.replaceAll('**', searchObj.wd).replaceAll('fypage', searchObj.pg);
    MY_URL = url;
    console.log(MY_URL);
    if(p.startsWith('js:')){
        const TYPE = 'search';
        const MY_PAGE = searchObj.pg;
        const KEY = searchObj.wd;
        var input = MY_URL;
        var detailUrl = rule.detailUrl||'';
        eval(p.trim().replace('js:',''));
        d = VODS;
    }else{
        p = p.split(';');
        if (p.length < 5) {
            return '{}'
        }
        let p0 = getPP(p,0,pp,0);
        let _ps = parseTags.getParse(p0);
        _pdfa = _ps.pdfa;
        _pdfh = _ps.pdfh;
        _pd = _ps.pd;
        let is_json = p0.startsWith('json:');
        p0 = p0.replace(/^(jsp:|json:|jq:)/,'');
        try {
            // URL layout: "address#body;method"
            let req_method = MY_URL.split(';').length>1?MY_URL.split(';')[1].toLowerCase():'get';
            let html;
            if(req_method==='post'){
                let rurls = MY_URL.split(';')[0].split('#')
                let rurl = rurls[0]
                let params = rurls.length > 1 ?rurls[1]:'';
                print(`post=》rurl:${rurl},params:${params}`);
                let _fetch_params = JSON.parse(JSON.stringify(rule_fetch_params));
                let postData = {body:params};
                Object.assign(_fetch_params,postData);
                html = post(rurl,_fetch_params);
            }else if(req_method==='postjson'){
                let rurls = MY_URL.split(';')[0].split('#')
                let rurl = rurls[0]
                let params = rurls.length > 1 ?rurls[1]:'';
                print(`postjson-》rurl:${rurl},params:${params}`);
                try{
                    params = JSON.parse(params);
                }catch (e) {
                    params = '{}'
                }
                let _fetch_params = JSON.parse(JSON.stringify(rule_fetch_params));
                let postData = {body:params};
                Object.assign(_fetch_params,postData);
                html = post(rurl,_fetch_params);
            }else{
                html = getHtml(MY_URL);
            }
            if (html) {
                // Verification/captcha page: try to pass it, store the cookie, then fetch again.
                if(/系统安全验证|输入验证码/.test(html)){
                    let cookie = verifyCode(MY_URL);
                    if(cookie){
                        console.log(`本次成功过验证,cookie:${cookie}`);
                        setItem(RULE_CK,cookie);
                    }else{
                        console.log(`本次自动过搜索验证失败,cookie:${cookie}`);
                    }
                    html = getHtml(MY_URL);
                }
                // Diagnostic only: a page without the keyword is logged, parsing continues.
                if(!html.includes(searchObj.wd)){
                    console.log('搜索结果源码未包含关键字,疑似搜索失败,正为您打印结果源码');
                    console.log(html);
                }
                if(is_json){
                    html = dealJson(html);
                }
                let list = _pdfa(html, p0);
                let p1 = getPP(p, 1, pp, 1);
                let p2 = getPP(p, 2, pp, 2);
                let p3 = getPP(p, 3, pp, 3);
                let p4 = getPP(p, 4, pp, 4);
                let p5 = getPP(p,5,pp,5);
                list.forEach(it => {
                    // Several link selectors may be combined with '+'.
                    let links = p4.split('+').map(_p4=>{
                        return !rule.detailUrl?_pd(it, _p4,MY_URL):_pdfh(it, _p4)
                    });
                    let link = links.join('$');
                    let content;
                    if(p.length > 5 && p[5]){
                        content = _pdfh(it, p5);
                    }else{
                        content = '';
                    }
                    let vod_id = link;
                    let vod_name = _pdfh(it, p1).replace(/\n|\t/g,'').trim();
                    let vod_pic = _pd(it, p2,MY_URL);
                    if(rule.二级==='*'){
                        // No detail rule: carry title and picture inside the id.
                        vod_id = vod_id+'@@'+vod_name+'@@'+vod_pic;
                    }
                    let ob = {
                        'vod_id': vod_id,
                        'vod_name': vod_name,
                        'vod_pic': vod_pic,
                        'vod_remarks': _pdfh(it, p3).replace(/\n|\t/g,'').trim(),
                        'vod_content': content.replace(/\n|\t/g,'').trim(),
                    };
                    d.push(ob);
                });
            }
        } catch (e) {
            print('搜索发生错误:'+e.message);
            return '{}'
        }
    }
    if(rule.图片来源){
        d.forEach(it=>{
            if(it.vod_pic&&it.vod_pic.startsWith('http')){
                it.vod_pic = it.vod_pic + rule.图片来源;
            }
        });
    }
    return JSON.stringify({
        'page': parseInt(searchObj.pg, 10),
        'pagecount': 10,
        'limit': 20,
        'total': 100,
        'list': d,
    });
}
|
||
|
||
/**
 * Parse a detail (second-level) page into a single vod object.
 *
 * detailObj.二级 selects the mode:
 *   - '*'        : no detail page; the list URL itself is offered for sniffing playback
 *   - 'js:...'   : rule code is evaluated and must leave its result in the global VOD
 *   - object     : selector rule with optional keys title, desc, content, img,
 *                  重定向, tabs, tab_text, lists, list_text, list_url, is_json/is_jsp/is_jq
 *
 * NOTE: rule-supplied code (二级访问前, 二级, 重定向, tabs, lists) is run through
 * eval. Every local declared here (vod, html, input, play_url, playFrom, ...)
 * is visible to that code, so local names must not be changed.
 *
 * @param detailObj {orId, url, 二级, 二级访问前, detailUrl, fyclass, tab_exclude, html}
 * @returns {string} JSON string {"list": [vod]}
 */
function detailParse(detailObj){
    let t1 = (new Date()).getTime();
    fetch_params = JSON.parse(JSON.stringify(rule_fetch_params));
    let orId = detailObj.orId;
    let vod_name = '片名';
    let vod_pic = '';
    let vod_id = orId;
    if(rule.二级==='*'){
        // The id was built as "link@@name@@pic"; recover name and picture from it.
        // vod_id itself must stay unsplit.
        let extra = orId.split('@@');
        vod_name = extra.length>1?extra[1]:vod_name;
        vod_pic = extra.length>2?extra[2]:vod_pic;
    }
    // Placeholder values; each is overwritten when the rule yields a value for it.
    let vod = {
        vod_id: vod_id,
        vod_name: vod_name,
        vod_pic: vod_pic,
        type_name: "类型",
        vod_year: "年份",
        vod_area: "地区",
        vod_remarks: "更新信息",
        vod_actor: "主演",
        vod_director: "导演",
        vod_content: "简介"
    };
    let p = detailObj.二级;
    let url = detailObj.url;
    let detailUrl = detailObj.detailUrl;
    let fyclass = detailObj.fyclass;
    let tab_exclude = detailObj.tab_exclude;
    let html = detailObj.html||'';
    MY_URL = url;
    if(detailObj.二级访问前){
        try {
            print(`尝试在二级访问前执行代码:${detailObj.二级访问前}`);
            eval(detailObj.二级访问前.trim().replace('js:',''));
        }catch (e) {
            print(`二级访问前执行代码出现错误:${e.message}`)
        }
    }
    if(p==='*'){
        vod.vod_play_from = '道长在线';
        vod.vod_remarks = detailUrl;
        vod.vod_actor = '没有二级,只有一级链接直接嗅探播放';
        vod.vod_content = MY_URL;
        vod.vod_play_url = '嗅探播放$' + MY_URL.split('@@')[0];
    }else if(typeof(p)==='string'&&p.trim().startsWith('js:')){
        const TYPE = 'detail';
        var input = MY_URL;
        var play_url = '';
        eval(p.trim().replace('js:',''));
        vod = VOD;
        console.log(JSON.stringify(vod));
    }else if(p&&typeof(p)==='object'){
        let tt1 = (new Date()).getTime();
        if(!html){
            html = getHtml(MY_URL);
        }
        print(`二级${MY_URL}仅获取源码耗时:${(new Date()).getTime()-tt1}毫秒`);
        let _ps;
        if(p.is_json){
            print('二级是json');
            _ps = parseTags.json;
            html = dealJson(html);
        }else if(p.is_jsp){
            print('二级是jsp');
            _ps = parseTags.jsp;
        }else if(p.is_jq){
            print('二级是jq');
            _ps = parseTags.jq;
        }else{
            print('二级默认jq');
            _ps = parseTags.jq;
        }
        let tt2 = (new Date()).getTime();
        print(`二级${MY_URL}获取并装载源码耗时:${tt2-tt1}毫秒`);
        _pdfa = _ps.pdfa;
        _pdfh = _ps.pdfh;
        _pd = _ps.pd;
        if(p.title){
            // title layout: "name selector[;type selector]"
            let p1 = p.title.split(';');
            vod.vod_name = _pdfh(html, p1[0]).replace(/\n|\t/g,'').trim();
            let type_name = p1.length > 1 ? _pdfh(html, p1[1]).replace(/\n|\t/g,'').replace(/ /g,'').trim():'';
            vod.type_name = type_name||vod.type_name;
        }
        if(p.desc){
            // desc layout: "remarks;year;area;actor;director" — best effort, errors ignored.
            try{
                let p1 = p.desc.split(';');
                vod.vod_remarks = _pdfh(html, p1[0]).replace(/\n|\t/g,'').trim();
                vod.vod_year = p1.length > 1 ? _pdfh(html, p1[1]).replace(/\n|\t/g,'').trim():'';
                vod.vod_area = p1.length > 2 ? _pdfh(html, p1[2]).replace(/\n|\t/g,'').trim():'';
                vod.vod_actor = p1.length > 3 ? _pdfh(html, p1[3]).replace(/\n|\t/g,'').trim():'';
                vod.vod_director = p1.length > 4 ? _pdfh(html, p1[4]).replace(/\n|\t/g,'').trim():'';
            }
            catch (e) {

            }
        }
        if(p.content){
            try{
                let p1 = p.content.split(';');
                vod.vod_content = _pdfh(html, p1[0]).replace(/\n|\t/g,'').trim();
            }
            catch (e) {}
        }
        if(p.img){
            try{
                let p1 = p.img.split(';');
                vod.vod_pic = _pd(html, p1[0],MY_URL);
            }
            catch (e) {}
        }

        let vod_play_from = '$$$';
        let playFrom = [];
        if(p.重定向&&p.重定向.startsWith('js:')){
            // The redirect code's completion value replaces the page source.
            print('开始执行重定向代码:'+p.重定向);
            html = eval(p.重定向.replace('js:',''));
        }

        if(p.tabs){
            if(p.tabs.startsWith('js:')){
                print('开始执行tabs代码:'+p.tabs);
                var input = MY_URL;
                eval(p.tabs.replace('js:',''));
                playFrom = TABS;
            }else{
                let p_tab = p.tabs.split(';')[0];
                let vHeader = _pdfa(html, p_tab);
                console.log(vHeader.length);
                let tab_text = p.tab_text||'body&&Text';
                // Counts occurrences so duplicate tab titles get a numeric suffix.
                let new_map = {};
                for(let v of vHeader){
                    let v_title = _pdfh(v,tab_text).trim();
                    console.log(v_title);
                    if(tab_exclude&& (new RegExp(tab_exclude)).test(v_title)){
                        continue;
                    }
                    if(!new_map.hasOwnProperty(v_title)){
                        new_map[v_title] = 1;
                    }else{
                        new_map[v_title] += 1;
                    }
                    if(new_map[v_title]>1){
                        v_title+=Number(new_map[v_title]-1);
                    }
                    playFrom.push(v_title);
                }
            }
            console.log(JSON.stringify(playFrom));
        }else{
            // No tab rule: a single default line.
            playFrom = ['道长在线']
        }
        vod.vod_play_from = playFrom.join(vod_play_from);

        let vod_play_url = '$$$';
        let vod_tab_list = [];
        if(p.lists){
            if(p.lists.startsWith('js:')){
                print('开始执行lists代码:'+p.lists);
                try {
                    var input = MY_URL;
                    var play_url = '';
                    eval(p.lists.replace('js:',''));
                    for(let i in LISTS){
                        if(LISTS.hasOwnProperty(i)){
                            try {
                                // Keep only "title$url" of each entry; extra '$' parts are dropped.
                                LISTS[i] = LISTS[i].map(it=>it.split('$').slice(0,2).join('$'));
                            }catch (e) {
                                print('格式化LISTS发生错误:'+e.message);
                            }
                        }
                    }
                    vod_play_url = LISTS.map(it=>it.join('#')).join(vod_play_url);
                }catch (e) {
                    print('js执行lists: 发生错误:'+e.message);
                }

            }else{
                let list_text = p.list_text||'body&&Text';
                let list_url = p.list_url||'a&&href';
                // p.tabs is optional (see the default line above); treat a missing
                // tab rule as empty instead of calling string methods on undefined.
                let tabsRule = typeof(p.tabs)==='string' ? p.tabs : '';
                let is_tab_js = tabsRule.trim().startsWith('js:');
                for(let i=0;i<playFrom.length;i++){
                    let tab_name = playFrom[i];
                    let tab_ext = tabsRule.split(';').length > 1 && !is_tab_js ? tabsRule.split(';')[1] : '';
                    // '#idv' is replaced by the tab name and '#id' by the tab index.
                    let p1 = p.lists.replaceAll('#idv', tab_name).replaceAll('#id', i);
                    tab_ext = tab_ext.replaceAll('#idv', tab_name).replaceAll('#id', i);
                    let tabName = tab_ext?_pdfh(html, tab_ext):tab_name;
                    console.log(tabName);
                    let new_vod_list = [];
                    let tt1 = (new Date()).getTime();
                    if(typeof (pdfl) ==='function'){
                        // Use the host-provided pdfl when it exists.
                        new_vod_list = pdfl(html, p1, list_text, list_url, MY_URL);
                    }else {
                        let vodList = [];
                        try {
                            vodList = _pdfa(html, p1);
                            console.log('len(vodList):'+vodList.length);
                        }catch (e) {
                            // Selector failures leave this tab empty.
                        }
                        for (let i = 0; i < vodList.length; i++) {
                            let it = vodList[i];
                            new_vod_list.push(_pdfh(it, list_text).trim() + '$' + _pd(it, list_url, MY_URL));
                        }
                    }
                    if(new_vod_list.length>0){
                        new_vod_list = forceOrder(new_vod_list,'',x=>x.split('$')[0]);
                        console.log(`drpy影响性能代码共计列表数循环次数:${new_vod_list.length},耗时:${(new Date()).getTime()-tt1}毫秒`);
                    }
                    let vlist = new_vod_list.join('#');
                    vod_tab_list.push(vlist);
                }
                vod_play_url = vod_tab_list.join(vod_play_url);
            }
        }
        vod.vod_play_url = vod_play_url;
    }
    if(rule.图片来源 && vod.vod_pic && vod.vod_pic.startsWith('http')){
        vod.vod_pic = vod.vod_pic + rule.图片来源;
    }
    // Restore the original id when the rule dropped it, or changed it although it
    // contains '$'.
    if(!vod.vod_id||(vod_id.includes('$')&&vod.vod_id!==vod_id)){
        vod.vod_id = vod_id;
    }
    let t2 = (new Date()).getTime();
    console.log(`加载二级界面${MY_URL}耗时:${t2-t1}毫秒`);
    return JSON.stringify({
        list: [vod]
    })
}
|
||
|
||
/**
 * Decide whether a play URL has to go through a resolver.
 * Direct media files (.m3u8/.mp4/.m4a before the query string) never do;
 * otherwise the answer is whatever 是否正版(url) reports.
 * @param url play URL
 * @returns {number} 1 when resolving is needed (also on any error), else 0
 */
function tellIsJx(url){
    try {
        const path = url.split('?')[0];
        if (/\.(m3u8|mp4|m4a)$/.test(path)) {
            return 0;
        }
        return 是否正版(url) ? 1 : 0;
    }catch (e) {
        return 1
    }
}
|
||
/**
 * Resolve the click on an episode button into a play descriptor.
 *
 * The URL is base64-decoded when it does not contain "http", then
 * URI-decoded. If the rule enables play_parse and provides lazy code, that
 * code is evaluated with the URL in `input` and may replace `input` with a
 * new URL or a complete descriptor object. Finally rule.play_json is merged in.
 *
 * NOTE: rule.lazy is run through eval and reads/writes the local `input`;
 * local names here must not be changed.
 *
 * @param playObj {url, flag, flags}
 * @returns {string} JSON string of the play descriptor ({parse, url, jx, ...})
 */
function playParse(playObj){
    fetch_params = JSON.parse(JSON.stringify(rule_fetch_params));
    MY_URL = playObj.url;
    if(!/http/.test(MY_URL)){
        try {
            MY_URL = base64Decode(MY_URL);
        }catch (e) {}
    }
    // decodeURIComponent throws URIError on a '%' that is not a valid escape;
    // keep the undecoded URL in that case instead of failing the whole play request.
    try {
        MY_URL = decodeURIComponent(MY_URL);
    }catch (e) {
        print('播放链接解码失败,使用原始链接:'+e.message);
    }
    var input = MY_URL; // exposed to the lazy code
    let common_play = {
        parse:1,
        url:input,
        jx:tellIsJx(input)
    };
    let lazy_play;
    if(!rule.play_parse||!rule.lazy){
        lazy_play = common_play;
    }else if(rule.play_parse&&rule.lazy&&typeof(rule.lazy)==='string'){
        try {
            let lazy_code = rule.lazy.replace('js:','').trim();
            print('开始执行js免嗅=>'+lazy_code);
            eval(lazy_code);
            // The lazy code may leave either a full descriptor or just a URL in input.
            lazy_play = typeof(input) === 'object'?input:{
                parse:1,
                jx:tellIsJx(input),
                url:input
            };
        }catch (e) {
            print('js免嗅错误:'+e.message);
            lazy_play = common_play;
        }
    }else{
        lazy_play = common_play;
    }
    if(Array.isArray(rule.play_json) && rule.play_json.length >0){
        // Non-empty array: merge the json of the first entry whose re matches the URL.
        let web_url = lazy_play.url;
        for(let pjson of rule.play_json){
            if(pjson.re && (pjson.re==='*'||web_url.match(new RegExp(pjson.re)))){
                if(pjson.json && typeof(pjson.json)==='object'){
                    let base_json = pjson.json;
                    lazy_play = Object.assign(lazy_play,base_json);
                    break;
                }
            }
        }
    }else if(rule.play_json && !Array.isArray(rule.play_json)){
        // Any other truthy value: force resolving.
        let base_json = {
            jx:1,
            parse:1,
        };
        lazy_play = Object.assign(lazy_play,base_json);
    }else if(!rule.play_json){
        // Falsy: never resolve.
        let base_json = {
            jx:0,
            parse:1,
        };
        lazy_play = Object.assign(lazy_play,base_json);
    }
    console.log(JSON.stringify(lazy_play));
    return JSON.stringify(lazy_play);
}
|
||
|
||
/**
 * Load a rule and normalise it into the module-level `rule` object.
 *
 * ext may be a rule object, the source text of a rule ("var rule = {...}"),
 * or an http(s) URL that returns such text. After loading, the rule inherits
 * from its template (rule.模板), missing fields get defaults, relative URLs
 * are joined with the host, header aliases are expanded, and finally the
 * rule's pre-processing code and init_test() run.
 *
 * NOTE: rule text, rule.hostJs and whitelisted User-Agent constant names are
 * run through eval; rule text comes from an external source. Errors anywhere
 * in here are logged, not thrown.
 *
 * @param ext rule object, rule source text, or URL of the rule source
 */
function init(ext) {
    console.log('init');
    try {
        // The templates are obtained through getMubans() on every init; an older
        // note in this file says sharing the imported template object caused
        // values to leak between sources after switching.
        let muban = 模板.getMubans();
        if (typeof ext == 'object'){
            rule = ext;
        } else if (typeof ext == 'string') {
            if (ext.startsWith('http')) {
                let js = request(ext,{'method':'GET'});
                if (js){
                    // Turn the declaration into an assignment to the module-level rule.
                    eval(js.replace('var rule', 'rule'));
                }
            } else {
                eval(ext.replace('var rule', 'rule'));
            }
        }
        if (rule.模板 && muban.hasOwnProperty(rule.模板)) {
            print('继承模板:'+rule.模板);
            // Merge into a fresh object so the template itself is never mutated.
            rule = Object.assign({}, muban[rule.模板], rule);
        }
        /** Fill in key rule fields that were not provided **/
        let rule_cate_excludes = (rule.cate_exclude||'').split('|').filter(it=>it.trim());
        let rule_tab_excludes = (rule.tab_exclude||'').split('|').filter(it=>it.trim());
        // The global exclusion lists are always appended to the rule's own.
        rule_cate_excludes = rule_cate_excludes.concat(CATE_EXCLUDE.split('|').filter(it=>it.trim()));
        rule_tab_excludes = rule_tab_excludes.concat(TAB_EXCLUDE.split('|').filter(it=>it.trim()));

        rule.cate_exclude = rule_cate_excludes.join('|');
        rule.tab_exclude = rule_tab_excludes.join('|');
        rule.host = (rule.host||'').rstrip('/');
        HOST = rule.host;
        if(rule.hostJs){
            // hostJs may compute the real host at runtime by assigning HOST.
            console.log(`检测到hostJs,准备执行...`);
            try {
                eval(rule.hostJs);
                rule.host = HOST.rstrip('/');
            }catch (e) {
                console.log(`执行${rule.hostJs}获取host发生错误:`+e.message);
            }
        }
        rule.url = rule.url||'';
        rule.double = rule.double||false;
        rule.homeUrl = rule.homeUrl||'';
        rule.detailUrl = rule.detailUrl||'';
        rule.searchUrl = rule.searchUrl||'';
        rule.homeUrl = rule.host&&rule.homeUrl?urljoin(rule.host,rule.homeUrl):(rule.homeUrl||rule.host);
        rule.detailUrl = rule.host&&rule.detailUrl?urljoin(rule.host,rule.detailUrl):rule.detailUrl;
        rule.二级访问前 = rule.二级访问前||'';
        if(rule.url.includes('[')&&rule.url.includes(']')){
            // "normal-url[first-page-url]": join both parts with the host separately.
            let u1 = rule.url.split('[')[0]
            let u2 = rule.url.split('[')[1].split(']')[0]
            rule.url = rule.host && rule.url?urljoin(rule.host,u1)+'['+urljoin(rule.host,u2)+']':rule.url;
        }else{
            rule.url = rule.host && rule.url ? urljoin(rule.host,rule.url) : rule.url;
        }
        rule.searchUrl = rule.host && rule.searchUrl ? urljoin(rule.host,rule.searchUrl) : rule.searchUrl;

        rule.timeout = rule.timeout||5000;
        rule.encoding = rule.编码||rule.encoding||'utf-8';
        rule.search_encoding = rule.搜索编码||rule.search_encoding||'';
        rule.图片来源 = rule.图片来源||'';
        rule.play_json = rule.hasOwnProperty('play_json')?rule.play_json:[];
        rule.pagecount = rule.hasOwnProperty('pagecount')?rule.pagecount:{};
        if(rule.headers && typeof(rule.headers) === 'object'){
            try {
                let header_keys = Object.keys(rule.headers);
                for(let k of header_keys){
                    if(k.toLowerCase() === 'user-agent'){
                        let v = rule.headers[k];
                        console.log(v);
                        // Only these constant names are expanded to their values.
                        if(['MOBILE_UA','PC_UA','UC_UA','IOS_UA','UA'].includes(v)){
                            rule.headers[k] = eval(v);
                        }
                    }else if(k.toLowerCase() === 'cookie'){
                        let v = rule.headers[k];
                        if(v && v.startsWith('http')){
                            // A cookie given as URL is replaced by that URL's response body.
                            console.log(v);
                            try {
                                v = fetch(v);
                                console.log(v);
                                rule.headers[k] = v;
                            }catch (e) {
                                console.log(`从${v}获取cookie发生错误:`+e.message);
                            }
                        }
                    }
                }
            }catch (e) {
                console.log('处理headers发生错误:'+e.message);
            }
        }
        rule_fetch_params  = {'headers': rule.headers||false, 'timeout': rule.timeout, 'encoding': rule.encoding};
        oheaders = rule.headers||{};
        // Storage key: the host-provided `key` when present, else derived from title/host.
        RKEY = typeof(key)!=='undefined'&&key?key:'drpy_' + (rule.title || rule.host);
        pre(); // run the rule's pre-processing code
        init_test();
    }catch (e) {
        console.log('init_test发生错误:'+e.message);
    }
}
|
||
|
||
// Home page source saved by homeParse so that homeVodParse can reuse it
// instead of requesting the page again; homeVodParse resets it to undefined
// after reading it.
let homeHtmlCache = undefined;
|
||
|
||
/**
 * Entry point: return the home page categories and filters of the current rule.
 * @param filter filter dictionary passed by the host (not used here)
 * @returns {string} JSON string produced by homeParse
 */
function home(filter) {
    console.log("home");
    const {filter: ruleFilter, homeUrl, class_name, class_url, class_parse, cate_exclude} = rule;
    return homeParse({
        filter: ruleFilter || false,
        MY_URL: homeUrl,
        class_name: class_name || '',
        class_url: class_url || '',
        class_parse: class_parse || '',
        cate_exclude: cate_exclude,
    });
}
|
||
|
||
/**
 * Entry point: return the home page recommendation list of the current rule.
 * @param params passed by the host (not used here)
 * @returns {string} JSON string produced by homeVodParse
 */
function homeVod(params) {
    console.log("homeVod");
    const {推荐, double, homeUrl, detailUrl} = rule;
    return homeVodParse({
        推荐: 推荐,
        double: double,
        homeUrl: homeUrl,
        detailUrl: detailUrl
    });
}
|
||
|
||
/**
 * Entry point: return one page of a category listing of the current rule.
 * @param tid category id
 * @param pg page number (number or numeric string); a missing or non-numeric
 *           value is treated as page 1
 * @param filter whether a filter selection is active
 * @param extend the selected filter values
 * @returns {string} JSON string produced by categoryParse
 */
function category(tid, pg, filter, extend) {
    // Parse as decimal, and keep NaN out of the page URL and the JSON result.
    let page = parseInt(pg, 10);
    if (Number.isNaN(page)) {
        page = 1;
    }
    let cateObj = {
        url: rule.url,
        一级: rule.一级,
        tid: tid,
        pg: page,
        filter: filter,
        extend: extend
    };
    return categoryParse(cateObj)
}
|
||
|
||
/**
 * Entry point: return the detail data for one item of the current rule.
 * @param vod_url the vod_id from a listing, optionally prefixed with the
 *                category as "fyclass$vod_id" and optionally followed by
 *                "@@name@@pic"
 * @returns {string} JSON string produced by detailParse
 */
function detail(vod_url) {
    const orId = vod_url;
    let fyclass = '';
    log('orId:'+orId);
    if (vod_url.includes('$')) {
        const parts = vod_url.split('$');
        fyclass = parts[0];
        vod_url = parts[1];
    }
    // Anything after the first '@@' is extra data, not part of the link.
    const detailUrl = vod_url.split('@@')[0];
    let url;
    if (detailUrl.includes('/')) {
        // A path or full URL: resolve against the home URL.
        url = urljoin(rule.homeUrl, detailUrl);
    } else if (!detailUrl.startsWith('http')) {
        // A bare id: fill it into the detailUrl template.
        url = rule.detailUrl.replaceAll('fyid', detailUrl).replaceAll('fyclass', fyclass);
    } else {
        url = detailUrl;
    }
    return detailParse({
        orId: orId,
        url: url,
        二级: rule.二级,
        二级访问前: rule.二级访问前,
        detailUrl: detailUrl,
        fyclass: fyclass,
        tab_exclude: rule.tab_exclude,
    });
}
|
||
|
||
/**
 * Entry point: resolve the click on an episode button.
 * @param flag line (play source) name
 * @param id link of the play button
 * @param flags globally configured list of flags that need resolving
 * @returns {string} JSON string produced by playParse
 */
function play(flag, id, flags) {
    return playParse({url: id, flag, flags});
}
|
||
|
||
/**
 * Entry point: return the search results of the current rule.
 * The keyword is re-encoded first when the rule declares a non-UTF-8 search
 * encoding (or, failing that, a non-UTF-8 global encoding).
 * @param wd search keyword
 * @param quick whether the request comes from quick search
 * @param pg optional page number (number or numeric string); defaults to 1
 * @returns {string} JSON string produced by searchParse
 */
function search(wd, quick, pg) {
    if(rule.search_encoding){
        if(rule.search_encoding.toLowerCase()!=='utf-8'){
            // encode with the search-specific encoding
            wd = encodeStr(wd,rule.search_encoding);
        }
    }else if(rule.encoding && rule.encoding.toLowerCase()!=='utf-8'){
        // encode with the rule's global encoding
        wd = encodeStr(wd,rule.encoding);
    }
    let searchObj = {
        searchUrl: rule.searchUrl,
        搜索: rule.搜索,
        wd: wd,
        // Callers that pass no page keep getting the first page.
        pg: parseInt(pg, 10) || 1,
        quick: quick,
    };
    return searchParse(searchObj)
}
|
||
|
||
// Returns a fresh object holding the rule-engine entry points.
function DRPY(){
    const api = {init, home, homeVod, category, detail, play, search};
    return api;
}
|
||
|
||
// Default export: the entry points themselves plus the DRPY() factory.
export default {
    init,
    home,
    homeVod,
    category,
    detail,
    play,
    search,
    DRPY,
}