From 81bf450749a21ca43e4b0f22989d4c9ccbab537e Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?2=E5=93=88=E7=A4=BE=E5=8C=BA?= Date: Wed, 19 Oct 2022 10:01:10 +0800 Subject: [PATCH] Update drpy.js --- drpy/drpy.js | 1312 ++++++++++++++++---------------------------------- 1 file changed, 417 insertions(+), 895 deletions(-) diff --git a/drpy/drpy.js b/drpy/drpy.js index b44f99e..f457e11 100644 --- a/drpy/drpy.js +++ b/drpy/drpy.js @@ -1,30 +1,22 @@ -// import 'https://raw.iqiq.io/2hacc/TVBox/main/drpy/libs/es6py.js'; -// import {是否正版,urlDeal,setResult,setResult2,setHomeResult,maoss,urlencode} from 'http://192.168.10.103:5705/libs/es6py.js'; -// import 'http://192.168.1.124:5705/libs/es6py.js'; -import cheerio from 'https://raw.iqiq.io/2hacc/TVBox/main/drpy/libs/cheerio.min.js'; -// import cheerio from 'http://192.168.10.103:5705/libs/cheerio.min.js'; -import 'https://raw.iqiq.io/2hacc/TVBox/main/drpy/libs/crypto-js.js'; -import 'https://raw.iqiq.io/2hacc/TVBox/main/drpy/libs/drT.js'; -// import 'http://192.168.10.103:5705/libs/drT.js'; -// import muban from 'https://raw.iqiq.io/2hacc/TVBox/main/drpy/js/模板.js'; -// import muban from 'http://192.168.10.103:5705/admin/view/模板.js'; +import 'https://raw.iqiq.io/2hacc/TVBox/main/drpy/lib/util.js'; +import cheerio from 'https://raw.iqiq.io/2hacc/TVBox/main/drpy/lib/cheerio.min.js'; +import 'https://raw.iqiq.io/2hacc/TVBox/main/drpy/lib/crypto-js.js' +// import muban from 'https://gitcode.net/qq_32394351/dr_py/-/raw/master/js/模板.js'; // const key = 'drpy_zbk'; // eval(req('http://192.168.1.124:5705/libs/es6py.js').content); -function init_test(){ - // console.log(typeof(CryptoJS)); +function init_test() { console.log("init_test_start"); console.log(RKEY); console.log(JSON.stringify(rule)); - // console.log('123456的md5值是:'+md5('123456')); + // clearItem(RULE_CK); + // console.log(JSON.stringify(rule)); // let aa = base64Encode('编码测试一下') // log(aa); // let bb = base64Decode(aa); - // log('bb:'+bb); - // clearItem(RULE_CK); - // console.log(JSON.stringify(rule)); + // log('bb:' + bb); // console.log(request('https://www.baidu.com',{withHeaders:true})); - // console.log(request('https://www.baidu.com/favicon.ico',{toBase64:true})); + // console.log(request('https://www.baidu.com/favicon.ico', { toBase64: true })); // require('http://192.168.10.99:5705/txt/pluto/drT.js'); // console.log(typeof(drT)); // console.log(drT.renderText('{{fl.cate}},hi, {{fl}}哈哈.{{fl}}',{sort: 1,cate:'movie'},'fl')); @@ -33,15 +25,13 @@ function init_test(){ let rule = {}; /** 已知问题记录 - * 1.影魔的jinjia2引擎不支持 {{fl}}对象直接渲染 (有能力解决的话尽量解决下,支持对象直接渲染字符串转义,如果加了|safe就不转义)[影魔牛逼,最新的文件发现这问题已经解决了] - * Array.prototype.append = Array.prototype.push; 这种js执行后有毛病,for in 循环列表会把属性给打印出来 (这个大毛病需要重点排除一下) - * 2.import es6py.js但是里面的函数没有被装载进来.比如drpy规则报错setResult2 is undefiend(合并文件了可以不管了) + * 1.影魔的jinjia2引擎不支持 {{fl}}对象直接渲染 + * Array.prototype.append = Array.prototype.push; 这种js执行后有毛病,for in 循环列表会把属性给打印出来 + * 2.import es6py.js但是里面的函数没有被装载进来.比如drpy规则报错setResult2 is undefiend * 3.无法重复导入cheerio(怎么解决drpy和parseTag里都需要导入cheerio的问题) 无法在副文件导入cheerio (现在是全部放在drpy一个文件里了,凑合解决?) - * 4.有个错误不知道哪儿来的 executeScript: com.quickjs.JSObject$Undefined cannot be cast to java.lang.String 在 点击选集播放打印init_test_end后面打印(貌似不影响使用) + * 4.有个错误不知道哪儿来的 executeScript: com.quickjs.JSObject$Undefined cannot be cast to java.lang.String 在 点击选集播放打印init_test_end后面打印 * 5.需要实现 stringify 函数,比起JSON.stringify函数,它会原封不动保留中文不会编码unicode - * 6.base64Encode,base64Decode,md5函数还没有实现 (抄影魔代码实现了) - * 7.eval(getCryptoJS());还没有实现 (可以空实现了,以后遇到能忽略) - * done: jsp:{pdfa,pdfh,pd},json:{pdfa,pdfh,pd},jq:{pdfa,pdfh,pd} + * todo: jsp:{pdfa,pdfh,pd},json:{pdfa,pdfh,pd},jq:{pdfa,pdfh,pd} * * 电脑看日志调试 adb tcpip 5555 adb connect 192.168.10.192 @@ -64,9 +54,8 @@ const TAB_EXCLUDE = '猜你|喜欢|APP|下载|剧情|热播'; const OCR_RETRY = 3;//ocr验证重试次数 // const OCR_API = 'http://dm.mudery.com:10000';//ocr在线识别接口 // const OCR_API = 'http://192.168.3.239:5705/parse/ocr';//ocr在线识别接口 -// const OCR_API = 'http://cms.nokia.press/parse/ocr';//ocr在线识别接口 -const OCR_API = 'http://cms.nokia.press:5706/parse/ocr';//ocr在线识别接口 -if(typeof(MY_URL)==='undefined'){ +const OCR_API = 'http://cms.nokia.press/parse/ocr';//ocr在线识别接口 +if (typeof (MY_URL) === 'undefined') { var MY_URL; // 全局注入变量,pd函数需要 } var RKEY; // 源的唯一标识 @@ -84,186 +73,49 @@ const DOM_CHECK_ATTR = /(url|src|href|data-original|data-src)$/; const SELECT_REGEX = /:eq|:lt|:gt|#/g; const SELECT_REGEX_A = /:eq|:lt|:gt/g; -/** -es6py扩展 - */ -if (typeof Object.assign != 'function') { - Object.assign = function () { - var target = arguments[0]; - for (var i = 1; i < arguments.length; i++) { - var source = arguments[i]; - for (var key in source) { - if (Object.prototype.hasOwnProperty.call(source, key)) { - target[key] = source[key]; - } - } - } - return target; - }; -} -if (!String.prototype.includes) { - String.prototype.includes = function (search, start) { - if (typeof start !== 'number') { - start = 0; - } - - if (start + search.length > this.length) { - return false; - } else { - return this.indexOf(search, start) !== -1; - } - }; -} - -if (!Array.prototype.includes) { - Object.defineProperty(Array.prototype, 'includes', { - value: function (searchElement, fromIndex) { - - if (this == null) {//this是空或者未定义,抛出错误 - throw new TypeError('"this" is null or not defined'); - } - - var o = Object(this);//将this转变成对象 - var len = o.length >>> 0;//无符号右移0位,获取对象length属性,如果未定义就会变成0 - - if (len === 0) {//length为0直接返回false未找到目标值 - return false; - } - - var n = fromIndex | 0;//查找起始索引 - var k = Math.max(n >= 0 ? n : len - Math.abs(n), 0);//计算正确起始索引,因为有可能是负值 - - while (k < len) {//从起始索引处开始循环 - if (o[k] === searchElement) {//如果某一位置与寻找目标相等,返回true,找到了 - return true; - } - k++; - } - return false;//未找到,返回false - } - }); -} -if (typeof String.prototype.startsWith != 'function') { - String.prototype.startsWith = function (prefix){ - return this.slice(0, prefix.length) === prefix; - }; -} -if (typeof String.prototype.endsWith != 'function') { - String.prototype.endsWith = function(suffix) { - return this.indexOf(suffix, this.length - suffix.length) !== -1; - }; -} -Object.prototype.myValues=function(obj){ - if(obj ==null) { - throw new TypeError("Cannot convert undefined or null to object"); - } - var res=[] - for(var k in obj){ - if(obj.hasOwnProperty(k)){//需判断是否是本身的属性 - res.push(obj[k]); - } - } - return res; -} -if (typeof Object.prototype.values != 'function') { - Object.prototype.values=function(obj){ - if(obj ==null) { - throw new TypeError("Cannot convert undefined or null to object"); - } - var res=[] - for(var k in obj){ - if(obj.hasOwnProperty(k)){//需判断是否是本身的属性 - res.push(obj[k]); - } - } - return res; - } -} -if (typeof Array.prototype.join != 'function') { - Array.prototype.join = function (emoji) { - // emoji = emoji||','; - emoji = emoji||''; - let self = this; - let str = ""; - let i = 0; - if (!Array.isArray(self)) {throw String(self)+'is not Array'} - if(self.length===0){return ''} - if (self.length === 1){return String(self[0])} - i = 1; - str = this[0]; - for (; i < self.length; i++) { - str += String(emoji)+String(self[i]); - } - return str; - }; -} - -String.prototype.rstrip = function (chars) { - let regex = new RegExp(chars + "$"); - return this.replace(regex, ""); -}; - -Array.prototype.append = Array.prototype.push; -String.prototype.strip = String.prototype.trim; -function 是否正版(vipUrl){ - let flag = new RegExp('qq\.com|iqiyi\.com|youku\.com|mgtv\.com|bilibili\.com|sohu\.com|ixigua\.com|pptv\.com|miguvideo\.com|le\.com|1905\.com|fun\.tv'); - return flag.test(vipUrl); -} -function urlDeal(vipUrl){ - if(!vipUrl){ - return '' - } - if(!是否正版(vipUrl)){ - return vipUrl - } - if(!/miguvideo/.test(vipUrl)){ - vipUrl=vipUrl.split('#')[0].split('?')[0]; - } - return vipUrl -} -function setResult(d){ - if(!Array.isArray(d)){ +function setResult(d) { + if (!Array.isArray(d)) { return [] } VODS = []; // print(d); - d.forEach(function (it){ + d.forEach(function (it) { let obj = { - vod_id:it.url||'', - vod_name: it.title||'', - vod_remarks: it.desc||'', - vod_content: it.content||'', - vod_pic: it.pic_url||it.img||'', + vod_id: it.url || '', + vod_name: it.title || '', + vod_remarks: it.desc || '', + vod_content: it.content || '', + vod_pic: it.pic_url || it.img || '', }; let keys = Object.keys(it); - if(keys.includes('tname')){ - obj.type_name = it.tname||''; + if (keys.includes('tname')) { + obj.type_name = it.tname || ''; } - if(keys.includes('tid')){ - obj.type_id = it.tid||''; + if (keys.includes('tid')) { + obj.type_id = it.tid || ''; } - if(keys.includes('year')){ - obj.vod_year = it.year||''; + if (keys.includes('year')) { + obj.vod_year = it.year || ''; } - if(keys.includes('actor')){ - obj.vod_actor = it.actor||''; + if (keys.includes('actor')) { + obj.vod_actor = it.actor || ''; } - if(keys.includes('director')){ - obj.vod_director = it.director||''; + if (keys.includes('director')) { + obj.vod_director = it.director || ''; } - if(keys.includes('area')){ - obj.vod_area = it.area||''; + if (keys.includes('area')) { + obj.vod_area = it.area || ''; } VODS.push(obj); }); return VODS } -function setResult2(res){ - VODS = res.list||[]; +function setResult2(res) { + VODS = res.list || []; return VODS } -function setHomeResult(res){ - if(!res||typeof(res)!=='object'){ +function setHomeResult(res) { + if (!res || typeof (res) !== 'object') { return [] } return setResult(res.list); @@ -300,11 +152,10 @@ function rc(js) { // 千万不要用for in 推荐 forEach (for in 会打乱顺序) //猫函数 function maoss(jxurl, ref, key) { - fetch_params = JSON.parse(JSON.stringify(rule_fetch_params)); eval(getCryptoJS()); try { var getVideoInfo = function (text) { - return CryptoJS.AES.decrypt(text, key, {iv: iv, padding: CryptoJS.pad.Pkcs7}).toString(CryptoJS.enc.Utf8); + return CryptoJS.AES.decrypt(text, key, { iv: iv, padding: CryptoJS.pad.Pkcs7 }).toString(CryptoJS.enc.Utf8); }; var token_key = key == undefined ? 'dvyYRQlnPRCMdQSe' : key; if (ref) { @@ -347,155 +198,26 @@ function maoss(jxurl, ref, key) { } } -function urlencode (str) { - str = (str + '').toString(); - return encodeURIComponent(str).replace(/!/g, '%21').replace(/'/g, '%27').replace(/\(/g, '%28'). - replace(/\)/g, '%29').replace(/\*/g, '%2A').replace(/%20/g, '+'); -} - -function base64Encode(text){ - return CryptoJS.enc.Base64.stringify(CryptoJS.enc.Utf8.parse(text)); - // return text -} - -function base64Decode(text){ - return CryptoJS.enc.Utf8.stringify(CryptoJS.enc.Base64.parse(text)); - // return text -} - -function md5(text) { - return CryptoJS.MD5(text).toString(); -} - -function getCryptoJS(){ - // return request('https://raw.iqiq.io/2hacc/TVBox/main/drpy/libs/crypto-hiker.js'); - return 'console.log("CryptoJS已装载");' -} - let VODS = [];// 一级或者搜索需要的数据列表 let VOD = {};// 二级的单个数据 -let TABS = [];// 二级的自定义线路列表 如: TABS=['道长在线','道长在线2'] -let LISTS = [];// 二级的自定义选集播放列表 如: LISTS=[['第1集$http://1.mp4','第2集$http://2.mp4'],['第3集$http://1.mp4','第4集$http://2.mp4']] -globalThis.encodeUrl = urlencode; -globalThis.urlencode = urlencode; - - /** - * url拼接 - * @param fromPath 初始当前页面url - * @param nowPath 相对当前页面url - * @returns {*} - */ -function urljoin(fromPath, nowPath) { - fromPath = fromPath||''; - nowPath = nowPath||''; - return joinUrl(fromPath, nowPath); - // try { - // // import Uri from './uri.min.js'; - // // var Uri = require('./uri.min.js'); - // // eval(request('https://cdn.bootcdn.net/ajax/libs/URI.js/1.19.11/URI.min.js')); - // // let new_uri = URI(nowPath, fromPath); - - // let new_uri = Uri(nowPath, fromPath); - // new_uri = new_uri.toString(); - // // console.log(new_uri); - // // return fromPath + nowPath - // return new_uri - // } - // catch (e) { - // console.log('urljoin发生错误:'+e.message); - // if(nowPath.startsWith('http')){ - // return nowPath - // }if(nowPath.startsWith('/')){ - // return getHome(fromPath)+nowPath - // } - // return fromPath+nowPath - // } -} -var urljoin2 = urljoin; - -// 内置 pdfh,pdfa,pd -const defaultParser = { - pdfh:pdfh, - pdfa:pdfa, - pd(html,parse,uri){ - let ret = this.pdfh(html,parse); - if(typeof(uri)==='undefined'||!uri){ - uri = ''; - } - if(DOM_CHECK_ATTR.test(parse)){ - if(/http/.test(ret)){ - ret = ret.substr(ret.indexOf('http')); - }else{ - ret = urljoin(MY_URL,ret) - } - } - return ret - }, -}; - - -/** - * pdfh原版优化,能取style属性里的图片链接 - * @param html 源码 - * @param parse 解析表达式 - * @returns {string|*} - */ -function pdfh2(html,parse){ - let html2 = html; - try { - if(typeof(html)!=='string'){ - html2 = html.rr(html.ele).toString(); - } - }catch (e) { - print('html对象转文本发生了错误:'+e.message); - } - let result = defaultParser.pdfh(html2,parse); - let option = parse.includes('&&')?parse.split('&&').slice(-1)[0]:parse.split(' ').slice(-1)[0]; - if(/style/.test(option.toLowerCase())&&/url\(/.test(result)){ - try { - result = result.match(/url\((.*?)\)/)[1]; - }catch (e) {} - } - return result -} - -/** - * pdfa原版优化,可以转换jq的html对象 - * @param html - * @param parse - * @returns {*} - */ -function pdfa2(html,parse){ - let html2 = html; - try { - if(typeof(html)!=='string'){ - html2 = html.rr(html.ele).toString(); - } - }catch (e) { - print('html对象转文本发生了错误:'+e.message); - } - return defaultParser.pdfa(html2,parse); -} - -/** - * pd原版方法重写-增加自动urljoin + * 重写pd方法-增加自动urljoin(没法重写,改个名继续骗) * @param html * @param parse * @param uri * @returns {*} */ -function pd2(html,parse,uri){ - let ret = pdfh2(html,parse); - if(typeof(uri)==='undefined'||!uri){ +function pD(html, parse, uri) { + let ret = pdfh(html, parse); + if (typeof (uri) === 'undefined' || !uri) { uri = ''; } - if(DOM_CHECK_ATTR.test(parse)){ - if(/http/.test(ret)){ + if (DOM_CHECK_ATTR.test(parse)) { + if (/http/.test(ret)) { ret = ret.substr(ret.indexOf('http')); - }else{ - ret = urljoin(MY_URL,ret) + } else { + ret = urljoin(MY_URL, ret) } } // MY_URL = getItem('MY_URL',MY_URL); @@ -504,164 +226,80 @@ function pd2(html,parse,uri){ } const parseTags = { - jsp:{ - pdfh:pdfh2, - pdfa:pdfa2, - pd:pd2, + jsp: { + pdfh: pdfh, + pdfa: pdfa, + pd: pD, }, - json:{ + json: { pdfh(html, parse) { - if (!parse || !parse.trim()){ + if (!parse || !parse.trim()) { return ''; } - if (typeof(html) === 'string'){ - // print('jsonpath:pdfh字符串转dict'); + if (typeof (html) === 'string') { html = JSON.parse(html); } parse = parse.trim(); - if (!parse.startsWith('$.')){ + if (!parse.startsWith('$.')) { parse = '$.' + parse; } parse = parse.split('||'); for (let ps of parse) { let ret = cheerio.jp(ps, html); - if (Array.isArray(ret)){ + if (Array.isArray(ret)) { ret = ret[0] || ''; - } else{ + } else { ret = ret || '' } - if (ret && typeof (ret) !== 'string'){ + if (ret && typeof (ret) !== 'string') { ret = ret.toString(); } - if(ret){ + if (ret) { return ret } } return ''; }, pdfa(html, parse) { - if (!parse || !parse.trim()){ + if (!parse || !parse.trim()) { return ''; } - if (typeof(html) === 'string'){ - // print('jsonpath:pdfa字符串转dict'); + if (typeof (html) === 'string') { html = JSON.parse(html); } parse = parse.trim() - if (!parse.startsWith('$.')){ + if (!parse.startsWith('$.')) { parse = '$.' + parse; } let ret = cheerio.jp(parse, html); - if (Array.isArray(ret) && Array.isArray(ret[0]) && ret.length === 1){ + if (Array.isArray(ret) && Array.isArray(ret[0]) && ret.length === 1) { return ret[0] || [] } return ret || [] }, - pd(html,parse){ - let ret = parseTags.json.pdfh(html,parse); - if(ret){ - return urljoin(MY_URL,ret); + pd(html, parse) { + let ret = parseTags.json.pdfh(html, parse); + if (ret) { + return urljoin(MY_URL, ret); } return ret }, }, - jq:{ - pdfh(html, parse, base_url) { - if (!parse || !parse.trim()) { - return '' - } - let eleFind = typeof html === 'object'; - let option = undefined; - if (eleFind && parse.startsWith('body&&')) { - parse = parse.substr(6); - if (parse.indexOf('&&') < 0) { - option = parse.trim(); - parse = '*=*'; - } - } - if (parse.indexOf('&&') > -1) { - let sp = parse.split('&&'); - option = sp[sp.length - 1]; - sp.splice(sp.length - 1); - if (sp.length > 1) { - for (let i in sp) { - if (!SELECT_REGEX.test(sp[i])) { - sp[i] = sp[i] + ':eq(0)'; - } - } - } else { - if (!SELECT_REGEX.test(sp[0])) { - sp[0] = sp[0] + ':eq(0)'; - } - } - parse = sp.join(' '); - } - let result = ''; - const $ = eleFind ? html.rr : cheerio.load(html); - let ret = eleFind ? ((parse === '*=*' || $(html.ele).is(parse)) ? html.ele : $(html.ele).find(parse)) : $(parse); - if (option) { - if (option === 'Text') { - result = $(ret).text(); - } - else if (option === 'Html') { - result = $(ret).html(); - } - else { - result = $(ret).attr(option); - if(/style/.test(option.toLowerCase())&&/url\(/.test(result)){ - try { - result = result.match(/url\((.*?)\)/)[1]; - }catch (e) {} - } - } - if (result && base_url && DOM_CHECK_ATTR.test(option)) { - if (/http/.test(result)) { - result = result.substr(result.indexOf('http')); - } else { - result = urljoin(base_url, result) - } - } - } else { - result = $(ret).toString(); - } - return result; - }, - pdfa(html, parse) { - if (!parse || !parse.trim()) { - return []; - } - let eleFind = typeof html === 'object'; - if (parse.indexOf('&&') > -1) { - let sp = parse.split('&&'); - for (let i in sp) { - if (!SELECT_REGEX_A.test(sp[i]) && i < sp.length - 1) { - sp[i] = sp[i] + ':eq(0)'; - } - } - parse = sp.join(' '); - } - const $ = eleFind ? html.rr : cheerio.load(html); - let ret = eleFind ? ($(html.ele).is(parse) ? html.ele : $(html.ele).find(parse)) : $(parse); - let result = []; - if (ret) { - ret.each(function (idx, ele) { - result.push({ rr: $, ele: ele }); - }); - } - return result; - }, - pd(html,parse,uri){ + jq: { + pdfh: pdfh, + pdfa: pdfa, + pd(html, parse, uri) { return parseTags.jq.pdfh(html, parse, MY_URL); }, }, - getParse(p0){//非js开头的情况自动获取解析标签 - if(p0.startsWith('jsp:')){ + getParse(p0) {//非js开头的情况自动获取解析标签 + if (p0.startsWith('jsp:')) { return this.jsp - }else if(p0.startsWith('json:')){ + } else if (p0.startsWith('json:')) { return this.json - }else if(p0.startsWith('jq:')){ + } else if (p0.startsWith('jq:')) { return this.jq - }else { + } else { return this.jq } } @@ -669,7 +307,6 @@ const parseTags = { const stringify = JSON.stringify; const jsp = parseTags.jsp; -const jq = parseTags.jq; /*** 后台需要实现的java方法并注入到js中 ***/ @@ -678,8 +315,8 @@ const jq = parseTags.jq; * @param filePath * @returns {string} */ -function readFile(filePath){ - filePath = filePath||'./uri.min.js'; +function readFile(filePath) { + filePath = filePath || 'https://raw.iqiq.io/2hacc/TVBox/main/drpy/lib/uri.min.js'; var fd = os.open(filePath); var buffer = new ArrayBuffer(1024); var len = os.read(fd, buffer, 0, 1024); @@ -696,13 +333,12 @@ function readFile(filePath){ */ function dealJson(html) { try { - // html = html.match(/[\w|\W|\s|\S]*?(\{[\w|\W|\s|\S]*\})/).group[1]; - html = '{'+html.match(/.*?\{(.*)\}/)[1]+'}'; + return html.match(/[\w|\W|\s|\S]*?(\{[\w|\W|\s|\S]*\})/).group[1]; } catch (e) { } try { html = JSON.parse(html); - }catch (e) {} + } catch (e) { } // console.log(typeof(html)); return html; } @@ -711,15 +347,15 @@ function dealJson(html) { * 验证码识别逻辑,需要java实现(js没有bytes类型,无法调用后端的传递图片二进制获取验证码文本的接口) * @type {{api: string, classification: (function(*=): string)}} */ -var OcrApi={ - api:OCR_API, - classification:function (img){ // img是byte类型,这里不方便搞啊 +var OcrApi = { + api: OCR_API, + classification: function (img) { // img是byte类型,这里不方便搞啊 let code = ''; try { - let html = request(this.api,{data:{img:img},headers:{'User-Agent':PC_UA},'method':'POST'},true); + let html = request(this.api, { data: { img: img }, headers: { 'User-Agent': PC_UA }, 'method': 'POST' }); html = JSON.parse(html); - code = html.url||''; - }catch (e) {} + code = html.url || ''; + } catch (e) { } return code } }; @@ -728,44 +364,44 @@ var OcrApi={ * @param url 验证码图片链接 * @returns {string} 验证成功后的cookie */ -function verifyCode(url){ +function verifyCode(url) { let cnt = 0; let host = getHome(url); let cookie = ''; - while (cnt < OCR_RETRY){ - try{ + while (cnt < OCR_RETRY) { + try { // let obj = {headers:headers,timeout:timeout}; let yzm_url = `${host}/index.php/verify/index.html`; console.log(`验证码链接:${yzm_url}`); - let hhtml = request(yzm_url,{withHeaders:true,toBase64:true},true); + let hhtml = request(yzm_url, { withHeaders: true, toBase64: true }); let json = JSON.parse(hhtml); - if(!cookie){ - cookie = json['set-cookie']?json['set-cookie'].split(';')[0]:''; + if (!cookie) { + cookie = json['set-cookie'] ? json['set-cookie'].split(';')[0] : ''; } // console.log(hhtml); - console.log('cookie:'+cookie); + console.log('cookie:' + cookie); let img = json.body; // console.log(img); let code = OcrApi.classification(img); - console.log(`第${cnt+1}次验证码识别结果:${code}`); + console.log(`第${cnt + 1}次验证码识别结果:${code}`); let submit_url = `${host}/index.php/ajax/verify_check?type=search&verify=${code}`; console.log(submit_url); - let html = request(submit_url,{headers:{Cookie:cookie,'User-Agent':MOBILE_UA},'method':'POST'}); + let html = request(submit_url, { headers: { Cookie: cookie, 'User-Agent': MOBILE_UA }, 'method': 'POST' }); // console.log(html); html = JSON.parse(html); - if(html.msg === 'ok'){ - console.log(`第${cnt+1}次验证码提交成功`); + if (html.msg === 'ok') { + console.log(`第${cnt + 1}次验证码提交成功`); return cookie // 需要返回cookie - }else if(html.msg!=='ok'&&cnt+1>=OCR_RETRY){ + } else if (html.msg !== 'ok' && cnt + 1 >= OCR_RETRY) { cookie = ''; // 需要清空返回cookie } - }catch (e) { - console.log(`第${cnt+1}次验证码提交失败:${e.message}`); - if(cnt+1>=OCR_RETRY){ + } catch (e) { + console.log(`第${cnt + 1}次验证码提交失败:${e.message}`); + if (cnt + 1 >= OCR_RETRY) { cookie = ''; } } - cnt+=1 + cnt += 1 } return cookie } @@ -775,8 +411,8 @@ function verifyCode(url){ * @param k 键 * @param v 值 */ -function setItem(k,v){ - local.set(RKEY,k,v); +function setItem(k, v) { + local.set(RKEY, k, v); console.log(`规则${RKEY}设置${k} => ${v}`) } @@ -786,16 +422,16 @@ function setItem(k,v){ * @param v 值 * @returns {*} */ -function getItem(k,v){ - return local.get(RKEY,k) || v; +function getItem(k, v) { + return local.get(RKEY, k) || v; } /** * 删除数据库key对应的一条数据,并清除此key对应的内存缓存 * @param k */ -function clearItem(k){ - local.delete(RKEY,k); +function clearItem(k) { + local.delete(RKEY, k); } /*** js自封装的方法 ***/ @@ -805,15 +441,15 @@ function clearItem(k){ * @param url 任意一个正常完整的Url,自动提取根 * @returns {string} */ -function getHome(url){ - if(!url){ +function getHome(url) { + if (!url) { return '' } let tmp = url.split('//'); url = tmp[0] + '//' + tmp[1].split('/')[0]; try { url = decodeURIComponent(url); - }catch (e) {} + } catch (e) { } return url } @@ -823,21 +459,21 @@ function getHome(url){ * @param obj 参数字典 * @returns {*} */ -function buildUrl(url,obj){ - obj = obj||{}; - if(url.indexOf('?')<0){ +function buildUrl(url, obj) { + obj = obj || {}; + if (url.indexOf('?') < 0) { url += '?' } let param_list = []; let keys = Object.keys(obj); - keys.forEach(it=>{ - param_list.push(it+'='+obj[it]) + keys.forEach(it => { + param_list.push(it + '=' + obj[it]) }); let prs = param_list.join('&'); - if(keys.length > 0 && !url.endsWith('?')){ + if (keys.length > 0 && !url.endsWith('?')) { url += '&' } - url+=prs; + url += prs; return url } @@ -845,90 +481,82 @@ function buildUrl(url,obj){ * 远程依赖执行函数 * @param url 远程js地址 */ -function require(url){ +function require(url) { eval(request(url)); } /** * 海阔网页请求函数完整封装 * @param url 请求链接 * @param obj 请求对象 {headers:{},method:'',timeout:5000,body:'',withHeaders:false} - * @param ocr_flag 标识此flag是用于请求ocr识别的,自动过滤content-type指定编码 * @returns {string|string|DocumentFragment|*} */ -function request(url,obj,ocr_flag){ - ocr_flag = ocr_flag||false; - if(typeof(obj)==='undefined'||!obj||obj==={}){ - if(!fetch_params||!fetch_params.headers){ +function request(url, obj) { + if (typeof (obj) === 'undefined' || !obj || obj === {}) { + if (!fetch_params || !fetch_params.headers) { let headers = { - 'User-Agent':MOBILE_UA, + 'User-Agent': MOBILE_UA, }; - if(rule.headers){ - Object.assign(headers,rule.headers); + if (rule.headers) { + Object.assign(headers, rule.headers); } fetch_params.headers = headers; } - if(!fetch_params.headers.Referer){ + if (!fetch_params.headers.Referer) { fetch_params.headers.Referer = getHome(url) } obj = fetch_params; - }else{ - let headers = obj.headers||{}; - let keys = Object.keys(headers).map(it=>it.toLowerCase()); - if(!keys.includes('user-agent')){ + } else { + let headers = obj.headers || {}; + let keys = Object.keys(headers).map(it => it.toLowerCase()); + if (!keys.includes('user-agent')) { headers['User-Agent'] = MOBILE_UA; - }if(!keys.includes('referer')){ + } if (!keys.includes('referer')) { headers['Referer'] = getHome(url); } obj.headers = headers; } - if(rule.encoding&&rule.encoding!=='utf-8'&&!ocr_flag){ - if(!obj.headers.hasOwnProperty('Content-Type')){ // 手动指定了就不管 - obj.headers["Content-Type"] = 'text/html; charset='+rule.encoding; - } - } - if(typeof(obj.headers.body)!='undefined'&&obj.headers.body&&typeof (obj.headers.body)==='string'){ + console.log(JSON.stringify(obj.headers)); + if (typeof (obj.headers.body) != 'undefined' && obj.headers.body && typeof (obj.headers.body) === 'string') { let data = {}; - obj.headers.body.split('&').forEach(it=>{ + obj.headers.body.split('&').forEach(it => { data[it.split('=')[0]] = it.split('=')[1] }); obj.data = data; delete obj.headers.body } - if(!url){ - return obj.withHeaders?'{}':'' + if (!url) { + return obj.withHeaders ? '{}' : '' } - if(obj.toBase64){ // 返回base64,用于请求图片 + if (obj.toBase64) { // 返回base64,用于请求图片 obj.buffer = 2; delete obj.toBase64 } - console.log(JSON.stringify(obj.headers)); - // console.log('request:'+url+' obj:'+JSON.stringify(obj)); - console.log('request:'+url); + console.log('request:' + url); let res = req(url, obj); - let html = res.content||''; + let html = res.content || ''; // console.log(html); - if(obj.withHeaders){ + if (obj.withHeaders) { let htmlWithHeaders = res.headers; htmlWithHeaders.body = html; return JSON.stringify(htmlWithHeaders); - }else{ + } else { return html } } fetch = request; -print = function (data){ - data = data||''; - if(typeof(data)!=='string'){ +print = function (data) { + data = data || ''; + if (typeof (data) !== 'string') { try { data = JSON.stringify(data); - }catch (e) { - console.log('print:'+e.message) + } catch (e) { + console.log('print:' + e.message) } } console.log(data); } -log = print; +log = console.log; /** * 检查宝塔验证并自动跳过获取正确源码 * @param html 之前获取的html @@ -936,11 +564,11 @@ log = print; * @param obj 来源obj * @returns {string|DocumentFragment|*} */ -function checkHtml(html,url,obj){ - if(/\?btwaf=/.test(html)){ +function checkHtml(html, url, obj) { + if (/\?btwaf=/.test(html)) { let btwaf = html.match(/btwaf(.*?)"/)[1]; - url = url.split('#')[0]+'?btwaf'+btwaf; - html = request(url,obj); + url = url.split('#')[0] + '?btwaf' + btwaf; + html = request(url, obj); } return html } @@ -951,9 +579,9 @@ function checkHtml(html,url,obj){ * @param obj 请求参数 * @returns {string|DocumentFragment} */ -function getCode(url,obj){ - let html = request(url,obj); - html = checkHtml(html,url,obj); +function getCode(url, obj) { + let html = request(url, obj); + html = checkHtml(html, url, obj); return html } @@ -962,20 +590,20 @@ function getCode(url,obj){ * @param url 请求链接 * @returns {string|DocumentFragment} */ -function getHtml(url){ +function getHtml(url) { let obj = {}; - if(rule.headers){ + if (rule.headers) { obj.headers = rule.headers; } - let cookie = getItem(RULE_CK,''); - if(cookie){ - if(obj.headers && ! Object.keys(obj.headers).map(it=>it.toLowerCase()).includes('cookie')){ + let cookie = getItem(RULE_CK, ''); + if (cookie) { + if (obj.headers && !Object.keys(obj.headers).map(it => it.toLowerCase()).includes('cookie')) { obj.headers['Cookie'] = cookie; - }else if(!obj.headers){ - obj.headers = {Cookie:cookie}; + } else if (!obj.headers) { + obj.headers = { Cookie: cookie }; } } - let html = getCode(url,obj); + let html = getCode(url, obj); return html } @@ -1001,27 +629,21 @@ function homeParse(homeObj) { if (homeObj.class_parse) { let p = homeObj.class_parse.split(';'); - let _ps = parseTags.getParse(p[0]); - _pdfa = _ps.pdfa; - _pdfh = _ps.pdfh; - _pd = _ps.pd; - MY_URL = rule.url; - if (p.length >= 3) { // 可以不写正则 + if (p.length >= 4) { try { let html = getHtml(homeObj.MY_URL); if (html) { homeHtmlCache = html; - let list = _pdfa(html, p[0]); + let list = pdfa(html, p[0]); if (list && list.length > 0) { - list.forEach((it,idex) => { + list.forEach((it, idex) => { try { - let name = _pdfh(it, p[1]); + let name = pdfh(it, p[1]); if (homeObj.cate_exclude && (new RegExp(homeObj.cate_exclude).test(name))) { return; } - // let url = pdfh(it, p[2]); - let url = _pd(it, p[2]); - if (p.length > 3 && p[3]) { + let url = pdfh(it, p[2]); + if (p[3]) { let exp = new RegExp(p[3]); url = url.match(exp)[1]; } @@ -1043,11 +665,11 @@ function homeParse(homeObj) { } } // 排除分类 - classes = classes.filter(it=>!homeObj.cate_exclude || !(new RegExp(homeObj.cate_exclude).test(it.type_name))); + classes = classes.filter(it => !homeObj.cate_exclude || !(new RegExp(homeObj.cate_exclude).test(it.type_name))); let resp = { 'class': classes }; - if(homeObj.filter){ + if (homeObj.filter) { resp.filters = homeObj.filter; } console.log(JSON.stringify(resp)); @@ -1055,71 +677,51 @@ function homeParse(homeObj) { } -/** - * 推荐和搜索单字段继承一级 - * @param p 推荐或搜索的解析分割;列表 - * @param pn 自身列表序号 - * @param pp 一级解析分割;列表 - * @param ppn 继承一级序号 - * @returns {*} - */ -function getPP(p, pn, pp, ppn){ - let ps = p[pn] === '*' && pp.length > ppn ?pp[ppn]:p[pn] - return ps -} - /** * 首页推荐列表解析 * @param homeVodObj * @returns {string} */ -function homeVodParse(homeVodObj){ +function homeVodParse(homeVodObj) { fetch_params = JSON.parse(JSON.stringify(rule_fetch_params)); let d = []; MY_URL = homeVodObj.homeUrl; // setItem('MY_URL',MY_URL); console.log(MY_URL); let p = homeVodObj.推荐; - if(p==='*' && rule.一级){ - p = rule.一级; - homeVodObj.double = false; - } - if(!p||typeof(p)!=='string'){ + if (!p || typeof (p) !== 'string') { return '{}' } p = p.trim(); - let pp = rule.一级.split(';'); - if(p.startsWith('js:')){ + if (p.startsWith('js:')) { const TYPE = 'home'; var input = MY_URL; const HOST = rule.host; - eval(p.replace('js:','')); + eval(p.replace('js:', '')); d = VODS; - }else { + } else { p = p.split(';'); if (!homeVodObj.double && p.length < 5) { return '{}' } else if (homeVodObj.double && p.length < 6) { return '{}' } - let p0 = getPP(p,0,pp,0) - let _ps = parseTags.getParse(p0); + let _ps = parseTags.getParse(p[0]); _pdfa = _ps.pdfa; _pdfh = _ps.pdfh; _pd = _ps.pd; - let is_json = p0.startsWith('json:'); - p0 = p0.replace(/^(jsp:|json:|jq:)/,''); + let is_json = p[0].startsWith('json:'); + p[0] = p[0].replace(/^(jsp:|json:|jq:)/, ''); // print(p[0]); let html = homeHtmlCache || getHtml(MY_URL); homeHtmlCache = undefined; - if(is_json){ - // print('是json,开始处理'); + if (is_json) { html = dealJson(html); } try { console.log('double:' + homeVodObj.double); if (homeVodObj.double) { - let items = _pdfa(html, p0); + let items = _pdfa(html, p[0]); // console.log(items.length); for (let item of items) { // console.log(p[1]); @@ -1127,84 +729,53 @@ function homeVodParse(homeVodObj){ // console.log(items2.length); for (let item2 of items2) { try { - let p2 = getPP(p,2,pp,1); - let title = _pdfh(item2, p2); + let title = _pdfh(item2, p[2]); let img = ''; try { - let p3 = getPP(p,3,pp,2); - img = _pd(item2, p3); - } catch (e) {} - let desc = ''; - try { - let p4 = getPP(p,4,pp,3); - desc = _pdfh(item2, p4); - }catch (e) {} - let p5 = getPP(p,5,pp,4); + img = _pd(item2, p[3]) + } catch (e) { + } + let desc = _pdfh(item2, p[4]); let links = []; - for (let _p5 of p5.split('+')) { - let link = !homeVodObj.detailUrl ? _pd(item2, _p5, MY_URL) : _pdfh(item2, _p5); + for (let p5 of p[5].split('+')) { + let link = !homeVodObj.detailUrl ? _pd(item2, p5, MY_URL) : _pdfh(item2, p5); links.push(link); } - let content; - if(p.length > 6 && p[6]){ - let p6 = getPP(p,6,pp,5); - content = _pdfh(item2, p6); - } else{ - content = ''; - } let vod = { vod_name: title, vod_pic: img, vod_remarks: desc, - vod_content: content, vod_id: links.join('$') }; // print(vod); d.push(vod); } catch (e) { - console.log('首页列表处理发生错误:'+e.message); + console.log('首页列表处理发生错误:' + e.message); } } - - } - - } else { - let items = _pdfa(html, p0); + let items = _pdfa(html, p[0]); for (let item of items) { try { - let p1 = getPP(p,1,pp,1); - let title = _pdfh(item, p1); + let title = _pdfh(item, p[1]); let img = ''; try { - let p2 = getPP(p,2,pp,2); - img = _pd(item, p2, MY_URL); - } catch (e) {} - let desc = ''; - try { - let p3 = getPP(p,3,pp,3); - desc = _pdfh(item, p3); - }catch (e) {} - let p4 = getPP(p,4,pp,4); + img = _pd(item, p[2], MY_URL); + } catch (e) { + + } + let desc = _pdfh(item, p[3]); let links = []; - for (let _p5 of p4.split('+')) { - let link = !homeVodObj.detailUrl ? _pd(item, _p5, MY_URL) : _pdfh(item, _p5); + for (let p5 of p[4].split('+')) { + let link = !homeVodObj.detailUrl ? _pd(item, p5, MY_URL) : _pdfh(item, p5); links.push(link); } - let content; - if(p.length > 5 && p[5]){ - let p5 = getPP(p,5,pp,5); - content = _pdfh(item, p5); - }else{ - content = '' - } let vod = { vod_name: title, vod_pic: img, vod_remarks: desc, - vod_content: content, vod_id: links.join('$') }; d.push(vod); @@ -1223,7 +794,7 @@ function homeVodParse(homeVodObj){ } // console.log(JSON.stringify(d)); return JSON.stringify({ - list:d + list: d }) } @@ -1235,63 +806,60 @@ function homeVodParse(homeVodObj){ function categoryParse(cateObj) { fetch_params = JSON.parse(JSON.stringify(rule_fetch_params)); let p = cateObj.一级; - if(!p||typeof(p)!=='string'){ + if (!p || typeof (p) !== 'string') { return '{}' } let d = []; // let url = cateObj.url.replaceAll('fyclass', cateObj.tid).replaceAll('fypage', cateObj.pg); let url = cateObj.url.replaceAll('fyclass', cateObj.tid); - if(rule.filter_url){ - if(!/fyfilter/.test(url)){ - if(!url.endsWith('&')&&!rule.filter_url.startsWith('&')){ - url+='&' + if (rule.filter_url) { + if (!/fyfilter/.test(url)) { + if (!url.endsWith('&') && !rule.filter_url.startsWith('&')) { + url += '&' } - url+=rule.filter_url; - }else{ + url += rule.filter_url; + } else { url = url.replace('fyfilter', rule.filter_url); } // console.log('filter:'+cateObj.filter); - let fl = cateObj.filter?cateObj.extend:{}; + let fl = cateObj.filter ? cateObj.extend : {}; let new_url; - new_url = cheerio.jinja2(url,{fl:fl}); - // console.log('jinjia2执行后的new_url类型为:'+typeof(new_url)); - if(/object Object/.test(new_url)){ - new_url = drT.renderText(url,fl); - } + new_url = cheerio.jinja2(url, { fl: fl }); + // if (/object Object/.test(new_url)) { + // new_url = drT.renderText(url, fl); + // } url = new_url; } - if(/fypage/.test(url)){ - if(url.includes('(')&&url.includes(')')){ + if (/fypage/.test(url)) { + if (url.includes('(') && url.includes(')')) { let url_rep = url.match(/.*?\((.*)\)/)[1]; // console.log(url_rep); let cnt_page = url_rep.replaceAll('fypage', cateObj.pg); // console.log(cnt_page); let cnt_pg = eval(cnt_page); // console.log(cnt_pg); - url = url.replaceAll(url_rep,cnt_pg).replaceAll('(','').replaceAll(')',''); - }else{ - url = url.replaceAll('fypage',cateObj.pg); + url = url.replaceAll(url_rep, cnt_pg).replaceAll('(', '').replaceAll(')', ''); + } else { + url = url.replaceAll('fypage', cateObj.pg); } } - if(cateObj.pg === 1 && url.includes('[')&&url.includes(']')){ + if (cateObj.pg === 1 && url.includes('[') && url.includes(']')) { url = url.split('[')[1].split(']')[0]; - }else if(cateObj.pg > 1 && url.includes('[')&&url.includes(']')){ - url = url.split('[')[0]; } MY_URL = url; // setItem('MY_URL',MY_URL); console.log(MY_URL); p = p.trim(); const MY_CATE = cateObj.tid; - if(p.startsWith('js:')){ + if (p.startsWith('js:')) { var MY_FL = cateObj.extend; const TYPE = 'cate'; var input = MY_URL; const MY_PAGE = cateObj.pg; var desc = ''; - eval(p.trim().replace('js:','')); + eval(p.trim().replace('js:', '')); d = VODS; - }else { + } else { p = p.split(';'); if (p.length < 5) { return '{}' @@ -1301,25 +869,25 @@ function categoryParse(cateObj) { _pdfh = _ps.pdfh; _pd = _ps.pd; let is_json = p[0].startsWith('json:'); - p[0] = p[0].replace(/^(jsp:|json:|jq:)/,''); + p[0] = p[0].replace(/^(jsp:|json:|jq:)/, ''); try { let html = getHtml(MY_URL); if (html) { - if(is_json){ + if (is_json) { html = dealJson(html); } let list = _pdfa(html, p[0]); list.forEach(it => { - let links = p[4].split('+').map(p4=>{ - return !rule.detailUrl?_pd(it, p4,MY_URL):_pdfh(it, p4); + let links = p[4].split('+').map(p4 => { + return !rule.detailUrl ? _pd(it, p4, MY_URL) : _pdfh(it, p4); }); let link = links.join('$'); - let vod_id = rule.detailUrl?MY_CATE+'$'+link:link; + let vod_id = rule.detailUrl ? MY_CATE + '$' + link : link; d.push({ 'vod_id': vod_id, - 'vod_name': _pdfh(it, p[1]).replace(/\n|\t/g,'').trim(), - 'vod_pic': _pd(it, p[2],MY_URL), - 'vod_remarks': _pdfh(it, p[3]).replace(/\n|\t/g,'').trim(), + 'vod_name': _pdfh(it, p[1]).replace(/\n|\t/g, '').trim(), + 'vod_pic': _pd(it, p[2], MY_URL), + 'vod_remarks': _pdfh(it, p[3]).replace(/\n|\t/g, '').trim(), }); }); } @@ -1328,7 +896,7 @@ function categoryParse(cateObj) { } } // print(d); - return d.length<1?'{}':JSON.stringify({ + return d.length < 1 ? '{}' : JSON.stringify({ 'page': parseInt(cateObj.pg), 'pagecount': 999, 'limit': 20, @@ -1345,94 +913,82 @@ function categoryParse(cateObj) { function searchParse(searchObj) { fetch_params = JSON.parse(JSON.stringify(rule_fetch_params)); let d = []; - if(!searchObj.searchUrl){ + if (!searchObj.searchUrl) { return '{}' } - let p = searchObj.搜索==='*'&&rule.一级 ? rule.一级 : searchObj.搜索; - if(!p||typeof(p)!=='string'){ + let p = searchObj.搜索 === '*' && rule.一级 ? rule.一级 : searchObj.搜索; + if (!p || typeof (p) !== 'string') { return '{}' } p = p.trim(); - let pp = rule.一级.split(';'); let url = searchObj.searchUrl.replaceAll('**', searchObj.wd).replaceAll('fypage', searchObj.pg); MY_URL = url; console.log(MY_URL); - // log(searchObj.搜索); // setItem('MY_URL',MY_URL); - if(p.startsWith('js:')){ + if (p.startsWith('js:')) { const TYPE = 'search'; const MY_PAGE = searchObj.pg; const KEY = searchObj.wd; var input = MY_URL; - var detailUrl = rule.detailUrl||''; - eval(p.trim().replace('js:','')); + var detailUrl = rule.detailUrl || ''; + eval(p.trim().replace('js:', '')); d = VODS; - }else{ + } else { p = p.split(';'); if (p.length < 5) { return '{}' } - let p0 = getPP(p,0,pp,0); - let _ps = parseTags.getParse(p0); + let _ps = parseTags.getParse(p[0]); _pdfa = _ps.pdfa; _pdfh = _ps.pdfh; _pd = _ps.pd; - let is_json = p0.startsWith('json:'); - p0 = p0.replace(/^(jsp:|json:|jq:)/,''); - // print('1381 p0:'+p0); + let is_json = p[0].startsWith('json:'); + p[0] = p[0].replace(/^(jsp:|json:|jq:)/, ''); try { let html = getHtml(MY_URL); if (html) { - if(/系统安全验证|输入验证码/.test(html)){ + if (/系统安全验证|输入验证码/.test(html)) { let cookie = verifyCode(MY_URL); - if(cookie){ + if (cookie) { console.log(`本次成功过验证,cookie:${cookie}`); - setItem(RULE_CK,cookie); - }else{ + setItem(RULE_CK, cookie); + } else { console.log(`本次自动过搜索验证失败,cookie:${cookie}`); } // obj.headers['Cookie'] = cookie; html = getHtml(MY_URL); } - if(!html.includes(searchObj.wd)){ + if (!html.includes(searchObj.wd)) { console.log('搜索结果源码未包含关键字,疑似搜索失败,正为您打印结果源码'); console.log(html); } - if(is_json){ + if (is_json) { html = dealJson(html); } - let list = _pdfa(html, p0); + let list = _pdfa(html, p[0]); list.forEach(it => { - let p1 = getPP(p, 1, pp, 1); - let p2 = getPP(p, 2, pp, 2); - let p3 = getPP(p, 3, pp, 3); - let p4 = getPP(p, 4, pp, 4); - let links = p4.split('+').map(_p4=>{ - return !rule.detailUrl?_pd(it, _p4,MY_URL):_pdfh(it, _p4) + let links = p[4].split('+').map(p4 => { + return !rule.detailUrl ? _pd(it, p4, MY_URL) : _pdfh(it, p4) }); + let link = links.join('$'); - let content; - if(p.length > 5 && p[5]){ - let p5 = getPP(p,5,pp,5); - content = _pdfh(it, p5); - }else{ - content = ''; - } let ob = { 'vod_id': link, - 'vod_name': _pdfh(it, p1).replace(/\n|\t/g,'').trim(), - 'vod_pic': _pd(it, p2,MY_URL), - 'vod_remarks': _pdfh(it, p3).replace(/\n|\t/g,'').trim(), - 'vod_content': content.replace(/\n|\t/g,'').trim(), + 'vod_name': _pdfh(it, p[1]).replace(/\n|\t/g, '').trim(), + 'vod_pic': _pd(it, p[2], MY_URL), + 'vod_remarks': _pdfh(it, p[3]).replace(/\n|\t/g, '').trim(), }; + if (p.length > 5 && p[5]) { + ob.vod_content = _pdfh(it, p[5]); + } d.push(ob); }); } } catch (e) { - print('搜索发生错误:'+e.message); return '{}' } + } return JSON.stringify({ 'page': parseInt(searchObj.pg), @@ -1448,7 +1004,7 @@ function searchParse(searchObj) { * @param detailObj * @returns {string} */ -function detailParse(detailObj){ +function detailParse(detailObj) { fetch_params = JSON.parse(JSON.stringify(rule_fetch_params)); let vod = { vod_id: detailObj.orId, //"id", @@ -1467,37 +1023,37 @@ function detailParse(detailObj){ let detailUrl = detailObj.detailUrl; let fyclass = detailObj.fyclass; let tab_exclude = detailObj.tab_exclude; - let html = detailObj.html||''; + let html = detailObj.html || ''; MY_URL = url; console.log(MY_URL); // setItem('MY_URL',MY_URL); - if(p==='*'){ + if (p === '*') { vod.vod_play_from = '道长在线'; vod.vod_remarks = detailUrl; vod.vod_actor = '没有二级,只有一级链接直接嗅探播放'; vod.vod_content = MY_URL; vod.vod_play_url = '嗅探播放$' + MY_URL; - }else if(typeof(p)==='string'&&p.trim().startsWith('js:')){ + } else if (typeof (p) === 'string' && p.trim().startsWith('js:')) { const TYPE = 'detail'; var input = MY_URL; - eval(p.trim().replace('js:','')); + eval(p.trim().replace('js:', '')); vod = VOD; console.log(JSON.stringify(vod)); - }else if(p&&typeof(p)==='object'){ - if(!html){ + } else if (p && typeof (p) === 'object') { + if (!html) { html = getHtml(MY_URL); } let _impJQP = true; let _ps; - if(p.is_json){ + if (p.is_json) { _ps = parseTags.json; html = dealJson(html); _impJQP = false; - }else if(p.is_jsp){ + } else if (p.is_jsp) { _ps = parseTags.jsp; - }else if(p.is_jq){ + } else if (p.is_jq) { _ps = parseTags.jq; - }else{ + } else { _ps = parseTags.jq; } if (_impJQP) { @@ -1507,127 +1063,105 @@ function detailParse(detailObj){ _pdfa = _ps.pdfa; _pdfh = _ps.pdfh; _pd = _ps.pd; - if(p.title){ + if (p.title) { let p1 = p.title.split(';'); - vod.vod_name = _pdfh(html, p1[0]).replace(/\n|\t/g,'').trim(); - let type_name = p1.length > 1 ? _pdfh(html, p1[1]).replace(/\n|\t/g,'').replace(/ /g,'').trim():''; - vod.type_name = type_name||vod.type_name; + vod.vod_name = _pdfh(html, p1[0]).replace(/\n|\t/g, '').trim(); + let type_name = p1.length > 1 ? _pdfh(html, p1[1]).replace(/\n|\t/g, '').replace(/ /g, '').trim() : ''; + vod.type_name = type_name || vod.type_name; } - if(p.desc){ - try{ + if (p.desc) { + try { let p1 = p.desc.split(';'); - vod.vod_remarks = _pdfh(html, p1[0]).replace(/\n|\t/g,'').trim(); - vod.vod_year = p1.length > 1 ? _pdfh(html, p1[1]).replace(/\n|\t/g,'').trim():''; - vod.vod_area = p1.length > 2 ? _pdfh(html, p1[2]).replace(/\n|\t/g,'').trim():''; + vod.vod_remarks = _pdfh(html, p1[0]).replace(/\n|\t/g, '').trim(); + vod.vod_year = p1.length > 1 ? _pdfh(html, p1[1]).replace(/\n|\t/g, '').trim() : ''; + vod.vod_area = p1.length > 2 ? _pdfh(html, p1[2]).replace(/\n|\t/g, '').trim() : ''; // vod.vod_actor = p1.length > 3 ? _pdfh(html, p1[3]).replaceAll('\n', ' ').trim():''; - vod.vod_actor = p1.length > 3 ? _pdfh(html, p1[3]).replace(/\n|\t/g,'').trim():''; - vod.vod_director = p1.length > 4 ? _pdfh(html, p1[4]).replace(/\n|\t/g,'').trim():''; + vod.vod_actor = p1.length > 3 ? _pdfh(html, p1[3]).replace(/\n|\t/g, '').trim() : ''; + vod.vod_director = p1.length > 4 ? _pdfh(html, p1[4]).replace(/\n|\t/g, '').trim() : ''; } catch (e) { } } - if(p.content){ - try{ + if (p.content) { + try { let p1 = p.content.split(';'); - vod.vod_content = _pdfh(html, p1[0]).replace(/\n|\t/g,'').trim(); + vod.vod_content = _pdfh(html, p1[0]).replace(/\n|\t/g, '').trim(); } - catch (e) {} + catch (e) { } } - if(p.img){ - try{ + if (p.img) { + try { let p1 = p.img.split(';'); - vod.vod_pic = _pd(html, p1[0],MY_URL); + vod.vod_pic = _pd(html, p1[0], MY_URL); } - catch (e) {} + catch (e) { } } let vod_play_from = '$$$'; let playFrom = []; - if(p.重定向&&p.重定向.startsWith('js:')){ - print('开始执行重定向代码:'+p.重定向); - html = eval(p.重定向.replace('js:','')); + if (p.重定向 && p.重定向.startsWith('js:')) { + html = eval(p.重定向.replace('js:', '')); if (_impJQP) { let c$ = cheerio.load(html); html = { rr: c$, ele: c$('html')[0] } } } - -// console.log(2); - if(p.tabs){ - if(p.tabs.startsWith('js:')){ - print('开始执行tabs代码:'+p.tabs); - if(html&&typeof (html)!=='string'){ - html = html.rr(html.ele).toString(); - } - var input = MY_URL; - eval(p.tabs.replace('js:','')); - playFrom = TABS; - }else{ - let p_tab = p.tabs.split(';')[0]; - console.log(p_tab); - let vHeader = _pdfa(html, p_tab); - - console.log(vHeader.length); - for(let v of vHeader){ - let v_title = _pdfh(v,'body&&Text').trim(); - console.log(v_title); - if(tab_exclude&& (new RegExp(tab_exclude)).test(v_title)){ - continue; - } - playFrom.push(v_title); + + // console.log(2); + if (p.tabs) { + let p_tab = p.tabs.split(';')[0]; + console.log(p_tab); + let vHeader = _pdfa(html, p_tab); + + console.log(vHeader.length); + for (let v of vHeader) { + let v_title = _pdfh(v, 'body&&Text'); + console.log(v_title); + if (tab_exclude && (new RegExp(tab_exclude)).test(v_title)) { + continue; } + playFrom.push(v_title); } console.log(JSON.stringify(playFrom)); - }else{ + } else { playFrom = ['道长在线'] } vod.vod_play_from = playFrom.join(vod_play_from); -// console.log(3); + // console.log(3); let vod_play_url = '$$$'; let vod_tab_list = []; - if(p.lists){ - if(p.lists.startsWith('js:')){ - print('开始执行lists代码:'+p.lists); - if(html&&typeof (html)!=='string'){ - html = html.rr(html.ele).toString(); + if (p.lists) { + for (let i = 0; i < playFrom.length; i++) { + let tab_name = playFrom[i]; + let tab_ext = p.tabs.split(';').length > 1 ? p.tabs.split(';')[1] : ''; + let p1 = p.lists.replaceAll('#idv', tab_name).replaceAll('#id', i); + tab_ext = tab_ext.replaceAll('#idv', tab_name).replaceAll('#id', i); + console.log(p1); + // console.log(html); + let vodList = []; + try { + vodList = _pdfa(html, p1); + console.log('len(vodList):' + vodList.length); + } catch (e) { + // console.log(e.message); } - var input = MY_URL; - eval(p.lists.replace('js:','')); - vod_play_url = LISTS.map(it=>it.join('#')).join(vod_play_url); - }else{ - for(let i=0;i 1 ? p.tabs.split(';')[1] : ''; - let p1 = p.lists.replaceAll('#idv', tab_name).replaceAll('#id', i); - tab_ext = tab_ext.replaceAll('#idv', tab_name).replaceAll('#id', i); - console.log(p1); - // console.log(html); - let vodList = []; - try { - vodList = _pdfa(html, p1); - console.log('len(vodList):'+vodList.length); - }catch (e) { - // console.log(e.message); - } - let new_vod_list = []; - let tabName = tab_ext?_pdfh(html, tab_ext):tab_name; - console.log(tabName); - // console.log('cheerio解析Text'); - vodList.forEach(it=>{ - // 请注意,这里要固定pdfh解析body&&Text,不需要下划线,没写错 - // new_vod_list.push(pdfh(it,'body&&Text')+'$'+_pd(it,'a&&href',MY_URL)); - // new_vod_list.push(cheerio.load(it).text()+'$'+_pd(it,'a&&href',MY_URL)); - new_vod_list.push(_pdfh(it, 'body&&Text').trim() + '$' + _pd(it, 'a&&href', MY_URL)); - }); - let vlist = new_vod_list.join('#'); - vod_tab_list.push(vlist); - } - vod_play_url = vod_tab_list.join(vod_play_url); + let new_vod_list = []; + let tabName = tab_ext ? _pdfh(html, tab_ext) : tab_name; + console.log(tabName); + // console.log('cheerio解析Text'); + vodList.forEach(it => { + // 请注意,这里要固定pdfh解析body&&Text,不需要下划线,没写错 + // new_vod_list.push(pdfh(it,'body&&Text')+'$'+_pd(it,'a&&href',MY_URL)); + // new_vod_list.push(cheerio.load(it).text() + '$' + _pd(it, 'a&&href', MY_URL)); + new_vod_list.push(_pdfh(it, 'body&&Text') + '$' + _pd(it, 'a&&href', MY_URL)); + }); + let vlist = new_vod_list.join('#'); + vod_tab_list.push(vlist); } } - vod.vod_play_url = vod_play_url; + vod.vod_play_url = vod_tab_list.join(vod_play_url); } // print(vod); return JSON.stringify({ @@ -1635,58 +1169,44 @@ function detailParse(detailObj){ }) } -/** - * 判断是否需要解析 - * @param url - * @returns {number|number} - */ -function tellIsJx(url){ - try { - let is_vip = !/\.(m3u8|mp4|m4a)$/.test(url.split('?')[0]) && 是否正版(url); - return is_vip?1:0 - }catch (e) { - return 1 - } -} /** * 选集播放点击事件解析 * @param playObj * @returns {string} */ -function playParse(playObj){ +function playParse(playObj) { fetch_params = JSON.parse(JSON.stringify(rule_fetch_params)); MY_URL = playObj.url; - if(!/http/.test(MY_URL)){ + if (!/http/.test(MY_URL)) { try { MY_URL = base64Decode(MY_URL); - }catch (e) {} + } catch (e) { } } MY_URL = decodeURIComponent(MY_URL); var input = MY_URL;//注入给免嗅js let common_play = { - parse:1, - url:input, - jx:tellIsJx(input) + parse: 1, + url: input }; let lazy_play; - if(!rule.play_parse||!rule.lazy){ - lazy_play = common_play; - }else if(rule.play_parse&&rule.lazy&&typeof(rule.lazy)==='string'){ + if (!rule.play_parse || !rule.lazy) { + lazy_play = common_play; + } else if (rule.play_parse && rule.lazy && typeof (rule.lazy) === 'string') { try { - let lazy_code = rule.lazy.replace('js:','').trim(); - print('开始执行js免嗅=>'+lazy_code); + let lazy_code = rule.lazy.replace('js:', '').trim(); + print('开始执行js免嗅=>' + lazy_code); eval(lazy_code); - lazy_play = typeof(input) === 'object'?input:{ - parse:1, - jx:tellIsJx(input), - url:input + lazy_play = typeof (input) === 'object' ? input : { + parse: 1, + jx: 1, + url: input }; - }catch (e) { - print('js免嗅错误:'+e.message); - lazy_play = common_play; + } catch (e) { + print('js免嗅错误:' + e.message); + lazy_play = common_play; } - }else{ - lazy_play = common_play; + } else { + lazy_play = common_play; } console.log(JSON.stringify(lazy_play)); return JSON.stringify(lazy_play); @@ -1696,83 +1216,82 @@ function playParse(playObj){ * js源预处理特定返回对象中的函数 * @param ext */ - function init(ext) { +function init(ext) { console.log('init'); try { - // make shared jsContext happy muban不能import,不然会造成换源继承后变量被篡改 + // make shared jsContext happy if (typeof (globalThis.mubanJs) === 'undefined') { - let mubanJs = request('https://raw.iqiq.io/2hacc/TVBox/main/drpy/js/模板.js', { 'User-Agent': MOBILE_UA }); + // let mubanJs = request('https://gitcode.net/qq_32394351/dr_py/-/raw/master/js/模板.js', { 'User-Agent': MOBILE_UA }); 原始地址 + let mubanJs = request('https://raw.iqiq.io/2hacc/TVBox/main/drpy/lib/模板.js', { 'User-Agent': MOBILE_UA }); mubanJs = mubanJs.replace('export default', '(function() {return muban;}()) // export default'); - // console.log(mubanJs); globalThis.mubanJs = mubanJs; } let muban = eval(globalThis.mubanJs); - if (typeof ext == 'object'){ + if (typeof ext == 'object') { rule = ext; + if (rule.template) { + rule = Object.assign(muban[rule.template], rule); + } } else if (typeof ext == 'string') { if (ext.startsWith('http')) { - let js = request(ext,{'method':'GET'}); - if (js){ + let js = request(ext, { 'method': 'GET' }); + if (js) { eval(js.replace('var rule', 'rule')); } - } + } } else { eval(ext.replace('var rule', 'rule')); } - if (rule.模板 && muban.hasOwnProperty(rule.模板)) { - print('继承模板:'+rule.模板); - rule = Object.assign(muban[rule.模板], rule); - } /** 处理一下 rule规则关键字段没传递的情况 **/ - let rule_cate_excludes = (rule.cate_exclude||'').split('|').filter(it=>it.trim()); - let rule_tab_excludes = (rule.tab_exclude||'').split('|').filter(it=>it.trim()); - rule_cate_excludes = rule_cate_excludes.concat(CATE_EXCLUDE.split('|').filter(it=>it.trim())); - rule_tab_excludes = rule_tab_excludes.concat(TAB_EXCLUDE.split('|').filter(it=>it.trim())); + let rule_cate_excludes = (rule.cate_exclude || '').split('|').filter(it => it.trim()); + let rule_tab_excludes = (rule.tab_exclude || '').split('|').filter(it => it.trim()); + rule_cate_excludes = rule_cate_excludes.concat(CATE_EXCLUDE.split('|').filter(it => it.trim())); + rule_tab_excludes = rule_tab_excludes.concat(TAB_EXCLUDE.split('|').filter(it => it.trim())); rule.cate_exclude = rule_cate_excludes.join('|'); rule.tab_exclude = rule_tab_excludes.join('|'); - rule.host = (rule.host||'').rstrip('/'); - rule.url = rule.url||''; - rule.double = rule.double||false; - rule.homeUrl = rule.homeUrl||''; - rule.detailUrl = rule.detailUrl||''; - rule.searchUrl = rule.searchUrl||''; - rule.homeUrl = rule.host&&rule.homeUrl?urljoin(rule.host,rule.homeUrl):(rule.homeUrl||rule.host); - rule.detailUrl = rule.host&&rule.detailUrl?urljoin(rule.host,rule.detailUrl):rule.detailUrl; - if(rule.url.includes('[')&&rule.url.includes(']')){ + rule.host = (rule.host || '').rstrip('/'); + rule.url = rule.url || ''; + rule.double = rule.double || false; + rule.homeUrl = rule.homeUrl || ''; + rule.detailUrl = rule.detailUrl || ''; + rule.searchUrl = rule.searchUrl || ''; + rule.homeUrl = rule.host && rule.homeUrl ? urljoin(rule.host, rule.homeUrl) : (rule.homeUrl || rule.host); + rule.detailUrl = rule.host && rule.detailUrl ? urljoin(rule.host, rule.detailUrl) : rule.detailUrl; + if (rule.url.includes('[') && rule.url.includes(']')) { let u1 = rule.url.split('[')[0] let u2 = rule.url.split('[')[1].split(']')[0] - rule.url = rule.host && rule.url?urljoin(rule.host,u1)+'['+urljoin(rule.host,u2)+']':rule.url; - }else{ - rule.url = rule.host && rule.url ? urljoin(rule.host,rule.url) : rule.url; + rule.url = rule.host && rule.url ? urljoin(rule.host, u1) + '[' + urljoin(rule.host, u2) + ']' : rule.url; + } else { + rule.url = rule.host && rule.url ? urljoin(rule.host, rule.url) : rule.url; } - rule.searchUrl = rule.host && rule.searchUrl ? urljoin(rule.host,rule.searchUrl) : rule.searchUrl; + rule.searchUrl = rule.host && rule.searchUrl ? urljoin(rule.host, rule.searchUrl) : rule.searchUrl; - rule.timeout = rule.timeout||5000; - rule.encoding = rule.编码||rule.encoding||'utf-8'; - if(rule.headers && typeof(rule.headers) === 'object'){ + rule.timeout = rule.timeout || 5000; + rule.encoding = rule.编码 || rule.encoding || 'utf-8'; + if (rule.headers && typeof (rule.headers) === 'object') { try { let header_keys = Object.keys(rule.headers); - for(let k of header_keys){ - if(k.toLowerCase() === 'user-agent'){ + for (let k of header_keys) { + if (k.toLowerCase() === 'user-agent') { let v = rule.headers[k]; console.log(v); - if(['MOBILE_UA','PC_UA','UC_UA','IOS_UA','UA'].includes(v)){ + if (['MOBILE_UA', 'PC_UA', 'UC_UA', 'IOS_UA', 'UA'].includes(v)) { rule.headers[k] = eval(v); } } } - }catch (e) { - console.log('处理headers发生错误:'+e.message); + } catch (e) { + console.log('处理headers发生错误:' + e.message); } } // print(rule.headers); - rule_fetch_params = {'headers': rule.headers||false, 'timeout': rule.timeout, 'encoding': rule.encoding}; - oheaders = rule.headers||{}; - RKEY = typeof(key)!=='undefined'&&key?key:'drpy_' + (rule.title || rule.host); + rule_fetch_params = { 'headers': rule.headers || false, 'timeout': rule.timeout, 'encoding': rule.encoding }; + oheaders = rule.headers || {}; + RKEY = typeof (key) !== 'undefined' && key ? key : 'drpy_' + (rule.title || rule.host); init_test(); - }catch (e) { - console.log('init_test发生错误:'+e.message); + } catch (e) { + console.log('init_test发生错误:' + e.message); } } @@ -1786,7 +1305,7 @@ let homeHtmlCache = undefined; function home(filter) { console.log("home"); let homeObj = { - filter:rule.filter||false, + filter: rule.filter || false, MY_URL: rule.homeUrl, class_name: rule.class_name || '', class_url: rule.class_url || '', @@ -1803,10 +1322,10 @@ function home(filter) { */ function homeVod(params) { let homeVodObj = { - 推荐:rule.推荐, - double:rule.double, - homeUrl:rule.homeUrl, - detailUrl:rule.detailUrl + 推荐: rule.推荐, + double: rule.double, + homeUrl: rule.homeUrl, + detailUrl: rule.detailUrl }; return homeVodParse(homeVodObj) // return "{}"; @@ -1841,27 +1360,27 @@ function category(tid, pg, filter, extend) { function detail(vod_url) { let orId = vod_url; let fyclass = ''; - if(vod_url.indexOf('$')>-1){ + if (vod_url.indexOf('$') > -1) { let tmp = vod_url.split('$'); fyclass = tmp[0]; vod_url = tmp[1]; } let detailUrl = vod_url; let url; - if(!detailUrl.startsWith('http')&&!detailUrl.includes('/')){ - url = rule.detailUrl.replaceAll('fyid', detailUrl).replaceAll('fyclass',fyclass); - }else if(detailUrl.includes('/')){ - url = urljoin(rule.homeUrl,detailUrl); - }else{ + if (!detailUrl.startsWith('http') && !detailUrl.includes('/')) { + url = rule.detailUrl.replaceAll('fyid', detailUrl).replaceAll('fyclass', fyclass); + } else if (detailUrl.includes('/')) { + url = urljoin(rule.homeUrl, detailUrl); + } else { url = detailUrl } let detailObj = { orId: orId, - url:url, - 二级:rule.二级, - detailUrl:detailUrl, - fyclass:fyclass, - tab_exclude:rule.tab_exclude, + url: url, + 二级: rule.二级, + detailUrl: detailUrl, + fyclass: fyclass, + tab_exclude: rule.tab_exclude, } return detailParse(detailObj) } @@ -1875,9 +1394,9 @@ function detail(vod_url) { */ function play(flag, id, flags) { let playObj = { - url:id, - flag:flag, - flags:flags + url: id, + flag: flag, + flags: flags } return playParse(playObj); } @@ -1901,7 +1420,7 @@ function search(wd, quick) { return searchParse(searchObj) } -function DRPY(){//导出函数 +function DRPY() {//导出函数 return { init: init, home: home, @@ -1913,8 +1432,11 @@ function DRPY(){//导出函数 } } + +let pd = pD; + // 导出函数对象 -export default { +__JS_SPIDER__ = { init: init, home: home, homeVod: homeVod, @@ -1922,5 +1444,5 @@ export default { detail: detail, play: play, search: search, - DRPY:DRPY + DRPY: DRPY }