// ==UserScript== // @name 小说下载器 // @namespace https://blog.bgme.me // @match http://www.yruan.com/article/*.html // @match https://www.jingcaiyuedu.com/novel/*/list.html // @match http://www.shuquge.com/txt/*/index.html // @match http://www.dingdiann.com/ddk*/ // @match https://www.dingdiann.com/ddk*/ // @match http://www.biquwo.org/bqw*/ // @match http://www.xkzw.org/xkzw*/ // @match https://www.fpzw.com/xiaoshuo/*/*/ // @match https://www.hetushu.com/book/*/index.html // @grant unsafeWindow // @require https://cdn.jsdelivr.net/npm/file-saver@2.0.2/dist/FileSaver.min.js // @require https://cdn.jsdelivr.net/npm/jszip@3.2.1/dist/jszip.min.js // @run-at document-end // @version 1.1.5.6 // @author bgme // @description 一个从笔趣阁这样的小说网站下载小说的通用脚本 // @supportURL https://github.com/yingziwu/Greasemonkey/issues // @icon https://greasyfork.org/assets/blacklogo96-1221dbbb8f0d47a728f968c35c2e2e03c64276a585b8dceb7a79a17a3f350e8a.png // @license AGPL-3.0-or-later // @downloadURL none // ==/UserScript== "use strict"; /* 本下载器可添加抓取规则以支持更多网站 抓取规则示例: ["www.yruan.com", { bookname() { return document.querySelector('#info > h1:nth-child(1)').innerText.trim() }, author() { return document.querySelector('#info > p:nth-child(2)').innerText.replace(/作\s+者:/, '').trim() }, intro() { return convertDomNode(document.querySelector('#intro > p'))[0] }, linkList() { return document.querySelectorAll('div.box_con div#list dl dd a') }, coverUrl() { return document.querySelector('#fmimg > img').src; }, chapterName: function(doc) { return doc.querySelector('.bookname > h1:nth-child(1)').innerText.trim() }, content: function(doc) { return doc.querySelector('#content') }, }], 抓取规则的 `key` 为该抓取规则适用的网站域名,即 `document.location.host`。 抓取规则的 `value` 一对象,该对象由7个函数组成: 函数名 功能 返回值 bookname() 抓取小说题名 String author() 抓取小说作者 String intro() 抓取小说简介 String linkList() 抓取小说分章链接列表 NodeList coverUrl() 抓取小说封面图片地址 String 以上5个函数在小说目录页(即按下按钮时的页面)运行。 函数名 功能 返回值 chapterName(doc) 抓取小说章节名 String content(doc) 抓取小说章节主体部分 Element 以上2个函数在小说章节页运行,输入值 `doc` 为小说章节页的 `document` 。 根据上述要求添加好相应网站抓取规则,并在 `// @match` 中添加相应网站,即可在新网站上使用本下载器。 调试功能: 将 `enableDebug` 变量改为 `true` 可开启调试功能,开启之后可在控制台(console)中访问如下对象: 对象名 类型 功能 rule 变量 当前抓取规则 main(rule) 函数 运行下载器 convertDomNode(node) 函数 输出处理后的txt文本及Dom节点 ruleTest(rule) 函数 测试抓取规则 */ const enableDebug = false; const maxRetryTimes = 3; const maxConcurrency = 10; const rules = new Map([ ["www.yruan.com", { bookname() { return document.querySelector('#info > h1:nth-child(1)').innerText.trim() }, author() { return document.querySelector('#info > p:nth-child(2)').innerText.replace(/作\s+者:/, '').trim() }, intro() { return convertDomNode(document.querySelector('#intro > p'))[0] }, linkList() { return document.querySelectorAll('div.box_con div#list dl dd a') }, coverUrl() { return document.querySelector('#fmimg > img').src }, chapterName: function(doc) { return doc.querySelector('.bookname > h1:nth-child(1)').innerText.trim() }, content: function(doc) { return doc.querySelector('#content') }, }], ["www.jingcaiyuedu.com", { bookname() { return document.querySelector('div.row.text-center.mb10 > h1:nth-child(1)').innerText.trim() }, author() { return document.querySelector('div.row.text-center.mb10 a[href^="/novel/"]').innerText.trim() }, intro: async() => { const indexUrl = document.location.href.replace(/\/list.html$/, '.html'); return (crossPage(indexUrl, "convertDomNode(doc.querySelector('#bookIntro'))[0]")) }, linkList() { return document.querySelectorAll('dd.col-md-4 > a') }, coverUrl: async() => { const indexUrl = document.location.href.replace(/\/list.html$/, '.html'); return (crossPage(indexUrl, "doc.querySelector('.panel-body img').getAttribute('data-original')")) }, chapterName: function(doc) { return doc.querySelector('h1.readTitle').innerText.trim() }, content: function(doc) { let c = doc.querySelector('#htmlContent'); let ad = c.querySelector('p:nth-child(1)'); if (ad.innerText.includes('精彩小说网')) { ad.remove() } return c }, }], ["www.shuquge.com", { bookname() { return document.querySelector('.info > h2').innerText.trim() }, author() { return document.querySelector('.small > span:nth-child(1)').innerText.replace(/作者:/, '').trim() }, intro() { let iNode = document.querySelector('.intro'); iNode.innerHTML = iNode.innerHTML.replace(/推荐地址:http:\/\/www.shuquge.com\/txt\/\d+\/index\.html/, ''); return convertDomNode(iNode)[0]; }, linkList() { return includeLatestChapter('.listmain > dl:nth-child(1)') }, coverUrl() { return document.querySelector('.info > .cover > img').src }, chapterName: function(doc) { return doc.querySelector('.content > h1:nth-child(1)').innerText.trim() }, content: function(doc) { let content = doc.querySelector('#content'); content.innerHTML = content.innerHTML.replace('请记住本书首发域名:www.shuquge.com。书趣阁_笔趣阁手机版阅读网址:m.shuquge.com', '').replace(/http:\/\/www.shuquge.com\/txt\/\d+\/\d+\.html/, ''); return content }, }], ["www.dingdiann.com", { bookname() { return document.querySelector('#info > h1:nth-child(1)').innerText.trim() }, author() { return document.querySelector('#info > p:nth-child(2)').innerText.replace(/作\s+者:/, '').trim() }, intro() { return convertDomNode(document.querySelector('#intro'))[0] }, linkList() { return includeLatestChapter('#list > dl') }, coverUrl() { return document.querySelector('#fmimg > img').src }, chapterName: function(doc) { return doc.querySelector('.bookname > h1:nth-child(1)').innerText.trim() }, content: function(doc) { let content = doc.querySelector('#content'); let ad = '
章节错误,点此举报(免注册),举报后维护人员会在两分钟内校正章节内容,请耐心等待,并刷新页面。
'; content.innerHTML = content.innerHTML.replace(ad, '').replace(/http:\/\/www.shuquge.com\/txt\/\d+\/\d+\.html/, ''); return content }, }], ["www.fpzw.com", { bookname() { return document.querySelector('#title > h1:nth-child(1)').innerText.trim() }, author() { return document.querySelector('.author > a:nth-child(1)').innerText.trim() }, intro: async() => { const indexUrl = document.location.href.replace(/xiaoshuo\/\d+\//, ''); const charset = 'GBK'; return (crossPage(indexUrl, "convertDomNode(doc.querySelector('.wright .Text'))[0]", charset)) }, linkList() { return includeLatestChapter('.book') }, coverUrl: async() => { const indexUrl = document.location.href.replace(/xiaoshuo\/\d+\//, ''); const charset = 'GBK'; return (crossPage(indexUrl, "doc.querySelector('div.bortable.wleft > img').src", charset)) }, chapterName: function(doc) { return doc.querySelector('h2').innerText.trim() }, content: function(doc) { let content = doc.querySelector('.Text'); content.querySelector('.Text > a:nth-child(1)').remove(); content.querySelector('.Text > font[color="#F00"]').remove(); content.querySelector('strong.top_book').remove(); return content }, charset: 'GBK', }], ["www.hetushu.com", { bookname() { return document.querySelector('.book_info > h2').innerText.trim() }, author() { return document.querySelector('.book_info > div:nth-child(3) > a:nth-child(1)').innerText.trim() }, intro() { return convertDomNode(document.querySelector('.intro'))[0] }, linkList() { return document.querySelectorAll('#dir dd a') }, coverUrl() { return document.querySelector('.book_info > img').src }, chapterName: function(doc) { return doc.querySelector('#content .h2').innerText.trim() }, content: function(doc) { let content = doc.querySelector('#content'); content.querySelectorAll('h2').forEach(n => n.remove()) return content }, }], ["www.biquwo.org", { bookname() { return document.querySelector('#info > h1').innerText.trim() }, author() { return document.querySelector('#info > p:nth-child(2)').innerText.replace(/作\s+者:/, '').trim() }, intro() { return convertDomNode(document.querySelector('#intro'))[0] }, linkList() { return includeLatestChapter('#list > dl:nth-child(1)') }, coverUrl() { return document.querySelector('#fmimg > img').src }, chapterName: function(doc) { return doc.querySelector('.bookname > h1:nth-child(1)').innerText.trim() }, content: function(doc) { return doc.querySelector('#content') }, }], ["www.xkzw.org", { bookname() { return document.querySelector('#info > h1').innerText.trim() }, author() { return document.querySelector('#info > p:nth-child(2)').innerText.replace(/作\s+者:/, '').trim() }, intro() { return convertDomNode(document.querySelector('#intro'))[0] }, linkList() { let showmore = document.querySelector('#showMore a'); let showmoreJS = showmore.href.replace('javascript:', ''); if (!showmore.innerText.includes('点击关闭')) { eval(showmoreJS); } return document.querySelectorAll('.list dd > a') }, coverUrl() { return document.querySelector('#fmimg > img').src }, chapterName: function(doc) { return doc.querySelector('.bookname > h1:nth-child(1)').innerText.trim() }, content: async function(doc) { const CryptoJS = await loadCryptoJs(); runEval(CryptoJS); return doc.querySelector('#content') async function loadCryptoJs() { const url = 'https://cdn.jsdelivr.net/npm/crypto-js@4.0.0/crypto-js.min.js'; let response = await fetch(url); let scriptText = await response.text(); eval(scriptText) const CryptoJS = unsafeWindow.CryptoJS; return CryptoJS } function runEval(CryptoJS) { // 以下部分来自 http://www.xkzw.org/js/c.js 中的去除混淆后的解密代码 // 本人将原代码中 document 修改为 doc function gettt1(str, keyStr, ivStr) { var key = CryptoJS.enc.Utf8.parse(keyStr); var iv = CryptoJS.enc.Utf8.parse(ivStr); var encryptedHexStr = CryptoJS.enc.Hex.parse(str); var srcs = CryptoJS.enc.Base64.stringify(encryptedHexStr); var decrypt = CryptoJS.DES.decrypt(srcs, key, { iv: iv, mode: CryptoJS.mode.CBC, padding: CryptoJS.pad.Pkcs7 }); var decryptedStr = decrypt.toString(CryptoJS.enc.Utf8); return decryptedStr.toString() }; function gettt2(str, keyStr, ivStr) { var key = CryptoJS.enc.Utf8.parse(keyStr); var iv = CryptoJS.enc.Utf8.parse(ivStr); var encryptedHexStr = CryptoJS.enc.Hex.parse(str); var srcs = CryptoJS.enc.Base64.stringify(encryptedHexStr); var decrypt = CryptoJS.AES.decrypt(srcs, key, { iv: iv, mode: CryptoJS.mode.CBC, padding: CryptoJS.pad.Pkcs7 }); var decryptedStr = decrypt.toString(CryptoJS.enc.Utf8); return decryptedStr.toString() }; function gettt3(str, keyStr, ivStr) { var key = CryptoJS.enc.Utf8.parse(keyStr); var iv = CryptoJS.enc.Utf8.parse(ivStr); var encryptedHexStr = CryptoJS.enc.Hex.parse(str); var srcs = CryptoJS.enc.Base64.stringify(encryptedHexStr); var decrypt = CryptoJS.RC4.decrypt(srcs, key, { iv: iv, mode: CryptoJS.mode.CBC, padding: CryptoJS.pad.Pkcs7 }); var decryptedStr = decrypt.toString(CryptoJS.enc.Utf8); return decryptedStr.toString() }; function getttn(str, keyStr, ivStr) { var key = CryptoJS.enc.Utf8.parse(keyStr); var iv = CryptoJS.enc.Utf8.parse(ivStr); var encryptedHexStr = CryptoJS.enc.Hex.parse(str); var srcs = CryptoJS.enc.Base64.stringify(encryptedHexStr); var decrypt = CryptoJS.TripleDES.decrypt(srcs, key, { iv: iv, mode: CryptoJS.mode.CBC, padding: CryptoJS.pad.Pkcs7 }); var decryptedStr = decrypt.toString(CryptoJS.enc.Utf8); return decryptedStr.toString() }; function showttt1(doc) { var obj = doc.getElementById("other"); var objTips = doc.getElementById("contenttips"); if (obj) { var content = obj.innerHTML.trim(); var type = parseInt(content.substring(0, 1)); var key; var iv; if (type == 1) { key = content.substring(1, 9); iv = content.substring(9, 17); content = content.substring(17); obj.innerHTML = gettt1(content, key, iv); obj.style.display = "block"; if (objTips) { objTips.style.display = "none" } } else if (type == 2) { key = content.substring(1, 33); iv = content.substring(33, 49); content = content.substring(49); obj.innerHTML = gettt2(content, key, iv); obj.style.display = "block"; if (objTips) { objTips.style.display = "none" } } else if (type == 3) { key = content.substring(1, 9); iv = content.substring(9, 17); content = content.substring(17); obj.innerHTML = gettt3(content, key, iv); obj.style.display = "block"; if (objTips) { objTips.style.display = "none" } } else { key = content.substring(1, 25); iv = content.substring(25, 33); content = content.substring(33); obj.innerHTML = getttn(content, key, iv); obj.style.display = "block"; if (objTips) { objTips.style.display = "none" } } } }; showttt1(doc); } }, }], ]); function includeLatestChapter(selector) { let dl = document.querySelector(selector); let rDt = dl.querySelector('dt:nth-child(1)') if (rDt.innerText.includes('最新章节')) { let p = null; let n = rDt; while (true) { if (n.nodeName == 'DD') { p = n; n = n.nextSibling; p.classList.add('not_download') } else if (n.nodeName == 'DT' && !n.innerText.includes('最新章节')) { break; } else { p = n; n = n.nextSibling; } } } return dl.querySelectorAll('dd:not(.not_download) > a') } async function crossPage(url, functionString, charset) { let text; if (charset === undefined) { text = await fetch(url).then(response => response.text()) } else { text = await fetch(url) .then(response => response.arrayBuffer()) .then(buffer => { let decoder = new TextDecoder(charset); let text = decoder.decode(buffer); return text }) } const doc = (new DOMParser()).parseFromString(text, 'text/html'); return (eval(functionString)) } const host = document.location.host; const rule = rules.get(host); const charset = rule.charset; const icon0 = ''; const icon1 = ''; let nowWorking = 0; let downloading = false; window.addEventListener('DOMContentLoaded', function() { if (rule.linkList()) { addButton() } if (enableDebug) { debug() } }) function addButton() { let button = document.createElement('button'); button.id = 'novel-downloader'; button.style.cssText = `position: fixed; top: 15%; right: 5%; z-index: 99; border-style: none; text-align:center; vertical-align:baseline; background-color: rgba(128, 128, 128, 0.2); padding: 5px; border-radius: 12px;`; let img = document.createElement('img'); img.src = icon0; img.style.cssText = 'height: 2em;'; button.onclick = function() { if (downloading) { alert('正在下载中,请耐心等待……'); } else { downloading = true; img.src = icon1; console.log('开始下载……') main(rule) } } button.appendChild(img); document.body.appendChild(button); } async function main(rule) { let bookname, author, intro, linkList, cover, sourceUrl, infoText; [bookname, author, intro, linkList, cover, sourceUrl, infoText] = await getMetadate(rule); const pageNum = linkList.length; let pageTaskQueue = genPageTaskQueue(linkList); let pageWorkerResolved = new Map(); let pageWorkerRejected = new Map(); let loopId = setInterval(loop, 300); function loop() { let finishNum = pageWorkerResolved.size + pageWorkerRejected.size; if (finishNum !== pageNum) { for (let i = nowWorking; i < maxConcurrency; i++) { const pageTask = pageTaskQueue.pop(); if (pageTask) { nowWorking++; console.log(`开始下载:${pageTask.id}\t${pageTask.dom.innerText}\t${pageTask.url}\t第${pageTask.retry}次重试`); pageWorker(pageTask, pageWorkerResolved, pageWorkerRejected, pageTaskQueue, rule); } } } else { clearInterval(loopId); save(pageWorkerResolved, bookname, author, infoText, cover, pageNum); } } } function save(pageWorkerResolved, bookname, author, infoText, cover, pageNum) { console.log('保存文件中……') let sortKeys = []; for (let key of pageWorkerResolved.keys()) { sortKeys.push(key); } sortKeys.sort(compareNumeric); let savedTxt = infoText; let savedZip = new JSZip(); for (let key of sortKeys) { let v = pageWorkerResolved.get(key); savedTxt = savedTxt + '\n\n\n\n' + `## ${v.chapterName}` + '\n' + '='.repeat(30) + '\n\n' + v.txt.trim(); const htmlFileName = 'Chapter' + '0'.repeat(pageNum.toString().length - key.toString().length) + key.toString() + '.html'; const htmlFile = genHtml(v.chapterName, v.dom); savedZip.file(htmlFileName, htmlFile); } const saveBaseFileName = `[${author}]${bookname}`; saveAs((new Blob([savedTxt], { type: "text/plain;charset=utf-8" })), saveBaseFileName + '.txt'); savedZip.file('info.txt', (new Blob([infoText], { type: "text/plain;charset=utf-8" }))); savedZip.file(`cover.${cover.type}`, cover.file); savedZip.generateAsync({ type: "blob", compression: "DEFLATE", compressionOptions: { level: 6 } }).then((blob) => { saveAs(blob, saveBaseFileName + '.zip'); }) .catch(err => console.log('saveZip: ' + err)); downloading = false; document.querySelector('#novel-downloader > img').src = icon0; console.log('下载完毕!') function compareNumeric(a, b) { if (a > b) return 1; if (a == b) return 0; if (a < b) return -1; } } function genHtml(chapterName, dom) { let htmlFile = (new DOMParser()).parseFromString( `${chapterName}

${chapterName}

`, 'text/html'); htmlFile.querySelector('body').appendChild(dom); return new Blob([htmlFile.documentElement.outerHTML], { type: "text/html; charset=UTF-8" }) } async function getMetadate(rule) { let bookname, author, intro, linkList, coverUrl, cover, sourceUrl, infoText; if (rule.bookname[Symbol.toStringTag] == 'AsyncFunction') { await rule.bookname().then(result => bookname = result) } else { bookname = rule.bookname() } if (rule.author[Symbol.toStringTag] == 'AsyncFunction') { await rule.author().then(result => author = result) } else { author = rule.author() } if (rule.intro[Symbol.toStringTag] == 'AsyncFunction') { await rule.intro().then(result => intro = result) } else { intro = rule.intro() } if (rule.linkList[Symbol.toStringTag] == 'AsyncFunction') { await rule.linkList().then(result => linkList = result) } else { linkList = rule.linkList() } if (rule.coverUrl[Symbol.toStringTag] == 'AsyncFunction') { await rule.coverUrl().then(result => coverUrl = result) } else { coverUrl = rule.coverUrl() } await fetch(coverUrl).then(response => { cover = { 'type': response.headers.get('Content-Type').split('/')[1], 'file': response.blob(), 'url': coverUrl }; }) intro = intro.replaceAll(/\n{2,}/g, '\n'); sourceUrl = document.location.href; infoText = `题名:${bookname}\n作者:${author}\n简介:${intro}\n来源:${document.location.href}`; return [bookname, author, intro, linkList, cover, sourceUrl, infoText] } function genPageTaskQueue(linkList) { let pageTaskQueue = []; for (let i = 0; i < linkList.length; i++) { let pageTask = { 'id': i, 'url': linkList[i].href, 'retry': 0, 'dom': linkList[i] }; pageTaskQueue.push(pageTask); } return pageTaskQueue } function pageWorker(pageTask, pageWorkerResolved, pageWorkerRejected, pageTaskQueue, rule) { let id = pageTask.id; let url = pageTask.url; let retry = pageTask.retry; let dom = pageTask.dom; let text; if (charset === undefined) { text = fetch(url).then( response => response.text(), error => { nowWorking--; errorCallback(error) } ) } else { text = fetch(url).then( response => response.arrayBuffer(), error => { nowWorking--; errorCallback(error) }).then( buffer => { let decoder = new TextDecoder(charset); let text = decoder.decode(buffer); return text }) } text.then(text => { nowWorking--; extractData(id, url, text, rule, pageWorkerResolved) }).catch(error => errorCallback(error)) function errorCallback(error) { console.error(id, url, pageTask, error); retry++; if (retry > maxRetryTimes) { pageWorkerRejected.set(id, url); } else { pageTaskQueue.push({ 'id': id, 'url': url, 'retry': retry, 'dom': dom }); } } } async function extractData(id, url, text, rule, pageWorkerResolved) { let doc = (new DOMParser()).parseFromString(text, 'text/html'); let chapterName, content; if (rule.chapterName[Symbol.toStringTag] == 'AsyncFunction') { await rule.chapterName(doc).then(result => chapterName = result) } else { chapterName = rule.chapterName(doc) } if (rule.content[Symbol.toStringTag] == 'AsyncFunction') { await rule.content(doc).then(result => content = result) } else { content = rule.content(doc) } let txtOut, htmlOut; [txtOut, htmlOut] = convertDomNode(content); pageWorkerResolved.set(id, { 'id': id, 'url': url, 'chapterName': chapterName, 'content': content, 'txt': txtOut, 'dom': htmlOut }); } function convertDomNode(node) { let txtOut = ''; let htmlOut = document.createElement('div'); let brc = 0; [txtOut, htmlOut, brc] = walker(null, node.childNodes[0], node, brc, txtOut, htmlOut); txtOut = txtOut.trim(); return [txtOut, htmlOut] } function walker(p, n, r, brc, txtOut, htmlOut) { let pNodeName, nNodeName; if (p) { pNodeName = p.nodeName; } else { pNodeName = null; } if (n) { nNodeName = n.nodeName; } else { nNodeName = null; } const nodeType2 = ['DIV', 'P', 'OL', 'H1', 'H1', 'H2', 'H3', 'H4', 'H5', 'H6']; const nodeType3 = ['SCRIPT', 'STYLE', '#comment']; let lastNode; if (htmlOut.childElementCount !== 0) { lastNode = htmlOut.childNodes[htmlOut.childElementCount - 1]; } else { lastNode = document.createElement('p'); } if (nodeType3.includes(nNodeName)) { //pass } else if (nNodeName === 'BR') { brc++ } else if (nNodeName == 'HR') { txtOut = txtOut + '\n' + '-'.repeat(15) + 'n'; let hr = document.createElement('hr'); htmlOut.appendChild(hr); } else if (nNodeName === '#text') { const nodetext = n.textContent.trim() .replace(/(\s+)?\n+(\s+)?/g, '').replace(/\s+/, ' '); if (nodetext) { if (brc === 0) { if (nodeType2.includes(pNodeName)) { txtOut = txtOut + '\n'.repeat(2) + nodetext; let p0 = document.createElement('p'); p0.innerText = nodetext; htmlOut.appendChild(p0); } else { txtOut = txtOut + nodetext; lastNode.innerText = lastNode.innerText + nodetext; } } else if (brc === 1 || brc === 2) { txtOut = txtOut + '\n'.repeat(brc) + nodetext; let p0 = document.createElement('p'); p0.innerText = nodetext; htmlOut.appendChild(p0); } else { txtOut = txtOut + '\n'.repeat(3) + nodetext; let p1 = document.createElement('p'); let p2 = p1.cloneNode(); let br = document.createElement('br'); p1.appendChild(br); p2.innerText = nodetext; htmlOut.appendChild(p1); htmlOut.appendChild(p2); } brc = 0; } } else if (nodeType2.includes(nNodeName)) { if (n.childElementCount === 0) { const nodetext = n.innerText.trim(); if (nodetext) { if (brc >= 3) { txtOut = txtOut + '\n'.repeat(3) + nodetext; let p1 = document.createElement('p'); let p2 = p1.cloneNode(); let br = document.createElement('br'); p1.appendChild(br); p2.innerText = nodetext; htmlOut.appendChild(p1); htmlOut.appendChild(p2); } else { txtOut = txtOut + '\n'.repeat(2) + nodetext; let p0 = document.createElement('p'); p0.innerText = nodetext; htmlOut.appendChild(p0); } } } else { [txtOut, htmlOut, brc] = walker(null, n.childNodes[0], n, brc + 2, txtOut, htmlOut); } } else if (n.childElementCount === 0) { const nodetext = n.innerText.trim(); if (nodetext) { txtOut = txtOut + nodetext; lastNode.innerText = lastNode.innerText + nodetext; } } else if (n.childElementCount !== 0) { [txtOut, htmlOut, brc] = walker(null, n.childNodes[0], n, brc, txtOut, htmlOut); } p = n; n = n.nextSibling; if (n === null) { return [txtOut, htmlOut, brc] } else { [txtOut, htmlOut, brc] = walker(p, n, r, brc, txtOut, htmlOut) return [txtOut, htmlOut, brc] } } function debug() { unsafeWindow.rule = rule; unsafeWindow.main = main; unsafeWindow.convertDomNode = convertDomNode; unsafeWindow.ruleTest = ruleTest; } async function ruleTest(rule) { let bookname, author, intro, linkList, cover, sourceUrl, infoText; [bookname, author, intro, linkList, cover, sourceUrl, infoText] = await getMetadate(rule); console.log(`infoText:\n${infoText}`); console.log('cover: ', cover); console.log('linkList: ', linkList); let blob = await cover.file; let coverImg = document.createElement('img'); coverImg.src = URL.createObjectURL(blob); coverImg.onclick = function() { this.remove() }; coverImg.style.cssText = `position: fixed; bottom: 8%; right: 8%; z-index: 99; max-width: 150px;`; document.body.appendChild(coverImg); let pageTaskQueue = [{ 'id': 0, 'url': linkList[0].href, 'retry': 0, 'dom': linkList[0] }]; let pageWorkerResolved = new Map(); let pageWorkerRejected = new Map(); let loopId = setInterval(loop, 800); function loop() { let finishNum = pageWorkerResolved.size + pageWorkerRejected.size; if (finishNum != 1) { const pageTask = pageTaskQueue.pop() if (pageTask) { pageWorker(pageTask, pageWorkerResolved, pageWorkerRejected, pageTaskQueue, rule); } } else { clearInterval(loopId); let result = pageWorkerResolved.get(0); console.log(result); } } }