您需要先安装一个扩展,例如 篡改猴、Greasemonkey 或 暴力猴,之后才能安装此脚本。
您需要先安装一个扩展,例如 篡改猴 或 暴力猴,之后才能安装此脚本。
您需要先安装一个扩展,例如 篡改猴 或 暴力猴,之后才能安装此脚本。
您需要先安装一个扩展,例如 篡改猴 或 Userscripts ,之后才能安装此脚本。
您需要先安装一款用户脚本管理器扩展,例如 Tampermonkey,才能安装此脚本。
您需要先安装用户脚本管理器扩展后才能安装此脚本。
通用网站内容抓取工具,可抓取小说,论坛内容等
当前为
// ==UserScript== // @name DownloadAllContent // @name:zh-CN 懒人小说下载器 // @name:zh-TW 懶人小説下載器 // @name:ja 怠惰者小説ダウンロードツール // @namespace hoothin // @version 0.3 // @description Fetch and download main content on current page // @description:zh-CN 通用网站内容抓取工具,可抓取小说,论坛内容等 // @description:zh-TW 通用網站內容抓取工具,可抓取小說,論壇內容等 // @description:ja ユニバーサルサイトコンテンツクロールツール、クロール、フォーラム内容など // @author hoothin // @include * // @grant GM_xmlhttpRequest // @grant GM_registerMenuCommand // @require https://cdnjs.cloudflare.com/ajax/libs/FileSaver.js/1.3.3/FileSaver.min.js // @license MIT License // @compatible chrome // @compatible firefox // @compatible opera 未测试 // @compatible safari 未测试 // @contributionURL https://www.paypal.com/cgi-bin/webscr?cmd=_donations&[email protected]&item_name=Greasy+Fork+donation // @contributionAmount 1 // ==/UserScript== (function() { 'use strict'; var lang = navigator.appName=="Netscape"?navigator.language:navigator.userLanguage; var i18n={}; switch (lang){ case "zh-CN": i18n={ fetch:"开始下载小说或其他", info:"本文使用DownloadAllContent脚本下载" }; break; default: i18n={ fetch:"Download All Content", info:"The TXT is downloaded with 'DownloadAllContent'" }; break; } var rocketContent=document.createElement("div"); function indexDownload(aEles){ document.body.appendChild(rocketContent); rocketContent.outerHTML=` <div id="txtDownContent" style="display: none;"> <div style="width:300px;height:50px;position:fixed;left:50%;top:50%;margin-top:-25px;margin-left:-150px;z-index:100000;background-color:#ffffff;border:1px solid #afb3b6;border-radius:10px;opacity:0.95;filter:alpha(opacity=95);box-shadow:5px 5px 20px 0px #000;"> <div id="txtDownWords" style="position:absolute;left:20px;top:10px;width:260px;"> </div> <img src="data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAAB4AAAAeCAMAAAAM7l6QAAAA5FBMVEUAAAD+/v7////9/f7////////+/v7+/v7////+/v7+/v7////+/v7+/v7////+/v7+/v7+/v7+/v7+/v7+/v7+/v7+/v7+/v7+/v7+/v7+/v7+/v7////////////+/v7+/v7+/v7+/v7+/v4uje3///82ke7s9P3N5PtQoPDI4fqCu/Tu9v5Im+/6/P+VxfZgqPFNnvDp8/3f7fq42Pmnz/d1tPNvsfNkq/JCmO/4+/7X6fz19/rn8PqYx/aNwfV8uPRqrvJZpfFUovAzkO3Q5vu92/mr0fieyva92fWx0vQ6lO5pygFTAAAAJHRSTlMAmfD+RMGwgj2mknlIKR/36+XGnIyHfnJfVDk2My8S4E1CJBvTatKDAAABY0lEQVQoz4WSZ1fCMBRA05ahLPfemkspBUFwgGz3+P//x/hK6ZBzvB/ak96+kZeoGCtFK5eziitqCSfWOnM2CuWUrOyQYPc0bjM2htHXh+/ffQ4lQ6zEPoZ6TwdUp10M56EtAe5MR7y0HGAeX7Ghe6MTzIZwFtTfBrepUzw4UFSGY8CUTTMGLo3eglv58By21pRnB7aNBqTwPfWq/OVey9sH22wZXiWo6Yr3GtRl/f0IRyoPYy14v97YWjVY12BPrcK9XvhaZPUdWCoLbR35yOoW5P7R8eQ3JrmbSp6HVmSrXuTrmNYyUAs2JkL6D6YjG1PgNGXK87F4nWAsUxmL2gyH6oVD7cuhdqFg9CE4T/oPE6CsgvBOP21715AP7ugaDFK+3YD1KyUcAG47bn0TSylxFd8WDTwMMByoBSUHw+jd9/3JbQODnVExygUS7FRUksPVtdDZW8dqCZm8lc1auxcq4gc02GVGTUchmgAAAABJRU5ErkJggg==" id="txtDownQuit" style="position:absolute;right:0px;top:0px;cursor: pointer;" /> </div> </div>`; var txtDownContent=document.querySelector("#txtDownContent"); var txtDownWords=document.querySelector("#txtDownWords"); var txtDownQuit=document.querySelector("#txtDownQuit"); txtDownQuit.onclick=function(){ txtDownContent.style.display="none"; txtDownContent.parentNode.removeChild(txtDownContent); }; var j=0,rCats=[]; for(let i=0;i<aEles.length;i++){ let aTag=aEles[i]; GM_xmlhttpRequest({ method: 'GET', url: aTag.href, onload: function(result) { var doc = null; try { doc = document.implementation.createHTMLDocument(''); doc.documentElement.innerHTML = result.responseText; } catch (e) { console.log('parse error'); } if (!doc) { return; } j++; rCats[i]=(aTag.textContent+"\r\n"+getPageContent(doc)); txtDownContent.style.display="block"; txtDownWords.innerHTML="已下载完成 "+j+" 段,剩余 "+(aEles.length-j)+" 段"; if(j==aEles.length){ var blob = new Blob([i18n.info+"\r\n"+document.title+"\r\n\r\n"+rCats.join("\r\n\r\n")], {type: "text/plain;charset=utf-8"}); saveAs(blob, document.title+".txt"); } } }); } } function getPageContent(pageData){ var i,rStr=""; var largestContent,contents=pageData.querySelectorAll("span,div,article,p,td"); for(i=0;i<contents.length;i++){ var content=contents[i]; if(content.firstChild && ( (content.firstChild.nodeType!=3 && !/^[I|A]$/.test(content.firstChild.tagName)) || (/^\s*$/.test(content.firstChild.data) && (!content.childNodes[1]||!/^[I|A]$/.test(content.childNodes[1].tagName))) )) continue; if(pageData==document && content.offsetWidth <= 0 && content.offsetHeight <= 0) continue; if(navigator.userAgent.toLowerCase().indexOf('firefox')!=-1){ if(!largestContent || largestContent.textContent.length<content.textContent.length){ largestContent=content; } }else{ if(!largestContent || largestContent.innerText.length<content.innerText.length){ largestContent=content; } } } var childlist=pageData.querySelectorAll(largestContent.tagName); for(i=0;i<childlist.length;i++){ var child=childlist[i]; if(largestContent.className && largestContent.className==child.className){ }else if(child.firstChild && ((child.firstChild.nodeType!=3 && !/^[I|A]$/.test(child.firstChild.tagName)) || (/^\s*$/.test(child.firstChild.data) && (!child.childNodes[1] || !/^[I|A]$/.test(child.childNodes[1].tagName)))))continue; if(getDepth(child)==getDepth(largestContent)){ let childNodes=child.childNodes,cStr="\r\n",hasText=false; for(var j=0;j<childNodes.length;j++){ var childNode=childNodes[j]; if(childNode.nodeType==3 && childNode.data && !/^\s*$/.test(childNode.data))hasText=true; if(childNode.tagName=="BR")cStr+="\r\n"; else if(!/SCRIPT|STYLE/.test(childNode.tagName) && childNode.textContent)cStr+=childNode.textContent.replace(/\s*/," "); } if(hasText)rStr+=cStr; } } return rStr; } function getDepth(dom){ var pa=dom,i=0; while(pa.parentNode){ pa=pa.parentNode; i++; } return i; } function fetch(){ var aEles=document.querySelectorAll("a"),list=[]; for(var i=0;i<aEles.length;i++){ var aEle=aEles[i]; if(/第[\d|〇|零|一|二|三|四|五|六|七|八|九|十|百|千|万|萬]+[章|节|回|卷|折|篇|幕|集]|序|序\s*言|序\s*章|前\s*言|引\s*言|引\s*子|摘\s*要|楔\s*子|后\s*记|附\s*言|结\s*语/.test(aEle.innerHTML)){ list.push(aEle); } } if(list.length>2){ indexDownload(list); }else{ var blob = new Blob([i18n.info+"\r\n"+document.title+"\r\n\r\n"+getPageContent(document)], {type: "text/plain;charset=utf-8"}); saveAs(blob, document.title+".txt"); } } document.addEventListener("keydown", function(e) { if(e.keyCode == 120 && e.ctrlKey) { fetch(); } }); GM_registerMenuCommand(i18n.fetch, fetch); })();