Greasy Fork is available in English.

小说下载器

一个从笔趣阁这样的小说网站下载小说的通用脚本

Versione datata 26/06/2020. Vedi la nuova versione l'ultima versione.

// ==UserScript==
// @name        小说下载器
// @namespace   https://blog.bgme.me
// @match       http://www.yruan.com/article/*.html
// @match       https://www.jingcaiyuedu.com/novel/*/list.html
// @require     https://cdn.jsdelivr.net/npm/file-saver@2.0.2/dist/FileSaver.min.js
// @require     https://cdn.jsdelivr.net/npm/jszip@3.2.1/dist/jszip.min.js
// @run-at      document-end
// @version     1.0.1
// @author      bgme
// @description 一个从笔趣阁这样的小说网站下载小说的通用脚本
// @supportURL  https://github.com/yingziwu/Greasemonkey/issues
// @icon        -
// @license     AGPL-3.0-or-later
// ==/UserScript==

"use strict";
/*
// 直接在 Console 中使用时请去除此段注释
['https://cdn.jsdelivr.net/npm/file-saver@2.0.2/dist/FileSaver.min.js',
    'https://cdn.jsdelivr.net/npm/jszip@3.2.1/dist/jszip.min.js'
].forEach(item => {
    let script = document.createElement('script');
    script.src = item;
    document.body.append(script);
});
*/

const rules = new Map([
    ["www.yruan.com", {
        novelName() { return document.querySelector('#info > h1:nth-child(1)').innerText.trim() },
        author() { return document.querySelector('#info > p:nth-child(2)').innerText.replace(/作\s+者:/, '').trim() },
        intro() { return walk(document.querySelector('#intro > p').childNodes[0], null, 0, '', document.createElement('div'))[0].trim() },
        linkList() { return document.querySelectorAll('div.box_con div#list dl dd a') },
        chapter_name: function(h) { return h.querySelector('.bookname > h1:nth-child(1)').innerText.trim() },
        content: function(h) { return h.querySelector('#content') },
    }],
    ["www.jingcaiyuedu.com", {
        novelName() { return document.querySelector('div.row.text-center.mb10 > h1:nth-child(1)').innerText.trim() },
        author() { return document.querySelector('div.row.text-center.mb10 a[href^="/novel/"]').innerText.trim() },
        intro: (async() => {
            const indexUrl = document.location.href.replace(/\/list.html$/, '.html');
            let intro = await fetch(indexUrl)
                .then(response => response.text())
                .then(text => {
                    const h = (new DOMParser()).parseFromString(text, 'text/html');
                    const introNode = h.querySelector('#bookIntro');
                    let intro = walk(introNode.childNodes[0], null, 0, '', document.createElement('div'))[0].trim();
                    return intro
                });
            return intro
        }),
        linkList() { return document.querySelectorAll('dd.col-md-4 > a') },
        chapter_name: function(h) { return h.querySelector('h1.readTitle').innerText.trim() },
        content: function(h) {
            let c = h.querySelector('#htmlContent');
            let ad = c.querySelector('p:nth-child(1)');
            if (ad.innerText.includes('精彩小说网')) { ad.remove() }
            return c
        },
    }],
]);
const host = document.location.host;
const rule = rules.get(host);

window.addEventListener('DOMContentLoaded', function() {
    if (rule.linkList()) { addButton() }
})


function addButton() {
    let button = document.createElement('button');
    button.className = 'icon_pc';
    button.style.cssText = `position: fixed;
                        top: 15%;
                        right: 5%;
                        z-index: 99;
                        border-style: none;
                        text-align:center;
                        vertical-align:baseline;
                        background-color: rgba(128, 128, 128, 0.2);
                        padding: 5px;
                        border-radius: 12px;`;

    let img = document.createElement('img');
    img.src = ''
    img.style.cssText = 'height: 2em;';

    button.onclick = function() {
        run(rule);
        img.src = '';
        this.onclick = function() {
            alert('正在下载中,请耐心等待……');
        }
    }
    button.appendChild(img);
    document.body.appendChild(button);
    console.log('Add Button……');
}

function run(rule) {
    let novelName, author, intro;
    rule.novelName[Symbol.toStringTag] == 'AsyncFunction' ? rule.novelName().then(result => novelName = result) : novelName = rule.novelName();
    rule.author[Symbol.toStringTag] == 'AsyncFunction' ? rule.author().then(result => author = result) : author = rule.author();
    rule.intro[Symbol.toStringTag] == 'AsyncFunction' ? rule.intro().then(result => intro = result) : intro = rule.intro();

    const size = Symbol('size');
    let linkList = rule.linkList();
    getChapters(linkList)
        .then(chapters => {
            chapters[size] = 0;
            for (let i in chapters) {
                let v = chapters[i];
                let [txtOut, htmlOut] = clearHtml(v.content);
                chapters[i]['txt'] = txtOut;
                chapters[i]['html'] = htmlOut;
                if (chapters.hasOwnProperty(i)) {
                    chapters[size]++;
                }
            }
            return chapters
        })
        .then(chapters => {
            console.log(chapters);
            console.log('保存中……');
            const infoText = `题名:${novelName}\n作者:${author}\n简介:${intro}\n来源地址:${document.location.href}`;
            let outputTxt = infoText;
            let outputHtmlZip = new JSZip;
            for (let i in chapters) {
                let v = chapters[i];

                outputTxt = outputTxt + '\n\n\n\n' + i + '. ' + v.chapter_name + '\n' + v.txt.trim();

                const htmlFileName = 'Chapter' + '0'.repeat(chapters[size].toString().length - i.toString().length) + i.toString() + '.html';
                const htmlFile = genHtml(v);
                outputHtmlZip.file(htmlFileName, htmlFile);
            }
            let baseName = `[${author}]${novelName}`;
            saveAs((new Blob([outputTxt], { type: "text/plain;charset=utf-8" })), baseName + '.txt');
            outputHtmlZip.file('info.txt', (new Blob([infoText], { type: "text/plain;charset=utf-8" })));
            outputHtmlZip.generateAsync({ type: "blob" })
                .then((blob) => { saveAs(blob, baseName + '.zip'); })
                .catch(err => console.log('saveZip: ' + err));
        })


    async function getChapters(linkList) {
        let chapters = {};
        for (let i = 0; i < linkList.length; i++) {
            const href = linkList[i].href;
            await fetch(href)
                .then(response => {
                    console.log(`正在下载:${i}\t${href}`);
                    return response.text()
                })
                .then(text => {
                    const h = (new DOMParser()).parseFromString(text, 'text/html');
                    return h
                })
                .then(h => {
                    const chapter_name = rule.chapter_name(h);
                    let content = rule.content(h);
                    chapters[i] = { 'chapter_name': chapter_name, 'content': content }
                })
        }
        return chapters
    }

    function clearHtml(content) {
        let txtOut = '';
        let htmlOut = document.createElement('div');
        const firstNode = content.childNodes[0];
        [txtOut, htmlOut] = walk(firstNode, null, 0, txtOut, htmlOut);
        return [txtOut, htmlOut]
    }

    function genHtml(v) {
        let htmlFile = (new DOMParser()).parseFromString(
            `<!DOCTYPE html><html><head><meta charset="UTF-8"><meta name="viewport" content="width=device-width, initial-scale=1.0"><title>${v.chapter_name}</title></head><body><h2>${v.chapter_name}</h2></body></html>`,
            'text/html');
        htmlFile.querySelector('body').appendChild(v.html);
        return new Blob([htmlFile.documentElement.outerHTML], { type: "text/html; charset=UTF-8" })
    }
}

function walk(Node, preNode, brCount, txtOut, htmlOut) {
    let nodeName = Node.nodeName;
    if (nodeName === '#text') {
        let nodetext = Node.textContent.trim();
        if (nodetext !== "") {
            if (brCount != 0) {
                if ((Node.previousSibling && Node.previousSibling.nodeName !== 'BR') || (Node.previousSibling === null && ['P', 'DIV'].includes(Node.parentNode.nodeName))) {
                    txtOut = txtOut + '\n' + nodetext;
                } else {
                    txtOut = txtOut + nodetext;
                }
            } else {
                txtOut = txtOut + nodetext;
            }
            let p = document.createElement('p');
            p.innerText = nodetext;
            htmlOut.appendChild(p);
            brCount = 0;
        }
    } else if (nodeName === 'BR') {
        brCount++;
        const nNotBr = (Node.nextSibling && Node.nextSibling.nodeName !== 'BR');
        if (nNotBr) {
            if (brCount === 2) {
                txtOut = txtOut + '\n';
            } else if (brCount >= 3) {
                txtOut = txtOut + '\n\n';

                let p = document.createElement('p');
                p.innerHTML = '<br>';
                htmlOut.appendChild(p);
            }
        }
    } else if (['P', 'DIV'].includes(nodeName)) {
        [txtOut, htmlOut] = walk(Node.childNodes[0], null, brCount + 1, txtOut, htmlOut);
    } else if (Node.childElementCount && Node.childElementCount !== 0) {
        [txtOut, htmlOut] = walk(Node.childNodes[0], null, 0, txtOut, htmlOut);
    } else if (Node.innerText) {
        let nodetext = Node.innerText.trim();
        if (nodetext !== "") {
            txtOut = txtOut + nodetext;

            let lastNode = htmlOut.childNodes[htmlOut.childElementCount - 1];
            lastNode.innerText = lastNode.innerText + nodetext;
        }
    }

    preNode = Node;
    Node = Node.nextSibling;
    if (Node === null) {
        return [txtOut, htmlOut]
    } else {
        [txtOut, htmlOut] = walk(Node, preNode, brCount, txtOut, htmlOut);
        return [txtOut, htmlOut]
    }
}