// ==UserScript==
// @name 小说下载器
// @namespace https://blog.bgme.me
// @match http://www.yruan.com/article/*.html
// @match https://www.jingcaiyuedu.com/novel/*/list.html
// @require https://cdn.jsdelivr.net/npm/[email protected]/dist/FileSaver.min.js
// @require https://cdn.jsdelivr.net/npm/[email protected]/dist/jszip.min.js
// @run-at document-end
// @version 1.0.1
// @author bgme
// @description 一个从笔趣阁这样的小说网站下载小说的通用脚本
// @supportURL https://github.com/yingziwu/Greasemonkey/issues
// @icon -
// @license AGPL-3.0-or-later
// ==/UserScript==
"use strict";
/*
// 直接在 Console 中使用时请去除此段注释
['https://cdn.jsdelivr.net/npm/[email protected]/dist/FileSaver.min.js',
'https://cdn.jsdelivr.net/npm/[email protected]/dist/jszip.min.js'
].forEach(item => {
let script = document.createElement('script');
script.src = item;
document.body.append(script);
});
*/
const rules = new Map([
["www.yruan.com", {
novelName() { return document.querySelector('#info > h1:nth-child(1)').innerText.trim() },
author() { return document.querySelector('#info > p:nth-child(2)').innerText.replace(/作\s+者:/, '').trim() },
intro() { return walk(document.querySelector('#intro > p').childNodes[0], null, 0, '', document.createElement('div'))[0].trim() },
linkList() { return document.querySelectorAll('div.box_con div#list dl dd a') },
chapter_name: function(h) { return h.querySelector('.bookname > h1:nth-child(1)').innerText.trim() },
content: function(h) { return h.querySelector('#content') },
}],
["www.jingcaiyuedu.com", {
novelName() { return document.querySelector('div.row.text-center.mb10 > h1:nth-child(1)').innerText.trim() },
author() { return document.querySelector('div.row.text-center.mb10 a[href^="/novel/"]').innerText.trim() },
intro: (async() => {
const indexUrl = document.location.href.replace(/\/list.html$/, '.html');
let intro = await fetch(indexUrl)
.then(response => response.text())
.then(text => {
const h = (new DOMParser()).parseFromString(text, 'text/html');
const introNode = h.querySelector('#bookIntro');
let intro = walk(introNode.childNodes[0], null, 0, '', document.createElement('div'))[0].trim();
return intro
});
return intro
}),
linkList() { return document.querySelectorAll('dd.col-md-4 > a') },
chapter_name: function(h) { return h.querySelector('h1.readTitle').innerText.trim() },
content: function(h) {
let c = h.querySelector('#htmlContent');
let ad = c.querySelector('p:nth-child(1)');
if (ad.innerText.includes('精彩小说网')) { ad.remove() }
return c
},
}],
]);
const host = document.location.host;
const rule = rules.get(host);
window.addEventListener('DOMContentLoaded', function() {
if (rule.linkList()) { addButton() }
})
function addButton() {
let button = document.createElement('button');
button.className = 'icon_pc';
button.style.cssText = `position: fixed;
top: 15%;
right: 5%;
z-index: 99;
border-style: none;
text-align:center;
vertical-align:baseline;
background-color: rgba(128, 128, 128, 0.2);
padding: 5px;
border-radius: 12px;`;
let img = document.createElement('img');
img.src = ''
img.style.cssText = 'height: 2em;';
button.onclick = function() {
run(rule);
img.src = '';
this.onclick = function() {
alert('正在下载中,请耐心等待……');
}
}
button.appendChild(img);
document.body.appendChild(button);
console.log('Add Button……');
}
function run(rule) {
let novelName, author, intro;
rule.novelName[Symbol.toStringTag] == 'AsyncFunction' ? rule.novelName().then(result => novelName = result) : novelName = rule.novelName();
rule.author[Symbol.toStringTag] == 'AsyncFunction' ? rule.author().then(result => author = result) : author = rule.author();
rule.intro[Symbol.toStringTag] == 'AsyncFunction' ? rule.intro().then(result => intro = result) : intro = rule.intro();
const size = Symbol('size');
let linkList = rule.linkList();
getChapters(linkList)
.then(chapters => {
chapters[size] = 0;
for (let i in chapters) {
let v = chapters[i];
let [txtOut, htmlOut] = clearHtml(v.content);
chapters[i]['txt'] = txtOut;
chapters[i]['html'] = htmlOut;
if (chapters.hasOwnProperty(i)) {
chapters[size]++;
}
}
return chapters
})
.then(chapters => {
console.log(chapters);
console.log('保存中……');
const infoText = `题名:${novelName}\n作者:${author}\n简介:${intro}\n来源地址:${document.location.href}`;
let outputTxt = infoText;
let outputHtmlZip = new JSZip;
for (let i in chapters) {
let v = chapters[i];
outputTxt = outputTxt + '\n\n\n\n' + i + '. ' + v.chapter_name + '\n' + v.txt.trim();
const htmlFileName = 'Chapter' + '0'.repeat(chapters[size].toString().length - i.toString().length) + i.toString() + '.html';
const htmlFile = genHtml(v);
outputHtmlZip.file(htmlFileName, htmlFile);
}
let baseName = `[${author}]${novelName}`;
saveAs((new Blob([outputTxt], { type: "text/plain;charset=utf-8" })), baseName + '.txt');
outputHtmlZip.file('info.txt', (new Blob([infoText], { type: "text/plain;charset=utf-8" })));
outputHtmlZip.generateAsync({ type: "blob" })
.then((blob) => { saveAs(blob, baseName + '.zip'); })
.catch(err => console.log('saveZip: ' + err));
})
async function getChapters(linkList) {
let chapters = {};
for (let i = 0; i < linkList.length; i++) {
const href = linkList[i].href;
await fetch(href)
.then(response => {
console.log(`正在下载:${i}\t${href}`);
return response.text()
})
.then(text => {
const h = (new DOMParser()).parseFromString(text, 'text/html');
return h
})
.then(h => {
const chapter_name = rule.chapter_name(h);
let content = rule.content(h);
chapters[i] = { 'chapter_name': chapter_name, 'content': content }
})
}
return chapters
}
function clearHtml(content) {
let txtOut = '';
let htmlOut = document.createElement('div');
const firstNode = content.childNodes[0];
[txtOut, htmlOut] = walk(firstNode, null, 0, txtOut, htmlOut);
return [txtOut, htmlOut]
}
function genHtml(v) {
let htmlFile = (new DOMParser()).parseFromString(
`<!DOCTYPE html><html><head><meta charset="UTF-8"><meta name="viewport" content="width=device-width, initial-scale=1.0"><title>${v.chapter_name}</title></head><body><h2>${v.chapter_name}</h2></body></html>`,
'text/html');
htmlFile.querySelector('body').appendChild(v.html);
return new Blob([htmlFile.documentElement.outerHTML], { type: "text/html; charset=UTF-8" })
}
}
function walk(Node, preNode, brCount, txtOut, htmlOut) {
let nodeName = Node.nodeName;
if (nodeName === '#text') {
let nodetext = Node.textContent.trim();
if (nodetext !== "") {
if (brCount != 0) {
if ((Node.previousSibling && Node.previousSibling.nodeName !== 'BR') || (Node.previousSibling === null && ['P', 'DIV'].includes(Node.parentNode.nodeName))) {
txtOut = txtOut + '\n' + nodetext;
} else {
txtOut = txtOut + nodetext;
}
} else {
txtOut = txtOut + nodetext;
}
let p = document.createElement('p');
p.innerText = nodetext;
htmlOut.appendChild(p);
brCount = 0;
}
} else if (nodeName === 'BR') {
brCount++;
const nNotBr = (Node.nextSibling && Node.nextSibling.nodeName !== 'BR');
if (nNotBr) {
if (brCount === 2) {
txtOut = txtOut + '\n';
} else if (brCount >= 3) {
txtOut = txtOut + '\n\n';
let p = document.createElement('p');
p.innerHTML = '<br>';
htmlOut.appendChild(p);
}
}
} else if (['P', 'DIV'].includes(nodeName)) {
[txtOut, htmlOut] = walk(Node.childNodes[0], null, brCount + 1, txtOut, htmlOut);
} else if (Node.childElementCount && Node.childElementCount !== 0) {
[txtOut, htmlOut] = walk(Node.childNodes[0], null, 0, txtOut, htmlOut);
} else if (Node.innerText) {
let nodetext = Node.innerText.trim();
if (nodetext !== "") {
txtOut = txtOut + nodetext;
let lastNode = htmlOut.childNodes[htmlOut.childElementCount - 1];
lastNode.innerText = lastNode.innerText + nodetext;
}
}
preNode = Node;
Node = Node.nextSibling;
if (Node === null) {
return [txtOut, htmlOut]
} else {
[txtOut, htmlOut] = walk(Node, preNode, brCount, txtOut, htmlOut);
return [txtOut, htmlOut]
}
}