卓越飞翔博客卓越飞翔博客

卓越飞翔 - 您值得收藏的技术分享站
技术文章1829本站已运行4109

某电子书网站,电子书打包下载脚本

脚本用途:合并一部电子书多个章节为一个html文件 ,并清理网页中的html代码, 生成的html 适合转换为 kindle 的 mobi 等格式
使用方法:打开电子书的章节索引页面,会自动生成一个 “点击下载电子书”的链接,点击即可下载。
// ==UserScript==
// [url=home.php?mod=space&uid=170990]@name[/url]         **文学电子书下载
// [url=home.php?mod=space&uid=467642]@namespace[/url]    http://tampermonkey.net/
// [url=home.php?mod=space&uid=1248337]@version[/url]      2024-01-31
// @description  打包下载**文学电子书下载!
// [url=home.php?mod=space&uid=686208]@AuThor[/url]       You
// [url=home.php?mod=space&uid=195849]@match[/url]        https://www.*ing*ue*oke.com/*/
// [url=home.php?mod=space&uid=593100]@Icon[/url]         https://www.*ing*ue*oke.com/favicon.ico
// [url=home.php?mod=space&uid=609072]@grant[/url]        none
// ==/UserScript==
 
(function() {
    'use strict';
    var contentList = document.getElementById('content-list')
    if(contentList === null){
        return;
    }
    var bookDescribe = contentList.querySelector('.book-describe').innerText;
    var metas = bookDescribe.split('\n\n');
    var title = metas[0];
    var author = metas[1].split(':')[1];
    var guojia = metas[2].split(':')[1];
    var niandai = metas[3].split(':')[1];
    var description= metas[5];
    var booklist = document.querySelector('.book-list');
    var sections = [];
    var tasks = [];
    booklist.querySelectorAll('a').forEach(function(a,i){
        sections.push({title:a.title,content:i});
        var t = fetch(a.href).then(function(response){
            return response.text()}
                                  ).then(function (text) {
            var div = document.createElement('div');
            div.innerHTML = text;
            var nr1=div.querySelector('#nr1 div');
            sections[i].content = nr1.innerHTML;
        });
        tasks.push(t);
    });
    Promise.all(tasks).then(function(){
        var html = ['<!DOCTYPE html>',
                    '<html lang="zh-CN">',
                    '<head>',
                    '<meta charset="utf-8">',
                    '<meta name="author" content="' + author + '">',
                    '<meta name="description" content="'+ description +'">',
                    '<title>' + title + '</title>',
                    '</head>',
                    '<body>',
                    '<article>',
                    '<h1>' + title + ' <small> '+ author +'</small></h1>'];
        sections.forEach(function(section){
            html.push('<section>');
            html.push('<h2>' + section.title + '</h2>');
            html.push(section.content);
            html.push('</section>');
        });
        html.push('</article>');
        html.push('</body>');
        html.push('</html>');
        contentList.querySelector('.book-describe').innerHTML = '<p><a id="download">点击下载电子书</a></p>' + contentList.querySelector('.book-describe').innerHTML;
        var a = document.getElementById('download');
        a.href = 'data:text/plain;charset=utf-8,'+html.join('\n');
        a.download = title + '.html';
    });
})();
狗尾续貂,改进了样式和下载过大文件可能下载不全的问题。
// ==UserScript==
// @name         星月文学电子书下载
// @namespace    https://www.52pojie.cn/thread-1886476-1-1.html
// @version      2024-01-31
// @description  打包下载星月文学电子书下载!
// @author       bh4ger
// @match        https://www.xingyueboke.com/*/
// @icon         https://www.xingyueboke.com/favicon.ico
// @grant        none
// ==/UserScript==
 
(function() {
    'use strict';
    var contentList = document.getElementById('content-list')
    if(contentList === null){
        return;
    }
    var bookDescribe = contentList.querySelector('.book-describe').innerText;
    var metas = bookDescribe.split('\n\n');
    var title = metas[0];
    var author = metas[1].split(':')[1];
    var guojia = metas[2].split(':')[1];
    var niandai = metas[3].split(':')[1];
    var description= metas[5];
    var booklist = document.querySelector('.book-list');
    var sections = [];
    var tasks = [];
    booklist.querySelectorAll('a').forEach(function(a,i){
        sections.push({title:a.title,content:i});
        var t = fetch(a.href)
        .then(function(response){
            return response.text()
        })
        .then(function (text) {
            var div = document.createElement('div');
            div.innerHTML = text;
            var nr1=div.querySelector('#nr1 div');
            sections[i].content = nr1.innerHTML;
        });
        tasks.push(t);
    });
    Promise.all(tasks).then(function(){
        var html = ['<!DOCTYPE html>',
                    '<html lang="zh-CN">',
                    '<head>',
                    '<meta charset="utf-8">',
                    '<meta name="author" content="' + author + '">',
                    '<meta name="description" content="'+ description +'">',
                    '<title>' + title + '</title>',
                    '</head>',
                    '<body>',
                    '<article>',
                    '<h1>' + title + ' <small> '+ author +'</small></h1>'];
        sections.forEach(function(section){
            html.push('<section>');
            html.push('<h2>' + section.title + '</h2>');
            html.push(section.content);
            html.push('</section>');
        });
        html.push('</article>');
        html.push('</body>');
        html.push('</html>');
        contentList.querySelector('.book-describe').innerHTML = '<div class="scrolltobt"><a id="download">下载电子书</a><br /></br /><a id="singlePage">单页浏览</a></div>' + contentList.querySelector('.book-describe').innerHTML;
        let a = document.getElementById('download');
        a.href = 'data:text/plain;charset=utf-8,'+html.join('\n').replaceAll('#','@');
        a.download = title + '.html';
        let b=document.getElementById('singlePage');
        b.href='javascript:void(0);';
        b.addEventListener("click",function(){
            let win=window.open("about:blank");
            win.document.write(html.join('\n'));
        });
 
    });})();
 
卓越飞翔博客
上一篇: 使用python批量将doc文档转换为docx
下一篇: C#分页WEB+WinForm,都是一句代码实现分页

相关推荐

留言与评论(共有 0 条评论)
   
验证码:
隐藏边栏