toonily spider

toonily 简易爬虫

θα χρειαστεί να εγκαταστήσετε μια επέκταση όπως το Tampermonkey, το Greasemonkey ή το Violentmonkey για να εγκαταστήσετε αυτόν τον κώδικα.

θα χρειαστεί να εγκαταστήσετε μια επέκταση όπως το Tampermonkey ή το Violentmonkey για να εγκαταστήσετε αυτόν τον κώδικα.

θα χρειαστεί να εγκαταστήσετε μια επέκταση όπως το Tampermonkey ή το Violentmonkey για να εγκαταστήσετε αυτόν τον κώδικα.

θα χρειαστεί να εγκαταστήσετε μια επέκταση όπως το Tampermonkey ή το Userscripts για να εγκαταστήσετε αυτόν τον κώδικα.

You will need to install an extension such as Tampermonkey to install this script.

Θα χρειαστεί να εγκαταστήσετε μια επέκταση διαχείρισης κώδικα χρήστη για να εγκαταστήσετε αυτόν τον κώδικα.

(Έχω ήδη έναν διαχειριστή κώδικα χρήστη, επιτρέψτε μου να τον εγκαταστήσω!)

You will need to install an extension such as Stylus to install this style.

You will need to install an extension such as Stylus to install this style.

You will need to install an extension such as Stylus to install this style.

You will need to install a user style manager extension to install this style.

You will need to install a user style manager extension to install this style.

You will need to install a user style manager extension to install this style.

(Έχω ήδη έναν διαχειριστή στυλ χρήστη, επιτρέψτε μου να τον εγκαταστήσω!)

// ==UserScript==
// @name         toonily spider
// @namespace    obgnail
// @description  toonily 简易爬虫
// @version      0.3
// @author       obgnail
// @license      MIT
// @match        https://toonily.com/webtoon/*
// @icon         https://www.google.com/s2/favicons?domain=toonily.com
// @grant        GM.xmlHttpRequest
// @run-at       document-body
// ==/UserScript==


(function () {
    'use strict';

    const Limit = 2 // n requests per second

    const DEFAULT_HEADERS = {
        "referer": "https://toonily.com/",
        "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/111.0.0.0 Safari/537.36"
    }

    const BUTTON_ID = "btn-read-download"

    let getXmlHttpRequest = () => {
        return (typeof GM !== "undefined" && GM !== null ? GM.xmlHttpRequest : GM_xmlhttpRequest);
    }

    let insertDownloadButton = () => {
        const links = document.getElementById("init-links");
        if (links === null) {
            return
        }

        const button = document.createElement("a");
        button.id = BUTTON_ID
        button.className = "c-btn c-btn_style-1";
        button.href = "javascript:;"
        button.innerHTML = "download";
        button.addEventListener("click", download)

        links.appendChild(button);
    }

    let RequestCount = {
        count: 1,
        total: 0,
        done: () => {
            let button = document.getElementById(BUTTON_ID);
            button.innerText = `download (${RequestCount.count}/${RequestCount.total})`;
            RequestCount.count++;
        },
    }

    class RequestLimit {
        constructor(options) {
            this.unRequsetFn = [];
            this.limit = options.limit || 2;
            this.requestCount = 0;
        }

        async push(fn) {
            if (this.requestCount >= this.limit) {
                await new Promise((resolve) => this.unRequsetFn.push(resolve));
            }
            return this._handlerReq(fn);
        }

        async _handlerReq(fn) {
            this.requestCount++;
            try {
                return await fn();
            } catch (err) {
                return Promise.reject(err);
            } finally {
                this.requestCount--;
                if (this.unRequsetFn.length) {
                    this.unRequsetFn[0]();
                    this.unRequsetFn.shift();
                }
            }
        }
    }

    let requestLimit = new RequestLimit({limit: Limit});

    let request = (url, responseType, callback) => {
        requestLimit.push(() => {
                return new Promise(resolve => {
                    setTimeout(() => {
                        _request(url, responseType, callback)
                        resolve();
                    }, 1000)
                });
            }
        );
    }

    let _request = (url, responseType, callback) => {
        getXmlHttpRequest()({
            method: "GET",
            url: url,
            responseType: responseType,
            headers: DEFAULT_HEADERS,
            onload: resp => {
                if (resp.readyState === 4 && resp.status === 200) {
                    callback(resp)
                } else if (resp.readyState === 4 && resp.status === 404) {
                    callback(null)
                }
            },
            onerror: resp => {
                console.log("request on error", url)
            },
            ontimeout: resp => {
                console.log("request on timeout", url)
            }
        });
    }

    let defaultRequest = (url, callback) => request(url, "text", callback)

    let requestImage = (url, fileName) => {
        request(url, "blob", resp => {
            if (resp === null) {
                console.log("request image err")
                return
            }
            const link = document.createElement('a');
            link.href = window.URL.createObjectURL(resp.response);
            link.download = fileName;
            link.click();
            link.remove();
            RequestCount.done()
        })
    }

    let download = () => {
        let button = document.getElementById(BUTTON_ID);
        button.innerText = `searching...`;
        button.style.cssText += 'pointer-events: none; background-color: #0f0f0f';

        defaultRequest(window.location.href, resp => {
            if (resp === null) {
                console.log("request chapters error")
                return
            }
            const dom = new DOMParser().parseFromString(resp.responseText, "text/html");
            const chapters = parseFirstPage(dom);
            // chapters = [chapters[0], chapters[1]]  // debug
            downloadChapterImages(chapters);
        })
    }

    let parseFirstPage = (dom) => {
        let chapters = []
        const content = dom.querySelectorAll("#manga-content-tabs .listing-chapters_wrap .wp-manga-chapter a")

        for (let i = content.length - 1; i >= 0; i--) {
            chapters.push({
                "name": content[i].innerHTML.trim(),
                "url": content[i].getAttribute("href"),
            })
        }
        return chapters
    }

    let downloadChapterImages = (chapters) => {
        if (chapters === null || chapters.length === 0) {
            console.log("chapters is null")
            return
        }
        chapters.forEach(ele => downloadChapterImage(ele))
    }

    let downloadChapterImage = (chapter) => {
        defaultRequest(chapter.url, resp => {
            const dom = new DOMParser().parseFromString(resp.responseText, "text/html");
            let images = parseDetailPath(dom);

            RequestCount.total += images.length

            images.forEach(ele => {
                requestImage(ele.url, chapter.name + "-" + ele.name)
            })
        })
    }

    let parseDetailPath = (dom) => {
        let images = []
        const content = dom.querySelectorAll(".read-container .reading-content img")
        content.forEach(ele => {
            images.push({
                "name": ele.getAttribute("id"),
                "url": ele.getAttribute("data-src").trim(),
            })
        })
        return images
    }

    insertDownloadButton()
})();