aboutsummaryrefslogtreecommitdiff
path: root/src/plugins/Manganelo.cpp
blob: 7af35a63ec52d48a78904d89d41727198a3f0961 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
#include "../../plugins/Manganelo.hpp"
#include <quickmedia/HtmlSearch.h>
#include <json/reader.h>

namespace QuickMedia {
    SearchResult Manganelo::search(const std::string &url, BodyItems &result_items) {
        std::string website_data;
        if(download_to_string(url, website_data) != DownloadResult::OK)
            return SearchResult::NET_ERR;

        QuickMediaHtmlSearch html_search;
        int result = quickmedia_html_search_init(&html_search, website_data.c_str());
        if(result != 0)
            goto cleanup;

        result = quickmedia_html_find_nodes_xpath(&html_search, "//div[class='chapter-list']/div[class='row']//a",
            [](QuickMediaHtmlNode *node, void *userdata) {
                auto *item_data = (BodyItems*)userdata;
                const char *href = quickmedia_html_node_get_attribute_value(node, "href");
                const char *text = quickmedia_html_node_get_text(node);
                if(href && text) {
                    auto item = std::make_unique<BodyItem>(strip(text));
                    item->url = href;
                    item_data->push_back(std::move(item));
                }
            }, &result_items);

        cleanup:
        quickmedia_html_search_deinit(&html_search);
        return result == 0 ? SearchResult::OK : SearchResult::ERR;
    }

    // Returns true if changed
    static bool remove_html_span(std::string &str) {
        size_t open_tag_start = str.find("<span");
        if(open_tag_start == std::string::npos)
            return false;

        size_t open_tag_end = str.find('>', open_tag_start + 5);
        if(open_tag_end == std::string::npos)
            return false;

        str.erase(open_tag_start, open_tag_end - open_tag_start + 1);

        size_t close_tag = str.find("</span>");
        if(close_tag == std::string::npos)
            return true;

        str.erase(close_tag, 7);
        return true;
    }

    SuggestionResult Manganelo::update_search_suggestions(const std::string &text, BodyItems &result_items) {
        std::string url = "https://manganelo.com/home_json_search";
        std::string search_term = "searchword=";
        search_term += url_param_encode(text);
        CommandArg data_arg = { "--data", std::move(search_term) };

        std::string server_response;
        if(download_to_string(url, server_response, {data_arg}) != DownloadResult::OK)
            return SuggestionResult::NET_ERR;

        if(server_response.empty())
            return SuggestionResult::OK;

        Json::Value json_root;
        Json::CharReaderBuilder json_builder;
        std::unique_ptr<Json::CharReader> json_reader(json_builder.newCharReader());
        std::string json_errors;
        if(!json_reader->parse(&server_response[0], &server_response[server_response.size()], &json_root, &json_errors)) {
            fprintf(stderr, "Manganelo suggestions json error: %s\n", json_errors.c_str());
            return SuggestionResult::ERR;
        }

        if(json_root.isArray()) {
            for(const Json::Value &child : json_root) {
                if(child.isObject()) {
                    Json::Value name = child.get("name", "");
                    Json::Value nameunsigned = child.get("nameunsigned", "");
                    if(name.isString() && name.asCString()[0] != '\0' && nameunsigned.isString() && nameunsigned.asCString()[0] != '\0') {
                        std::string name_str = name.asString();
                        while(remove_html_span(name_str)) {}
                        auto item = std::make_unique<BodyItem>(strip(name_str));
                        item->url = "https://manganelo.com/manga/" + url_param_encode(nameunsigned.asString());
                        Json::Value image = child.get("image", "");
                        if(image.isString() && image.asCString()[0] != '\0')
                            item->thumbnail_url = image.asString();
                        result_items.push_back(std::move(item));
                    }
                }
            }
        }
        return SuggestionResult::OK;
    }

    ImageResult Manganelo::get_number_of_images(const std::string &url, int &num_images) {
        std::lock_guard<std::mutex> lock(image_urls_mutex);
        num_images = 0;
        ImageResult image_result = get_image_urls_for_chapter(url);
        if(image_result != ImageResult::OK)
            return image_result;

        num_images = last_chapter_image_urls.size();
        return ImageResult::OK;
    }

    ImageResult Manganelo::get_image_urls_for_chapter(const std::string &url) {
        if(url == last_chapter_url)
            return ImageResult::OK;

        last_chapter_image_urls.clear();

        std::string website_data;
        if(download_to_string(url, website_data) != DownloadResult::OK)
            return ImageResult::NET_ERR;

        QuickMediaHtmlSearch html_search;
        int result = quickmedia_html_search_init(&html_search, website_data.c_str());
        if(result != 0)
            goto cleanup;

        result = quickmedia_html_find_nodes_xpath(&html_search, "//div[id='vungdoc']/img",
            [](QuickMediaHtmlNode *node, void *userdata) {
                auto *urls = (std::vector<std::string>*)userdata;
                const char *src = quickmedia_html_node_get_attribute_value(node, "src");
                if(src) {
                    // TODO: If image loads too slow, try switching mirror
                    std::string image_url = src;
                    //string_replace_all(image_url, "s3.mkklcdnv3.com", "bu.mkklcdnbuv1.com");
                    urls->emplace_back(std::move(image_url));
                }
            }, &last_chapter_image_urls);

        cleanup:
        quickmedia_html_search_deinit(&html_search);
        if(result == 0)
            last_chapter_url = url;
        return result == 0 ? ImageResult::OK : ImageResult::ERR;
    }

    ImageResult Manganelo::for_each_page_in_chapter(const std::string &chapter_url, PageCallback callback) {
        std::vector<std::string> image_urls;
        {
            std::lock_guard<std::mutex> lock(image_urls_mutex);
            ImageResult image_result = get_image_urls_for_chapter(chapter_url);
            if(image_result != ImageResult::OK)
                return image_result;

            image_urls = last_chapter_image_urls;
        }

        for(const std::string &url : image_urls) {
            if(!callback(url))
                break;
        }
        return ImageResult::OK;
    }
}