From a0dbe64272d051671bc120b1845c7485264b097d Mon Sep 17 00:00:00 2001 From: dec05eba Date: Sun, 7 Jun 2020 04:31:30 +0200 Subject: Add support for mangatown --- src/plugins/Mangadex.cpp | 14 +--- src/plugins/Mangatown.cpp | 207 ++++++++++++++++++++++++++++++++++++++++++++++ 2 files changed, 211 insertions(+), 10 deletions(-) create mode 100644 src/plugins/Mangatown.cpp (limited to 'src/plugins') diff --git a/src/plugins/Mangadex.cpp b/src/plugins/Mangadex.cpp index 3518d4a..b3c5e36 100644 --- a/src/plugins/Mangadex.cpp +++ b/src/plugins/Mangadex.cpp @@ -5,7 +5,6 @@ #include static const std::string mangadex_url = "https://mangadex.org"; -static const std::string useragent_str = "user-agent: Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/81.0.4044.138 Safari/537.36"; namespace QuickMedia { static std::string title_url_extract_manga_id(const std::string &url) { @@ -35,12 +34,10 @@ namespace QuickMedia { }; SearchResult Mangadex::search(const std::string &url, BodyItems &result_items) { - CommandArg user_agent_arg = { "-H", useragent_str }; - std::string manga_id = title_url_extract_manga_id(url); std::string request_url = "https://mangadex.org/api/?id=" + manga_id + "&type=manga"; std::string server_response; - if(download_to_string(request_url, server_response, {std::move(user_agent_arg)}, use_tor) != DownloadResult::OK) + if(download_to_string(request_url, server_response, {}, use_tor, true) != DownloadResult::OK) return SearchResult::NET_ERR; if(server_response.empty()) @@ -170,10 +167,9 @@ namespace QuickMedia { std::string url = "https://mangadex.org/search?title="; url += url_param_encode(text); CommandArg cookie_arg = { "-H", "cookie: mangadex_rememberme_token=" + rememberme_token }; - CommandArg user_agent_arg = { "-H", useragent_str }; std::string website_data; - if(download_to_string(url, website_data, {std::move(cookie_arg), std::move(user_agent_arg)}, use_tor) != DownloadResult::OK) + if(download_to_string(url, website_data, {std::move(cookie_arg)}, use_tor, true) != DownloadResult::OK) return SuggestionResult::NET_ERR; QuickMediaHtmlSearch html_search; @@ -226,10 +222,9 @@ namespace QuickMedia { } bool Mangadex::save_mangadex_cookies(const std::string &url, const std::string &cookie_filepath) { - CommandArg user_agent_arg = { "-H", useragent_str }; CommandArg cookie_arg = { "-c", std::move(cookie_filepath) }; std::string server_response; - if(download_to_string(url, server_response, {std::move(user_agent_arg), std::move(cookie_arg)}, use_tor) != DownloadResult::OK) + if(download_to_string(url, server_response, {std::move(cookie_arg)}, use_tor, true) != DownloadResult::OK) return false; return true; @@ -248,12 +243,11 @@ namespace QuickMedia { if(!save_mangadex_cookies(url, cookie_filepath)) return ImageResult::ERR; - CommandArg user_agent_arg = { "-H", useragent_str }; CommandArg cookie_arg = { "-b", std::move(cookie_filepath) }; std::string manga_id = chapter_url_extract_manga_id(url); std::string request_url = mangadex_url + "/api/?id=" + manga_id + "&server=null&type=chapter"; std::string server_response; - if(download_to_string(request_url, server_response, {std::move(user_agent_arg), std::move(cookie_arg)}, use_tor) != DownloadResult::OK) + if(download_to_string(request_url, server_response, {std::move(cookie_arg)}, use_tor, true) != DownloadResult::OK) return ImageResult::NET_ERR; if(server_response.empty()) diff --git a/src/plugins/Mangatown.cpp b/src/plugins/Mangatown.cpp new file mode 100644 index 0000000..90db349 --- /dev/null +++ b/src/plugins/Mangatown.cpp @@ -0,0 +1,207 @@ +#include "../../plugins/Mangatown.hpp" +#include "../../include/Notification.hpp" +#include +#include + +static const std::string mangatown_url = "https://www.mangatown.com"; + +namespace QuickMedia { + SearchResult Mangatown::search(const std::string &url, BodyItems &result_items) { + std::string website_data; + if(download_to_string(url, website_data, {}, use_tor, true) != DownloadResult::OK) + return SearchResult::NET_ERR; + + QuickMediaHtmlSearch html_search; + int result = quickmedia_html_search_init(&html_search, website_data.c_str()); + if(result != 0) + goto cleanup; + + result = quickmedia_html_find_nodes_xpath(&html_search, "//ul[class='chapter_list']//a", + [](QuickMediaHtmlNode *node, void *userdata) { + auto *item_data = (BodyItems*)userdata; + const char *href = quickmedia_html_node_get_attribute_value(node, "href"); + const char *text = quickmedia_html_node_get_text(node); + if(href && text && strncmp(href, "/manga/", 7) == 0) { + auto item = std::make_unique(strip(text)); + item->url = mangatown_url + href; + item_data->push_back(std::move(item)); + } + }, &result_items); + + cleanup: + quickmedia_html_search_deinit(&html_search); + return result == 0 ? SearchResult::OK : SearchResult::ERR; + } + + SuggestionResult Mangatown::update_search_suggestions(const std::string &text, BodyItems &result_items) { + std::string url = "https://www.mangatown.com/ajax/search/?query="; + url += url_param_encode(text); + + std::string server_response; + if(download_to_string(url, server_response, {}, use_tor, true) != DownloadResult::OK) + return SuggestionResult::NET_ERR; + + if(server_response.empty()) + return SuggestionResult::OK; + + Json::Value json_root; + Json::CharReaderBuilder json_builder; + std::unique_ptr json_reader(json_builder.newCharReader()); + std::string json_errors; + if(!json_reader->parse(&server_response[0], &server_response[server_response.size()], &json_root, &json_errors)) { + fprintf(stderr, "Mangatown suggestions json error: %s\n", json_errors.c_str()); + return SuggestionResult::ERR; + } + + if(!json_root.isObject()) + return SuggestionResult::OK; + + Json::Value &json_data = json_root["data"]; + Json::Value &json_suggestions = json_root["suggestions"]; + if(!json_data.isArray() || !json_suggestions.isArray()) + return SuggestionResult::OK; + + for(const Json::Value &child : json_suggestions) { + if(!child.isString()) { + result_items.push_back(std::make_unique("")); + continue; + } + result_items.push_back(std::make_unique(child.asString())); + } + + size_t index = 0; + for(const Json::Value &child : json_data) { + BodyItem *body_item = nullptr; + if(index < result_items.size()) { + body_item = result_items[index].get(); + } else { + result_items.push_back(std::make_unique("")); + body_item = result_items.back().get(); + } + + ++index; + + if(!child.isString()) + continue; + + body_item->url = mangatown_url + child.asString(); + } + + return SuggestionResult::OK; + } + + static bool is_number_with_zero_fill(const char *str) { + while(*str == '0') { ++str; } + return atoi(str) != 0; + } + + ImageResult Mangatown::get_number_of_images(const std::string &url, int &num_images) { + std::lock_guard lock(image_urls_mutex); + + num_images = last_num_pages; + if(url == last_chapter_url_num_images) + return ImageResult::OK; + + last_num_pages = 0; + + std::string website_data; + if(download_to_string(url, website_data, {}, use_tor, true) != DownloadResult::OK) + return ImageResult::NET_ERR; + + QuickMediaHtmlSearch html_search; + int result = quickmedia_html_search_init(&html_search, website_data.c_str()); + if(result != 0) + goto cleanup; + + result = quickmedia_html_find_nodes_xpath(&html_search, "//div[class='page_select']//option", + [](QuickMediaHtmlNode *node, void *userdata) { + int *last_num_pages = (int*)userdata; + const char *value = quickmedia_html_node_get_attribute_value(node, "value"); + const char *text = quickmedia_html_node_get_text(node); + if(value && strncmp(value, "/manga/", 7) == 0) { + if(is_number_with_zero_fill(text)) { + (*last_num_pages)++; + } + } + }, &last_num_pages); + + last_num_pages /= 2; + num_images = last_num_pages; + + cleanup: + quickmedia_html_search_deinit(&html_search); + + if(result == 0) + last_chapter_url_num_images = url; + if(last_num_pages == 0) { + last_chapter_url_num_images.clear(); + return ImageResult::ERR; + } + return result == 0 ? ImageResult::OK : ImageResult::ERR; + } + + ImageResult Mangatown::for_each_page_in_chapter(const std::string &chapter_url, PageCallback callback) { + int num_pages; + ImageResult image_result = get_number_of_images(chapter_url, num_pages); + if(image_result != ImageResult::OK) + return image_result; + + int result = 0; + int page_index = 1; + + while(true) { + std::string image_src; + std::string website_data; + std::string full_url = chapter_url + std::to_string(page_index++) + ".html"; + if(download_to_string(full_url, website_data, {}, use_tor, true) != DownloadResult::OK) + break; + + QuickMediaHtmlSearch html_search; + result = quickmedia_html_search_init(&html_search, website_data.c_str()); + if(result != 0) + goto cleanup; + + result = quickmedia_html_find_nodes_xpath(&html_search, "//div[id='viewer']//img", + [](QuickMediaHtmlNode *node, void *userdata) { + std::string *image_src = (std::string*)userdata; + const char *src = quickmedia_html_node_get_attribute_value(node, "src"); + if(src && strstr(src, "/store/manga/")) { + if(strncmp(src, "//", 2) == 0) + *image_src = src + 2; + else + *image_src = src; + } + }, &image_src); + + cleanup: + quickmedia_html_search_deinit(&html_search); + + if(result != 0) + return ImageResult::ERR; + + if(image_src.empty()) + break; + + if(!callback(image_src)) + break; + } + + return ImageResult::OK; + } + + bool Mangatown::extract_id_from_url(const std::string &url, std::string &manga_id) { + size_t start_index = url.find("/manga/"); + if(start_index == std::string::npos) + return false; + + start_index += 7; + size_t end_index = url.find("/", start_index); + if(end_index == std::string::npos) { + manga_id = url.substr(start_index); + return true; + } + + manga_id = url.substr(start_index, end_index - start_index); + return true; + } +} \ No newline at end of file -- cgit v1.2.3