2023-04-08 07:41:34 +00:00
|
|
|
#include <regex>
|
|
|
|
|
|
|
|
#include "blankie/murl.h"
|
|
|
|
|
|
|
|
#include "pixivmodels.h"
|
|
|
|
#include "numberhelper.h"
|
|
|
|
|
|
|
|
static inline std::optional<std::string> get_1920x960_cover_image(blankie::murl::Url url);
|
2023-04-09 08:12:05 +00:00
|
|
|
static inline std::optional<std::string> get_original_cover_image(blankie::murl::Url url, const nlohmann::json& cover_image);
|
2023-04-08 07:41:34 +00:00
|
|
|
static inline std::optional<std::string> get_original_profile_picture(blankie::murl::Url url);
|
2023-04-28 08:39:09 +00:00
|
|
|
static inline std::optional<std::string> get_360x360_illust_thumbnail(blankie::murl::Url url);
|
2023-04-08 16:06:56 +00:00
|
|
|
static Images get_profile_pictures(const nlohmann::json& j);
|
2023-05-01 04:10:15 +00:00
|
|
|
static Images get_profile_pictures(const std::string& url);
|
2023-05-07 17:22:48 +00:00
|
|
|
static std::optional<std::pair<uint64_t, uint64_t>> get_thumbnail_size(blankie::murl::Url thumbnail_url, std::optional<std::pair<uint64_t, uint64_t>> original_size);
|
|
|
|
static Images get_illust_images(const nlohmann::json& image, std::optional<nlohmann::json> image_metadata);
|
2023-04-08 07:41:34 +00:00
|
|
|
|
2023-05-07 17:22:48 +00:00
|
|
|
const Image& Images::original_or_thumbnail() const {
|
2023-04-08 07:41:34 +00:00
|
|
|
if (this->original) {
|
|
|
|
return *this->original;
|
|
|
|
}
|
|
|
|
if (!this->thumbnails.empty()) {
|
|
|
|
return this->thumbnails.back();
|
|
|
|
}
|
|
|
|
throw std::runtime_error("Images does not contain any images");
|
|
|
|
}
|
|
|
|
|
2023-05-07 17:22:48 +00:00
|
|
|
const Image& Images::thumbnail_or_original(size_t back) const {
|
2023-04-09 13:50:44 +00:00
|
|
|
if (this->thumbnails.size() > back) {
|
|
|
|
return this->thumbnails[this->thumbnails.size() - back - 1];
|
|
|
|
}
|
2023-04-08 07:41:34 +00:00
|
|
|
if (!this->thumbnails.empty()) {
|
|
|
|
return this->thumbnails.back();
|
|
|
|
}
|
|
|
|
if (this->original) {
|
|
|
|
return *this->original;
|
|
|
|
}
|
|
|
|
throw std::runtime_error("Images does not contain any images");
|
|
|
|
}
|
|
|
|
|
|
|
|
void from_json(const nlohmann::json& j, User& user) {
|
|
|
|
j.at("user_account").get_to(user.username);
|
|
|
|
j.at("user_name").get_to(user.display_name);
|
|
|
|
user.user_id = to_ull(j.at("user_id").get_ref<const nlohmann::json::string_t&>());
|
|
|
|
|
|
|
|
if (j.contains("cover_image") && j["cover_image"].is_object()) {
|
|
|
|
nlohmann::json cover_image = j["cover_image"];
|
|
|
|
std::string c_720x360 = cover_image.at("profile_cover_image").at("720x360").get<std::string>();
|
2023-04-09 08:12:05 +00:00
|
|
|
std::optional<std::string> original = get_original_cover_image(c_720x360, cover_image);
|
2023-04-08 07:41:34 +00:00
|
|
|
std::optional<std::string> c_1920x960 = get_1920x960_cover_image(c_720x360);
|
|
|
|
|
|
|
|
user.cover_images = {std::move(original), {std::move(c_720x360)}};
|
|
|
|
if (c_1920x960) {
|
|
|
|
user.cover_images->thumbnails.push_back(std::move(*c_1920x960));
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-04-08 16:06:56 +00:00
|
|
|
user.profile_pictures = get_profile_pictures(j.at("profile_img"));
|
2023-04-08 07:41:34 +00:00
|
|
|
|
2023-04-08 08:48:36 +00:00
|
|
|
if (j.contains("user_webpage")) {
|
|
|
|
std::string user_webpage = j.at("user_webpage").get<std::string>();
|
|
|
|
if (!user_webpage.empty()) {
|
|
|
|
user.links.push_back({"Webpage", std::move(user_webpage)});
|
|
|
|
}
|
2023-04-08 07:41:34 +00:00
|
|
|
}
|
|
|
|
auto add_social_as_needed = [&](const char* key, const char* public_name) {
|
2023-04-08 08:48:36 +00:00
|
|
|
nlohmann::json social = j["social"];
|
2023-04-08 07:41:34 +00:00
|
|
|
if (!social.contains(key)) {
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
std::string url = social[key].at("url").get<std::string>();
|
|
|
|
user.links.push_back({public_name, std::move(url)});
|
|
|
|
};
|
2023-04-08 08:48:36 +00:00
|
|
|
if (j.contains("social") && j["social"].is_object()) {
|
|
|
|
add_social_as_needed("twitter", "Twitter");
|
|
|
|
add_social_as_needed("instagram", "Instagram");
|
|
|
|
add_social_as_needed("tumblr", "Tumblr");
|
|
|
|
add_social_as_needed("facebook", "Facebook");
|
|
|
|
add_social_as_needed("circlems", "Circle.ms");
|
|
|
|
add_social_as_needed("pawoo", "Pawoo");
|
|
|
|
}
|
2023-04-08 07:41:34 +00:00
|
|
|
}
|
|
|
|
|
2023-04-08 16:06:56 +00:00
|
|
|
void from_json(const nlohmann::json& j, Tag& tag) {
|
|
|
|
j.at("tag").get_to(tag.japanese);
|
|
|
|
if (j.contains("translation")) {
|
|
|
|
tag.english = j["translation"].get<std::string>();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
void from_json(const nlohmann::json& j, Illust& illust) {
|
|
|
|
bool full_data = j.contains("illust_details");
|
|
|
|
const nlohmann::json& author_details = j.at("author_details");
|
|
|
|
const nlohmann::json& illust_details = full_data ? j.at("illust_details") : j;
|
2023-05-08 10:47:51 +00:00
|
|
|
std::optional<nlohmann::json> images_metadata = illust_details.contains("illust_images")
|
|
|
|
? std::optional(illust_details["illust_images"])
|
|
|
|
: std::nullopt;
|
2023-04-08 16:06:56 +00:00
|
|
|
|
|
|
|
author_details.at("user_account").get_to(illust.username);
|
2023-04-09 13:31:50 +00:00
|
|
|
author_details.at("user_name").get_to(illust.user_display_name);
|
2023-04-08 16:06:56 +00:00
|
|
|
illust.user_id = to_ull(author_details.at("user_id").get_ref<const nlohmann::json::string_t&>());
|
|
|
|
if (full_data) {
|
|
|
|
illust.user_profile_pictures = get_profile_pictures(author_details.at("profile_img"));
|
|
|
|
}
|
|
|
|
|
|
|
|
illust.illust_id = to_ull(illust_details.at("id").get_ref<const nlohmann::json::string_t&>());
|
|
|
|
illust_details.at("title").get_to(illust.title);
|
2023-04-09 13:31:50 +00:00
|
|
|
illust.ai_generated = illust_details.at("ai_type").get<int>() == 2;
|
2023-04-08 16:06:56 +00:00
|
|
|
illust_details.at("upload_timestamp").get_to(illust.upload_time);
|
|
|
|
|
2023-04-08 16:27:45 +00:00
|
|
|
if (full_data) {
|
2023-04-09 15:15:53 +00:00
|
|
|
if (illust_details.contains("comment") && illust_details["comment"].is_string()) {
|
|
|
|
illust.comment = illust_details["comment"].get<std::string>();
|
2023-04-08 16:27:45 +00:00
|
|
|
}
|
2023-04-08 16:34:55 +00:00
|
|
|
illust_details.at("display_tags").get_to(illust.tags);
|
2023-04-08 16:06:56 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
if (illust_details.contains("manga_a")) {
|
|
|
|
const nlohmann::json& manga_a = illust_details["manga_a"];
|
|
|
|
illust.images.reserve(manga_a.size());
|
2023-05-07 17:22:48 +00:00
|
|
|
|
|
|
|
for (size_t i = 0; i < manga_a.size(); i++) {
|
2023-05-08 10:47:51 +00:00
|
|
|
illust.images.push_back(get_illust_images(manga_a[i], images_metadata ? std::optional(images_metadata->at(i)) : std::nullopt));
|
2023-04-08 16:06:56 +00:00
|
|
|
}
|
|
|
|
} else {
|
2023-05-08 10:47:51 +00:00
|
|
|
illust.images = {get_illust_images(illust_details, images_metadata ? std::optional(images_metadata->at(0)) : std::nullopt)};
|
2023-04-08 16:06:56 +00:00
|
|
|
}
|
2023-05-05 16:28:33 +00:00
|
|
|
illust.page_count = to_ull(illust_details.at("page_count").get_ref<const nlohmann::json::string_t&>());
|
2023-04-08 16:06:56 +00:00
|
|
|
}
|
|
|
|
|
2023-04-08 16:27:45 +00:00
|
|
|
void from_json(const nlohmann::json& j, Illusts& illusts) {
|
|
|
|
j.at("illusts").get_to(illusts.illusts);
|
|
|
|
j.at("total").get_to(illusts.total_illusts);
|
|
|
|
j.at("lastPage").get_to(illusts.total_pages);
|
|
|
|
}
|
|
|
|
|
2023-05-01 04:10:15 +00:00
|
|
|
void from_json(const nlohmann::json& j, SearchResults& search_results) {
|
|
|
|
const nlohmann::json& tag_translations = j.at("tagTranslation");
|
|
|
|
auto get_translated_tag = [&](const std::string& japanese) -> std::optional<std::string> {
|
|
|
|
if (!tag_translations.is_object() || !tag_translations.contains(japanese)) {
|
|
|
|
return std::nullopt;
|
|
|
|
}
|
|
|
|
const nlohmann::json& tag = tag_translations[japanese];
|
|
|
|
return tag.contains("en")
|
|
|
|
? std::optional(tag["en"].get<std::string>())
|
|
|
|
: std::nullopt;
|
|
|
|
};
|
|
|
|
|
|
|
|
const nlohmann::json& illusts = j.at("illust").at("data");
|
|
|
|
search_results.illusts.illusts.reserve(illusts.size());
|
|
|
|
for (const nlohmann::json& i : illusts) {
|
|
|
|
const nlohmann::json& i_tags = i.at("tags");
|
|
|
|
std::vector<Tag> tags;
|
|
|
|
tags.reserve(i_tags.size());
|
|
|
|
|
|
|
|
for (const nlohmann::json& tag : i_tags) {
|
|
|
|
std::string japanese = tag.get<std::string>();
|
|
|
|
tags.push_back({japanese, get_translated_tag(std::move(japanese))});
|
|
|
|
}
|
|
|
|
|
|
|
|
Illust illust = {
|
|
|
|
.username = "",
|
|
|
|
.user_display_name = i.at("userName").get<std::string>(),
|
|
|
|
.user_id = to_ull(i.at("userId").get<std::string>()),
|
|
|
|
.user_profile_pictures = get_profile_pictures(i.at("profileImageUrl").get<std::string>()),
|
|
|
|
|
|
|
|
.illust_id = to_ull(i.at("id").get<std::string>()),
|
|
|
|
.title = i.at("title").get<std::string>(),
|
|
|
|
.ai_generated = i.at("aiType").get<int>() == 2,
|
|
|
|
// pixiv does have a createDate field, but it can't be portably parsed by strptime
|
|
|
|
// and i cba to use regex for it, especially when it's not even used in this context
|
|
|
|
.upload_time = -1,
|
|
|
|
|
|
|
|
.comment = std::nullopt,
|
|
|
|
.tags = std::move(tags),
|
2023-05-07 17:22:48 +00:00
|
|
|
.images = {get_illust_images(i, std::nullopt)},
|
2023-05-05 16:28:33 +00:00
|
|
|
.page_count = i.at("pageCount").get<size_t>()
|
2023-05-01 04:10:15 +00:00
|
|
|
};
|
|
|
|
search_results.illusts.illusts.push_back(illust);
|
|
|
|
}
|
|
|
|
|
|
|
|
j.at("illust").at("total").get_to(search_results.illusts.total_illusts);
|
|
|
|
search_results.illusts.total_pages = search_results.illusts.total_illusts / 60;
|
|
|
|
if (search_results.illusts.total_illusts % 60 != 0) {
|
|
|
|
search_results.illusts.total_pages++;
|
|
|
|
}
|
|
|
|
if (search_results.illusts.total_pages > 10) {
|
|
|
|
search_results.illusts.total_pages = 10;
|
|
|
|
}
|
|
|
|
|
|
|
|
search_results.tag_translations.reserve(tag_translations.size());
|
|
|
|
for (auto &[key, val] : tag_translations.items()) {
|
|
|
|
std::optional<std::string> translated_tag = get_translated_tag(key);
|
|
|
|
if (translated_tag) {
|
|
|
|
search_results.tag_translations.insert({std::move(key), std::move(*translated_tag)});
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
void from_json(const nlohmann::json& j, SearchSuggestion& search_suggestion) {
|
|
|
|
j.at("tag_name").get_to(search_suggestion.tag);
|
|
|
|
if (j.at("type").get_ref<const nlohmann::json::string_t&>() == "tag_translation") {
|
|
|
|
search_suggestion.english_tag = j.at("tag_translation").get<std::string>();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-04-08 07:41:34 +00:00
|
|
|
static std::regex resolution_path_regex("/c/(\\d+x\\d+)(.+)");
|
|
|
|
static inline std::optional<std::string> get_1920x960_cover_image(blankie::murl::Url url) {
|
|
|
|
std::smatch sm;
|
|
|
|
if (!std::regex_match(url.path, sm, resolution_path_regex)) {
|
|
|
|
return std::nullopt;
|
|
|
|
}
|
|
|
|
if (sm[1] == "1920x960") {
|
|
|
|
return std::nullopt;
|
|
|
|
}
|
|
|
|
url.path = "/c/1920x960" + sm.str(2);
|
|
|
|
return url.to_string();
|
|
|
|
}
|
|
|
|
|
2023-04-09 08:02:44 +00:00
|
|
|
static std::regex thumbnail_path_regex("/c/[^/]+(/.+)_master\\d+(\\.\\w{3,4})?");
|
2023-04-09 08:12:05 +00:00
|
|
|
static inline std::optional<std::string> get_original_cover_image(blankie::murl::Url url, const nlohmann::json& cover_image) {
|
2023-04-08 07:41:34 +00:00
|
|
|
std::smatch sm;
|
|
|
|
if (!std::regex_match(url.path, sm, thumbnail_path_regex)) {
|
|
|
|
return std::nullopt;
|
|
|
|
}
|
2023-04-09 08:12:05 +00:00
|
|
|
|
|
|
|
url.path = sm.str(1);
|
|
|
|
if (cover_image.contains("profile_cover_ext") && cover_image["profile_cover_ext"].is_string()
|
|
|
|
&& !cover_image["profile_cover_ext"].get_ref<const nlohmann::json::string_t&>().empty()) {
|
|
|
|
url.path += '.';
|
|
|
|
url.path += cover_image["profile_cover_ext"].get<std::string>();
|
|
|
|
} else {
|
|
|
|
url.path += sm.str(2);
|
|
|
|
}
|
2023-04-08 07:41:34 +00:00
|
|
|
return url.to_string();
|
|
|
|
}
|
|
|
|
|
|
|
|
static std::regex profile_picture_thumbnail_path_regex("(/.+)_\\d{2,}(\\.\\w{3,4})");
|
|
|
|
static inline std::optional<std::string> get_original_profile_picture(blankie::murl::Url url) {
|
|
|
|
std::smatch sm;
|
|
|
|
if (!std::regex_match(url.path, sm, profile_picture_thumbnail_path_regex)) {
|
|
|
|
return std::nullopt;
|
|
|
|
}
|
|
|
|
url.path = sm.str(1) + sm.str(2);
|
|
|
|
return url.to_string();
|
|
|
|
}
|
2023-04-08 16:06:56 +00:00
|
|
|
|
|
|
|
static Images get_profile_pictures(const nlohmann::json& j) {
|
|
|
|
Images images;
|
|
|
|
|
|
|
|
if (j.contains("main_s")) {
|
|
|
|
images.thumbnails.push_back(j["main_s"].get<std::string>());
|
|
|
|
}
|
|
|
|
images.thumbnails.push_back(j.at("main").get<std::string>());
|
2023-05-07 17:22:48 +00:00
|
|
|
images.original = get_original_profile_picture(images.thumbnails.back().url);
|
2023-04-08 16:06:56 +00:00
|
|
|
|
|
|
|
return images;
|
|
|
|
}
|
|
|
|
|
2023-05-01 04:10:15 +00:00
|
|
|
static Images get_profile_pictures(const std::string& url) {
|
|
|
|
return {
|
|
|
|
.original = get_original_profile_picture(url),
|
|
|
|
.thumbnails = {url}
|
|
|
|
};
|
|
|
|
}
|
|
|
|
|
2023-04-28 08:39:09 +00:00
|
|
|
static std::regex illust_360x360_thumbnail_path_regex(
|
|
|
|
"(?:/c/[^/]+?/img-master|/img-original)?"
|
|
|
|
"(/img/.*/\\d+_p\\d+)(?:_master1200|_square1200)?\\.\\w{3,4}"
|
|
|
|
);
|
|
|
|
static inline std::optional<std::string> get_360x360_illust_thumbnail(blankie::murl::Url url) {
|
|
|
|
using namespace std::string_literals;
|
|
|
|
|
|
|
|
std::smatch sm;
|
|
|
|
if (!std::regex_match(url.path, sm, illust_360x360_thumbnail_path_regex)) {
|
|
|
|
return std::nullopt;
|
|
|
|
}
|
|
|
|
url.path = "/c/360x360_10_webp/img-master"s + sm.str(1) + "_square1200.jpg";
|
|
|
|
return url.to_string();
|
|
|
|
}
|
|
|
|
|
2023-05-07 17:22:48 +00:00
|
|
|
static std::regex illust_size_regex(
|
|
|
|
"/c/(\\d+)x(\\d+)[/_].+"
|
|
|
|
);
|
|
|
|
static std::optional<std::pair<uint64_t, uint64_t>> get_thumbnail_size(blankie::murl::Url thumbnail_url, std::optional<std::pair<uint64_t, uint64_t>> original_size) {
|
|
|
|
if (!original_size) {
|
|
|
|
return std::nullopt;
|
|
|
|
}
|
|
|
|
|
|
|
|
std::smatch sm;
|
|
|
|
if (!std::regex_match(thumbnail_url.path, sm, illust_size_regex)) {
|
|
|
|
return std::nullopt;
|
|
|
|
}
|
|
|
|
|
|
|
|
uint64_t thumbnail_width = to_ull(sm.str(1));
|
|
|
|
// uint64_t thumbnail_height = to_ull(sm.str(2));
|
|
|
|
|
|
|
|
std::pair<uint64_t, uint64_t> real_thumbnail_size = {
|
|
|
|
thumbnail_width,
|
|
|
|
// derived from original_size->second / (original_size->first / thumbnail_width)
|
|
|
|
// to make it more accurate without using floats
|
|
|
|
original_size->second * thumbnail_width / original_size->first
|
|
|
|
};
|
|
|
|
return real_thumbnail_size;
|
|
|
|
}
|
|
|
|
|
|
|
|
static Images get_illust_images(const nlohmann::json& image, std::optional<nlohmann::json> image_metadata) {
|
2023-04-08 16:06:56 +00:00
|
|
|
Images images;
|
2023-04-28 08:39:09 +00:00
|
|
|
ssize_t add_360x360_to = -1;
|
2023-05-07 17:22:48 +00:00
|
|
|
std::optional<std::pair<uint64_t, uint64_t>> original_size;
|
|
|
|
|
|
|
|
if (image_metadata) {
|
|
|
|
original_size = {
|
|
|
|
to_ull(image_metadata->at("illust_image_width").get_ref<const nlohmann::json::string_t&>()),
|
|
|
|
to_ull(image_metadata->at("illust_image_height").get_ref<const nlohmann::json::string_t&>())
|
|
|
|
};
|
|
|
|
}
|
2023-04-08 16:06:56 +00:00
|
|
|
|
|
|
|
auto add_if_exists = [&](const char* key) {
|
2023-05-07 17:22:48 +00:00
|
|
|
if (!image.contains(key) || !image[key].is_string()) {
|
|
|
|
return false;
|
2023-04-08 16:06:56 +00:00
|
|
|
}
|
2023-05-07 17:22:48 +00:00
|
|
|
std::string url = image[key].get<std::string>();
|
|
|
|
images.thumbnails.push_back({url, get_thumbnail_size(url, original_size)});
|
|
|
|
return true;
|
2023-04-08 16:06:56 +00:00
|
|
|
};
|
|
|
|
add_if_exists("url_ss");
|
|
|
|
add_if_exists("url_placeholder");
|
2023-04-09 14:11:07 +00:00
|
|
|
add_if_exists("url_small");
|
2023-04-28 08:39:09 +00:00
|
|
|
if (!add_if_exists("url_s")) {
|
|
|
|
add_360x360_to = static_cast<ssize_t>(images.thumbnails.size());
|
|
|
|
}
|
2023-04-08 16:06:56 +00:00
|
|
|
add_if_exists("url");
|
2023-05-07 17:22:48 +00:00
|
|
|
if (image.contains("url_big") && image["url_big"].is_string()) {
|
|
|
|
images.original = {image["url_big"].get<std::string>(), original_size};
|
2023-04-08 16:06:56 +00:00
|
|
|
}
|
|
|
|
|
2023-04-28 08:39:09 +00:00
|
|
|
if (add_360x360_to >= 0) {
|
2023-05-07 17:22:48 +00:00
|
|
|
std::optional<std::string> c_360x360 = get_360x360_illust_thumbnail(images.original_or_thumbnail().url);
|
2023-04-28 08:39:09 +00:00
|
|
|
if (c_360x360) {
|
2023-05-07 17:22:48 +00:00
|
|
|
images.thumbnails.insert(images.thumbnails.begin() + add_360x360_to, {*c_360x360, get_thumbnail_size(*c_360x360, original_size)});
|
2023-04-28 08:39:09 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-04-08 16:06:56 +00:00
|
|
|
return images;
|
|
|
|
}
|