// Source: mirror of https://github.com/Artikash/Textractor.git (synced 2025-01-10 01:33:51 +08:00)
// 195 lines, 5.2 KiB, C++
#include "qtcommon.h"
|
|
#include "extension.h"
|
|
#include "network.h"
|
|
#include <ctime>
|
|
|
|
extern const wchar_t* TRANSLATION_ERROR;
|
|
|
|
extern Synchronized<std::wstring> translateTo, apiKey;
|
|
|
|
const char* TRANSLATION_PROVIDER = "Google Translate";
|
|
const char* GET_API_KEY_FROM = "https://codelabs.developers.google.com/codelabs/cloud-translation-intro";
|
|
// Supported target languages, one entry per language in the form "<display name>: <code>".
// NOTE(review): the code after ": " is presumably what ends up in translateTo; the code that
// splits these entries is outside this file.
QStringList languages
{
	"Afrikaans: af",
	"Albanian: sq",
	"Amharic: am",
	"Arabic: ar",
	"Armenian: hy",
	"Azerbaijani: az",
	"Basque: eu",
	"Belarusian: be",
	"Bengali: bn",
	"Bosnian: bs",
	"Bulgarian: bg",
	"Catalan: ca",
	"Cebuano: ceb",
	"Chichewa: ny",
	"Chinese (simplified): zh",
	"Chinese (traditional): zh-TW",
	"Corsican: co",
	"Croatian: hr",
	"Czech: cs",
	"Danish: da",
	"Dutch: nl",
	"English: en",
	"Esperanto: eo",
	"Estonian: et",
	"Filipino: tl",
	"Finnish: fi",
	"French: fr",
	"Frisian: fy",
	"Galician: gl",
	"Georgian: ka",
	"German: de",
	"Greek: el",
	"Gujarati: gu",
	"Haitian Creole: ht",
	"Hausa: ha",
	"Hawaiian: haw",
	"Hebrew: iw",
	"Hindi: hi",
	"Hmong: hmn",
	"Hungarian: hu",
	"Icelandic: is",
	"Igbo: ig",
	"Indonesian: id",
	"Irish: ga",
	"Italian: it",
	"Japanese: ja",
	"Javanese: jw",
	"Kannada: kn",
	"Kazakh: kk",
	"Khmer: km",
	"Kinyarwanda: rw",
	"Korean: ko",
	"Kurdish (Kurmanji): ku",
	"Kyrgyz: ky",
	"Lao: lo",
	"Latin: la",
	"Latvian: lv",
	"Lithuanian: lt",
	"Luxembourgish: lb",
	"Macedonian: mk",
	"Malagasy: mg",
	"Malay: ms",
	"Malayalam: ml",
	"Maltese: mt",
	"Maori: mi",
	"Marathi: mr",
	"Mongolian: mn",
	"Myanmar (Burmese): my",
	"Nepali: ne",
	"Norwegian: no",
	"Odia (Oriya): or",
	"Pashto: ps",
	"Persian: fa",
	"Polish: pl",
	"Portuguese: pt",
	"Punjabi: pa",
	"Romanian: ro",
	"Russian: ru",
	"Samoan: sm",
	"Scots Gaelic: gd",
	"Serbian: sr",
	"Sesotho: st",
	"Shona: sn",
	"Sindhi: sd",
	"Sinhala: si",
	"Slovak: sk",
	"Slovenian: sl",
	"Somali: so",
	"Spanish: es",
	"Sundanese: su",
	"Swahili: sw",
	"Swedish: sv",
	"Tajik: tg",
	"Tamil: ta",
	"Tatar: tt",
	"Telugu: te",
	"Thai: th",
	"Turkish: tr",
	"Turkmen: tk",
	"Ukrainian: uk",
	"Urdu: ur",
	"Uyghur: ug",
	"Uzbek: uz",
	"Vietnamese: vi",
	"Welsh: cy",
	"Xhosa: xh",
	"Yiddish: yi",
	"Yoruba: yo",
	"Zulu: zu"
};
|
|
|
|
// Default settings for this translator. None of them is read in this file;
// NOTE(review): presumably consumed by shared translation code elsewhere — confirm.
bool translateSelectedOnly = false;
bool rateLimitAll = true;
bool rateLimitSelected = false;
bool useCache = true;
int tokenCount = 30;
int tokenRestoreDelay = 60000;
int maxSentenceSize = 500;

// Key scraped from translate.google.com and used to sign web-client requests.
// 0 means "no key available": GetTranslationUri() then falls back to the unsigned gtx client.
unsigned TKK = 0;
|
|
|
|
std::wstring GetTranslationUri(const std::wstring& text)
|
|
{
|
|
// If no TKK available, use this uri. Can't use too much or google will detect unauthorized access
|
|
if (!TKK) return FormatString(L"/translate_a/single?client=gtx&dt=ld&dt=rm&dt=t&tl=%s&q=%s", translateTo.Copy(), Escape(text));
|
|
|
|
// reverse engineered from translate.google.com
|
|
std::wstring escapedText;
|
|
unsigned a = time(NULL) / 3600, b = a; // the first part of TKK
|
|
for (unsigned char ch : WideStringToString(text))
|
|
{
|
|
escapedText += FormatString(L"%%%02X", (int)ch);
|
|
a += ch;
|
|
a += a << 10;
|
|
a ^= a >> 6;
|
|
}
|
|
a += a << 3;
|
|
a ^= a >> 11;
|
|
a += a << 15;
|
|
a ^= TKK;
|
|
a %= 1000000;
|
|
|
|
return FormatString(L"/translate_a/single?client=webapp&dt=ld&dt=rm&dt=t&sl=auto&tl=%s&tk=%u.%u&q=%s", translateTo.Copy(), a, a ^ b, escapedText);
|
|
}
|
|
|
|
// Returns true when `result` looks like a 32-character hash: exactly 32 characters, each a
// decimal digit or a lowercase ASCII letter. Translate() uses this to skip such segments.
bool IsHash(const std::wstring& result)
{
	// The element type must stay wchar_t: narrowing to char would map e.g. U+3061 onto 'a'
	// and make non-ASCII text pass the range checks.
	return result.size() == 32 && std::all_of(result.begin(), result.end(), [](wchar_t ch)
	{
		return (ch >= L'0' && ch <= L'9') || (ch >= L'a' && ch <= L'z');
	});
}
|
|
|
|
std::pair<bool, std::wstring> Translate(const std::wstring& text, SentenceInfo)
|
|
{
|
|
if (!apiKey->empty())
|
|
if (HttpRequest httpRequest{
|
|
L"Mozilla/5.0 Textractor",
|
|
L"translation.googleapis.com",
|
|
L"POST",
|
|
FormatString(L"/language/translate/v2?format=text&target=%s&key=%s", translateTo.Copy(), apiKey.Copy()).c_str(),
|
|
FormatString(R"({"q":["%s"]})", JSON::Escape(text))
|
|
})
|
|
{
|
|
// Response formatted as JSON: starts with "translatedText": " and translation is enclosed in quotes followed by a comma
|
|
if (std::wsmatch results; std::regex_search(httpRequest.response, results, std::wregex(L"\"translatedText\": \"(.+?)\","))) return { true, results[1] };
|
|
return { false, FormatString(L"%s: %s", TRANSLATION_ERROR, httpRequest.response) };
|
|
}
|
|
else return { false, FormatString(L"%s (code=%u)", TRANSLATION_ERROR, httpRequest.errorCode) };
|
|
|
|
if (!TKK)
|
|
if (HttpRequest httpRequest{ L"Mozilla/5.0 Textractor", L"translate.google.com", L"GET", L"/" })
|
|
if (std::wsmatch results; std::regex_search(httpRequest.response, results, std::wregex(L"(\\d{7,})'")))
|
|
_InterlockedCompareExchange(&TKK, stoll(results[1]), 0);
|
|
|
|
if (HttpRequest httpRequest{ L"Mozilla/5.0 Textractor", L"translate.googleapis.com", L"GET", GetTranslationUri(text).c_str() })
|
|
{
|
|
// Response formatted as JSON: starts with "[[[" and translation is enclosed in quotes followed by a comma
|
|
if (httpRequest.response[0] == L'[')
|
|
{
|
|
std::wstring translation;
|
|
for (std::wsmatch results; std::regex_search(httpRequest.response, results, std::wregex(L"\\[\"(.*?)\",[n\"]")); httpRequest.response = results.suffix())
|
|
if (!IsHash(results[1])) translation += std::wstring(results[1]) + L" ";
|
|
if (!translation.empty()) return { true, translation };
|
|
}
|
|
return { false, FormatString(L"%s (TKK=%u): %s", TRANSLATION_ERROR, _InterlockedExchange(&TKK, 0), httpRequest.response) };
|
|
}
|
|
else return { false, FormatString(L"%s (code=%u)", TRANSLATION_ERROR, httpRequest.errorCode) };
|
|
}
|