117 lines
3.9 KiB
C++
Raw Normal View History

2024-04-02 15:36:52 +08:00
#include "define.h"
2024-01-08 23:37:00 +08:00
#include <winrt/Windows.Foundation.h>
#include <winrt/Windows.Storage.Pickers.h>
#include <winrt/Windows.Storage.Streams.h>
#include <winrt/Windows.Graphics.Imaging.h>
#include <winrt/Windows.Media.FaceAnalysis.h>
#include <winrt/Windows.Media.Ocr.h>
#include <winrt/Windows.Foundation.Collections.h>
#include <winrt/Windows.Devices.Enumeration.h>
#include <winrt/Windows.Media.Devices.h>
#include <winrt/Windows.Security.Cryptography.h>
#include <winrt/Windows.Globalization.h>
using namespace winrt;
using namespace Windows::Foundation;
using namespace Windows::Storage;
using namespace Windows::Storage::Streams;
using namespace Windows::Graphics::Imaging;
using namespace Windows::Media::Ocr;
using namespace Windows::Devices::Enumeration;
using namespace Windows::Media::Devices;
using namespace Windows::Security::Cryptography;
using namespace Windows::Globalization;
using namespace Windows::Foundation::Collections;
2024-04-02 15:36:52 +08:00
bool check_language_valid(wchar_t *language)
{
2024-01-08 23:37:00 +08:00
OcrEngine ocrEngine = OcrEngine::TryCreateFromUserProfileLanguages();
std::wstring l = language;
2024-04-02 15:36:52 +08:00
try
{
2024-01-08 23:37:00 +08:00
Language language1(l);
return ocrEngine.IsLanguageSupported(language1);
}
2024-04-02 15:36:52 +08:00
catch (...)
{
2024-01-08 23:37:00 +08:00
return false;
}
}
2024-04-02 15:36:52 +08:00
wchar_t **getlanguagelist(int *num)
{
2024-01-08 23:37:00 +08:00
OcrEngine ocrEngine = OcrEngine::TryCreateFromUserProfileLanguages();
auto languages = ocrEngine.AvailableRecognizerLanguages();
2024-04-02 15:36:52 +08:00
auto ret = new wchar_t *[languages.Size()];
2024-01-08 23:37:00 +08:00
int i = 0;
2024-04-02 15:36:52 +08:00
for (auto &&language : languages)
2024-01-08 23:37:00 +08:00
{
2024-04-02 15:36:52 +08:00
// std::wcout << language.LanguageTag().c_str() << L" " << language.DisplayName().c_str() << L" " << language.AbbreviatedName().c_str() << L'\n';
// zh-Hans-CN <20><><EFBFBD><EFBFBD>(<28><><EFBFBD><EFBFBD>й<EFBFBD>) <20><><EFBFBD><EFBFBD>
// ja <20><><EFBFBD><EFBFBD>
2024-01-08 23:37:00 +08:00
auto lang = language.LanguageTag();
size_t len = lang.size() + 1;
ret[i] = new wchar_t[len];
wcscpy_s(ret[i], len, lang.c_str());
i += 1;
}
*num = languages.Size();
return ret;
}
2024-04-02 15:36:52 +08:00
ocrres OCR(wchar_t *fname, wchar_t *lang, wchar_t *space, int *num)
2024-01-08 23:37:00 +08:00
{
2024-04-02 15:36:52 +08:00
// ָ<><D6B8>Ҫʶ<D2AA><CAB6><EFBFBD>ͼ<EFBFBD><CDBC><EFBFBD>ļ<EFBFBD>·<EFBFBD><C2B7>
2024-01-08 23:37:00 +08:00
std::wstring imagePath = fname;
2024-04-02 15:36:52 +08:00
// <20><>ͼ<EFBFBD><CDBC><EFBFBD>ļ<EFBFBD>
2024-01-08 23:37:00 +08:00
StorageFile imageFile = StorageFile::GetFileFromPathAsync(imagePath).get();
IRandomAccessStream imageStream = imageFile.OpenAsync(FileAccessMode::Read).get();
2024-04-02 15:36:52 +08:00
// <20><><EFBFBD><EFBFBD> BitmapDecoder <20><><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>ͼ<EFBFBD><CDBC>
2024-01-08 23:37:00 +08:00
BitmapDecoder decoder = BitmapDecoder::CreateAsync(imageStream).get();
2024-04-02 15:36:52 +08:00
// <20>ӽ<EFBFBD><D3BD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>л<EFBFBD>ȡλͼ<CEBB><CDBC><EFBFBD><EFBFBD>
2024-01-08 23:37:00 +08:00
SoftwareBitmap softwareBitmap = decoder.GetSoftwareBitmapAsync().get();
std::wstring l = lang;
Language language(l);
2024-04-02 15:36:52 +08:00
// <20><><EFBFBD><EFBFBD> OcrEngine <20><><EFBFBD><EFBFBD>
2024-01-08 23:37:00 +08:00
OcrEngine ocrEngine = OcrEngine::TryCreateFromLanguage(language);
2024-04-02 15:36:52 +08:00
// <20><><EFBFBD><EFBFBD> OcrResult <20><><EFBFBD>󲢽<EFBFBD><F3B2A2BD><EFBFBD>ʶ<EFBFBD><CAB6>
2024-01-08 23:37:00 +08:00
OcrResult ocrResult = ocrEngine.RecognizeAsync(softwareBitmap).get();
2024-04-02 15:36:52 +08:00
// <20><><EFBFBD>ʶ<EFBFBD><CAB6><EFBFBD><EFBFBD>
auto res = ocrResult.Lines();
std::vector<std::wstring> rets;
std::vector<int> xs, ys, xs2, ys2;
2024-01-08 23:37:00 +08:00
int i = 0;
2024-04-02 15:36:52 +08:00
std::wstring sspace = space; // Ĭ<>ϼ<EFBFBD>ʹ<EFBFBD><CAB9><EFBFBD><EFBFBD>Ҳ<EFBFBD>пո<D0BF>
2024-01-08 23:37:00 +08:00
for (auto line : res)
{
std::wstring xx = L"";
bool start = true;
2024-04-02 15:36:52 +08:00
unsigned int x1 = -1, x2 = 0, y1 = -1, y2 = 0;
for (auto word : line.Words())
{
if (!start)
xx += sspace;
2024-01-08 23:37:00 +08:00
start = false;
xx += word.Text();
2024-04-02 15:36:52 +08:00
auto &rect = word.BoundingRect();
x1 = min(rect.X, x1);
x2 = max(x2, rect.X + rect.Width);
y1 = min(rect.Y, y1);
y2 = max(y2, rect.Y + rect.Height);
2024-01-08 23:37:00 +08:00
}
ys.push_back(y1);
xs.push_back(x1);
xs2.push_back(x2);
ys2.push_back(y2);
2024-04-02 15:36:52 +08:00
rets.emplace_back(xx);
2024-01-08 23:37:00 +08:00
i += 1;
}
*num = res.Size();
2024-04-02 15:36:52 +08:00
return ocrres{vecwstr2c(rets), vecint2c(xs), vecint2c(ys), vecint2c(xs2), vecint2c(ys2)};
2024-01-08 23:37:00 +08:00
}