107 lines
3.3 KiB
C++
Raw Normal View History

2024-04-02 15:36:52 +08:00
#include "define.h"
2024-01-08 23:37:00 +08:00
#include <winrt/Windows.Foundation.h>
#include <winrt/Windows.Storage.Pickers.h>
#include <winrt/Windows.Storage.Streams.h>
#include <winrt/Windows.Graphics.Imaging.h>
#include <winrt/Windows.Media.FaceAnalysis.h>
#include <winrt/Windows.Media.Ocr.h>
#include <winrt/Windows.Foundation.Collections.h>
#include <winrt/Windows.Devices.Enumeration.h>
#include <winrt/Windows.Media.Devices.h>
#include <winrt/Windows.Security.Cryptography.h>
#include <winrt/Windows.Globalization.h>
using namespace winrt;
using namespace Windows::Foundation;
using namespace Windows::Storage;
using namespace Windows::Storage::Streams;
using namespace Windows::Graphics::Imaging;
using namespace Windows::Media::Ocr;
using namespace Windows::Devices::Enumeration;
using namespace Windows::Media::Devices;
using namespace Windows::Security::Cryptography;
using namespace Windows::Globalization;
using namespace Windows::Foundation::Collections;
2024-04-02 15:36:52 +08:00
bool check_language_valid(wchar_t *language)
{
2024-01-08 23:37:00 +08:00
OcrEngine ocrEngine = OcrEngine::TryCreateFromUserProfileLanguages();
std::wstring l = language;
2024-04-02 15:36:52 +08:00
try
{
2024-01-08 23:37:00 +08:00
Language language1(l);
return ocrEngine.IsLanguageSupported(language1);
}
2024-04-02 15:36:52 +08:00
catch (...)
{
2024-01-08 23:37:00 +08:00
return false;
}
}
2024-04-02 15:36:52 +08:00
wchar_t **getlanguagelist(int *num)
{
2024-01-08 23:37:00 +08:00
OcrEngine ocrEngine = OcrEngine::TryCreateFromUserProfileLanguages();
auto languages = ocrEngine.AvailableRecognizerLanguages();
2024-04-02 15:36:52 +08:00
auto ret = new wchar_t *[languages.Size()];
2024-01-08 23:37:00 +08:00
int i = 0;
2024-04-02 15:36:52 +08:00
for (auto &&language : languages)
2024-01-08 23:37:00 +08:00
{
auto lang = language.LanguageTag();
size_t len = lang.size() + 1;
ret[i] = new wchar_t[len];
wcscpy_s(ret[i], len, lang.c_str());
i += 1;
}
*num = languages.Size();
return ret;
}
2024-04-02 15:36:52 +08:00
ocrres OCR(wchar_t *fname, wchar_t *lang, wchar_t *space, int *num)
2024-01-08 23:37:00 +08:00
{
std::wstring imagePath = fname;
StorageFile imageFile = StorageFile::GetFileFromPathAsync(imagePath).get();
IRandomAccessStream imageStream = imageFile.OpenAsync(FileAccessMode::Read).get();
BitmapDecoder decoder = BitmapDecoder::CreateAsync(imageStream).get();
SoftwareBitmap softwareBitmap = decoder.GetSoftwareBitmapAsync().get();
std::wstring l = lang;
Language language(l);
OcrEngine ocrEngine = OcrEngine::TryCreateFromLanguage(language);
OcrResult ocrResult = ocrEngine.RecognizeAsync(softwareBitmap).get();
2024-04-02 15:36:52 +08:00
auto res = ocrResult.Lines();
std::vector<std::wstring> rets;
std::vector<int> xs, ys, xs2, ys2;
2024-01-08 23:37:00 +08:00
int i = 0;
2024-05-03 17:50:26 +08:00
std::wstring sspace = space;
2024-01-08 23:37:00 +08:00
for (auto line : res)
{
std::wstring xx = L"";
bool start = true;
2024-04-02 15:36:52 +08:00
unsigned int x1 = -1, x2 = 0, y1 = -1, y2 = 0;
for (auto word : line.Words())
{
if (!start)
xx += sspace;
2024-01-08 23:37:00 +08:00
start = false;
xx += word.Text();
2024-04-02 15:36:52 +08:00
auto &rect = word.BoundingRect();
x1 = min(rect.X, x1);
x2 = max(x2, rect.X + rect.Width);
y1 = min(rect.Y, y1);
y2 = max(y2, rect.Y + rect.Height);
2024-01-08 23:37:00 +08:00
}
ys.push_back(y1);
xs.push_back(x1);
xs2.push_back(x2);
ys2.push_back(y2);
2024-04-02 15:36:52 +08:00
rets.emplace_back(xx);
2024-01-08 23:37:00 +08:00
i += 1;
}
*num = res.Size();
2024-04-02 15:36:52 +08:00
return ocrres{vecwstr2c(rets), vecint2c(xs), vecint2c(ys), vecint2c(xs2), vecint2c(ys2)};
2024-01-08 23:37:00 +08:00
}