2024-04-02 15:36:52 +08:00
|
|
|
|
#include "pch.h"
|
|
|
|
|
#include "define.h"
|
|
|
|
|
#include <windows.h>
|
2024-01-08 23:37:00 +08:00
|
|
|
|
#include <winrt/Windows.Foundation.h>
|
|
|
|
|
#include <winrt/Windows.Storage.Pickers.h>
|
|
|
|
|
#include <winrt/Windows.Storage.Streams.h>
|
|
|
|
|
#include <winrt/Windows.Graphics.Imaging.h>
|
|
|
|
|
#include <winrt/Windows.Media.FaceAnalysis.h>
|
|
|
|
|
#include <winrt/Windows.Media.Ocr.h>
|
|
|
|
|
|
|
|
|
|
#include <winrt/Windows.Foundation.Collections.h>
|
|
|
|
|
#include <winrt/Windows.Devices.Enumeration.h>
|
|
|
|
|
#include <winrt/Windows.Media.Devices.h>
|
|
|
|
|
|
|
|
|
|
#include <winrt/Windows.Security.Cryptography.h>
|
|
|
|
|
#include <winrt/Windows.Globalization.h>
|
|
|
|
|
#include <iostream>
|
|
|
|
|
#include <fstream>
|
2024-04-02 15:36:52 +08:00
|
|
|
|
#include <vector>
|
2024-01-08 23:37:00 +08:00
|
|
|
|
using namespace winrt;
|
|
|
|
|
|
|
|
|
|
using namespace Windows::Foundation;
|
|
|
|
|
using namespace Windows::Storage;
|
|
|
|
|
using namespace Windows::Storage::Streams;
|
|
|
|
|
using namespace Windows::Graphics::Imaging;
|
|
|
|
|
using namespace Windows::Media::Ocr;
|
|
|
|
|
|
|
|
|
|
using namespace Windows::Devices::Enumeration;
|
|
|
|
|
using namespace Windows::Media::Devices;
|
|
|
|
|
|
|
|
|
|
using namespace Windows::Security::Cryptography;
|
|
|
|
|
using namespace Windows::Globalization;
|
|
|
|
|
using namespace Windows::Foundation::Collections;
|
2024-04-02 15:36:52 +08:00
|
|
|
|
bool check_language_valid(wchar_t *language)
|
|
|
|
|
{
|
2024-01-08 23:37:00 +08:00
|
|
|
|
OcrEngine ocrEngine = OcrEngine::TryCreateFromUserProfileLanguages();
|
|
|
|
|
std::wstring l = language;
|
2024-04-02 15:36:52 +08:00
|
|
|
|
try
|
|
|
|
|
{
|
2024-01-08 23:37:00 +08:00
|
|
|
|
Language language1(l);
|
|
|
|
|
return ocrEngine.IsLanguageSupported(language1);
|
|
|
|
|
}
|
2024-04-02 15:36:52 +08:00
|
|
|
|
catch (...)
|
|
|
|
|
{
|
2024-01-08 23:37:00 +08:00
|
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
}
|
2024-04-02 15:36:52 +08:00
|
|
|
|
wchar_t **getlanguagelist(int *num)
|
|
|
|
|
{
|
2024-01-08 23:37:00 +08:00
|
|
|
|
OcrEngine ocrEngine = OcrEngine::TryCreateFromUserProfileLanguages();
|
|
|
|
|
auto languages = ocrEngine.AvailableRecognizerLanguages();
|
2024-04-02 15:36:52 +08:00
|
|
|
|
auto ret = new wchar_t *[languages.Size()];
|
2024-01-08 23:37:00 +08:00
|
|
|
|
int i = 0;
|
2024-04-02 15:36:52 +08:00
|
|
|
|
for (auto &&language : languages)
|
2024-01-08 23:37:00 +08:00
|
|
|
|
{
|
2024-04-02 15:36:52 +08:00
|
|
|
|
// std::wcout << language.LanguageTag().c_str() << L" " << language.DisplayName().c_str() << L" " << language.AbbreviatedName().c_str() << L'\n';
|
|
|
|
|
// zh-Hans-CN <20><><EFBFBD><EFBFBD>(<28><><EFBFBD>壬<EFBFBD>й<EFBFBD>) <20><><EFBFBD><EFBFBD>
|
|
|
|
|
// ja <20><><EFBFBD><EFBFBD>
|
2024-01-08 23:37:00 +08:00
|
|
|
|
auto lang = language.LanguageTag();
|
|
|
|
|
size_t len = lang.size() + 1;
|
|
|
|
|
ret[i] = new wchar_t[len];
|
|
|
|
|
wcscpy_s(ret[i], len, lang.c_str());
|
|
|
|
|
i += 1;
|
|
|
|
|
}
|
|
|
|
|
*num = languages.Size();
|
|
|
|
|
return ret;
|
|
|
|
|
}
|
2024-04-02 15:36:52 +08:00
|
|
|
|
ocrres OCR(wchar_t *fname, wchar_t *lang, wchar_t *space, int *num)
|
2024-01-08 23:37:00 +08:00
|
|
|
|
{
|
2024-04-02 15:36:52 +08:00
|
|
|
|
// ָ<><D6B8>Ҫʶ<D2AA><CAB6><EFBFBD>ͼ<EFBFBD><CDBC><EFBFBD>ļ<EFBFBD>·<EFBFBD><C2B7>
|
2024-01-08 23:37:00 +08:00
|
|
|
|
std::wstring imagePath = fname;
|
|
|
|
|
|
2024-04-02 15:36:52 +08:00
|
|
|
|
// <20><>ͼ<EFBFBD><CDBC><EFBFBD>ļ<EFBFBD>
|
2024-01-08 23:37:00 +08:00
|
|
|
|
StorageFile imageFile = StorageFile::GetFileFromPathAsync(imagePath).get();
|
|
|
|
|
IRandomAccessStream imageStream = imageFile.OpenAsync(FileAccessMode::Read).get();
|
2024-04-02 15:36:52 +08:00
|
|
|
|
// <20><><EFBFBD><EFBFBD> BitmapDecoder <20><><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>ͼ<EFBFBD><CDBC>
|
2024-01-08 23:37:00 +08:00
|
|
|
|
BitmapDecoder decoder = BitmapDecoder::CreateAsync(imageStream).get();
|
|
|
|
|
|
2024-04-02 15:36:52 +08:00
|
|
|
|
// <20>ӽ<EFBFBD><D3BD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>л<EFBFBD>ȡλͼ<CEBB><CDBC><EFBFBD><EFBFBD>
|
2024-01-08 23:37:00 +08:00
|
|
|
|
SoftwareBitmap softwareBitmap = decoder.GetSoftwareBitmapAsync().get();
|
|
|
|
|
std::wstring l = lang;
|
|
|
|
|
Language language(l);
|
2024-04-02 15:36:52 +08:00
|
|
|
|
// <20><><EFBFBD><EFBFBD> OcrEngine <20><><EFBFBD><EFBFBD>
|
2024-01-08 23:37:00 +08:00
|
|
|
|
OcrEngine ocrEngine = OcrEngine::TryCreateFromLanguage(language);
|
2024-04-02 15:36:52 +08:00
|
|
|
|
// <20><><EFBFBD><EFBFBD> OcrResult <20><><EFBFBD><EFBFBD><F3B2A2BD><EFBFBD>ʶ<EFBFBD><CAB6>
|
2024-01-08 23:37:00 +08:00
|
|
|
|
OcrResult ocrResult = ocrEngine.RecognizeAsync(softwareBitmap).get();
|
2024-04-02 15:36:52 +08:00
|
|
|
|
// <20><><EFBFBD>ʶ<EFBFBD><CAB6><EFBFBD><EFBFBD>
|
|
|
|
|
auto res = ocrResult.Lines();
|
|
|
|
|
std::vector<std::wstring> rets;
|
|
|
|
|
std::vector<int> xs, ys, xs2, ys2;
|
2024-01-08 23:37:00 +08:00
|
|
|
|
int i = 0;
|
2024-04-02 15:36:52 +08:00
|
|
|
|
std::wstring sspace = space; // Ĭ<>ϼ<EFBFBD>ʹ<EFBFBD><CAB9><EFBFBD><EFBFBD>Ҳ<EFBFBD>пո<D0BF>
|
2024-01-08 23:37:00 +08:00
|
|
|
|
for (auto line : res)
|
|
|
|
|
{
|
|
|
|
|
|
|
|
|
|
std::wstring xx = L"";
|
|
|
|
|
bool start = true;
|
2024-04-02 15:36:52 +08:00
|
|
|
|
unsigned int x1 = -1, x2 = 0, y1 = -1, y2 = 0;
|
|
|
|
|
|
|
|
|
|
for (auto word : line.Words())
|
|
|
|
|
{
|
|
|
|
|
if (!start)
|
|
|
|
|
xx += sspace;
|
2024-01-08 23:37:00 +08:00
|
|
|
|
start = false;
|
|
|
|
|
xx += word.Text();
|
2024-04-02 15:36:52 +08:00
|
|
|
|
auto &rect = word.BoundingRect();
|
|
|
|
|
x1 = min(rect.X, x1);
|
|
|
|
|
x2 = max(x2, rect.X + rect.Width);
|
|
|
|
|
y1 = min(rect.Y, y1);
|
|
|
|
|
y2 = max(y2, rect.Y + rect.Height);
|
2024-01-08 23:37:00 +08:00
|
|
|
|
}
|
|
|
|
|
ys.push_back(y1);
|
|
|
|
|
xs.push_back(x1);
|
|
|
|
|
xs2.push_back(x2);
|
|
|
|
|
ys2.push_back(y2);
|
2024-04-02 15:36:52 +08:00
|
|
|
|
rets.emplace_back(xx);
|
2024-01-08 23:37:00 +08:00
|
|
|
|
i += 1;
|
|
|
|
|
}
|
|
|
|
|
*num = res.Size();
|
2024-04-02 15:36:52 +08:00
|
|
|
|
return ocrres{vecwstr2c(rets), vecint2c(xs), vecint2c(ys), vecint2c(xs2), vecint2c(ys2)};
|
2024-01-08 23:37:00 +08:00
|
|
|
|
}
|