#include "define.h" #include #include #include #include #include #include #include #include #include #include #include using namespace winrt; using namespace Windows::Foundation; using namespace Windows::Storage; using namespace Windows::Storage::Streams; using namespace Windows::Graphics::Imaging; using namespace Windows::Media::Ocr; using namespace Windows::Devices::Enumeration; using namespace Windows::Media::Devices; using namespace Windows::Security::Cryptography; using namespace Windows::Globalization; using namespace Windows::Foundation::Collections; bool check_language_valid(wchar_t *language) { OcrEngine ocrEngine = OcrEngine::TryCreateFromUserProfileLanguages(); std::wstring l = language; try { Language language1(l); return ocrEngine.IsLanguageSupported(language1); } catch (...) { return false; } } wchar_t **getlanguagelist(int *num) { OcrEngine ocrEngine = OcrEngine::TryCreateFromUserProfileLanguages(); auto languages = ocrEngine.AvailableRecognizerLanguages(); auto ret = new wchar_t *[languages.Size()]; int i = 0; for (auto &&language : languages) { // std::wcout << language.LanguageTag().c_str() << L" " << language.DisplayName().c_str() << L" " << language.AbbreviatedName().c_str() << L'\n'; // zh-Hans-CN ����(���壬�й�) ���� // ja ���� auto lang = language.LanguageTag(); size_t len = lang.size() + 1; ret[i] = new wchar_t[len]; wcscpy_s(ret[i], len, lang.c_str()); i += 1; } *num = languages.Size(); return ret; } ocrres OCR(wchar_t *fname, wchar_t *lang, wchar_t *space, int *num) { // ָ��Ҫʶ���ͼ���ļ�·�� std::wstring imagePath = fname; // ��ͼ���ļ� StorageFile imageFile = StorageFile::GetFileFromPathAsync(imagePath).get(); IRandomAccessStream imageStream = imageFile.OpenAsync(FileAccessMode::Read).get(); // ���� BitmapDecoder �������ͼ�� BitmapDecoder decoder = BitmapDecoder::CreateAsync(imageStream).get(); // �ӽ������л�ȡλͼ���� SoftwareBitmap softwareBitmap = decoder.GetSoftwareBitmapAsync().get(); std::wstring l = lang; Language language(l); // ���� OcrEngine ���� OcrEngine ocrEngine = OcrEngine::TryCreateFromLanguage(language); // ���� OcrResult ���󲢽���ʶ�� OcrResult ocrResult = ocrEngine.RecognizeAsync(softwareBitmap).get(); // ���ʶ���� auto res = ocrResult.Lines(); std::vector rets; std::vector xs, ys, xs2, ys2; int i = 0; std::wstring sspace = space; // Ĭ�ϼ�ʹ����Ҳ�пո� for (auto line : res) { std::wstring xx = L""; bool start = true; unsigned int x1 = -1, x2 = 0, y1 = -1, y2 = 0; for (auto word : line.Words()) { if (!start) xx += sspace; start = false; xx += word.Text(); auto &rect = word.BoundingRect(); x1 = min(rect.X, x1); x2 = max(x2, rect.X + rect.Width); y1 = min(rect.Y, y1); y2 = max(y2, rect.Y + rect.Height); } ys.push_back(y1); xs.push_back(x1); xs2.push_back(x2); ys2.push_back(y2); rets.emplace_back(xx); i += 1; } *num = res.Size(); return ocrres{vecwstr2c(rets), vecint2c(xs), vecint2c(ys), vecint2c(xs2), vecint2c(ys2)}; }