/dports/graphics/tesseract/tesseract-5.0.0/ |
H A D | README.md | 3 …d Status](https://travis-ci.org/tesseract-ocr/tesseract.svg?branch=master)](https://travis-ci.org/… 5 ![Build status](https://github.com/tesseract-ocr/tesseract/workflows/sw/badge.svg)<br> 7 …lds.io/lgtm/grade/cpp/g/tesseract-ocr/tesseract.svg?logo=lgtm&logoWidth=18)](https://lgtm.com/proj… 8 …hields.io/lgtm/alerts/g/tesseract-ocr/tesseract.svg?logo=lgtm&logoWidth=18)](https://lgtm.com/proj… 17 * [Tesseract OCR](#tesseract-ocr) 65 Open issues can be found in [issue tracker](https://github.com/tesseract-ocr/tesseract/issues), 90 …pers can use `libtesseract` [C](https://github.com/tesseract-ocr/tesseract/blob/main/include/tesse… 91 [C++](https://github.com/tesseract-ocr/tesseract/blob/main/include/tesseract/baseapi.h) API to buil… 106 * [tesseract-ocr](https://groups.google.com/g/tesseract-ocr) - For tesseract users. 107 * [tesseract-dev](https://groups.google.com/g/tesseract-dev) - For tesseract developers. [all …]
|
/dports/graphics/tesseract/tesseract-5.0.0/src/training/common/ |
H A D | commontraining.h | 29 namespace tesseract { 58 namespace tesseract { 96 tesseract::CLASS_TYPE Class; 139 void FreeTrainingSamples(tesseract::LIST CharList); 148 tesseract::CLUSTERER *SetUpForClustering(const tesseract::FEATURE_DEFS_STRUCT &FeatureDefs, 152 tesseract::LIST RemoveInsignificantProtos(tesseract::LIST ProtoList, bool KeepSigProtos, 156 void CleanUpUnusedData(tesseract::LIST ProtoList); 160 tesseract::CLUSTERER *Clusterer, tesseract::CLUSTERCONFIG *Config); 166 tesseract::CLASS_STRUCT *SetUpForFloat2Int(const tesseract::UNICHARSET &unicharset, 172 void FreeNormProtoList(tesseract::LIST CharList); [all …]
|
/dports/graphics/tesseract/tesseract-5.0.0/src/training/ |
H A D | classifier_tester.cpp | 28 using namespace tesseract; 55 *api = new tesseract::TessBaseAPI; in InitializeClassifier() 56 tesseract::OcrEngineMode engine_mode = tesseract::OEM_TESSERACT_ONLY; in InitializeClassifier() 57 tesseract::Tesseract *tesseract = nullptr; in InitializeClassifier() local 58 tesseract::Classify *classify = nullptr; in InitializeClassifier() 64 tesseract = const_cast<tesseract::Tesseract *>((*api)->tesseract()); in InitializeClassifier() 65 classify = static_cast<tesseract::Classify *>(tesseract); in InitializeClassifier() 71 tesseract::ShapeClassifier *shape_classifier = nullptr; in InitializeClassifier() 102 tesseract::CheckSharedLibraryVersion(); in main() 106 tesseract::TessBaseAPI *api; in main() [all …]
|
H A D | mergenf.h | 56 float CompareProtos(tesseract::PROTO_STRUCT *p1, tesseract::PROTO_STRUCT *p2); 58 void ComputeMergedProto(tesseract::PROTO_STRUCT *p1, tesseract::PROTO_STRUCT *p2, float w1, float w… 59 tesseract::PROTO_STRUCT *MergedProto); 61 int FindClosestExistingProto(tesseract::CLASS_TYPE Class, int NumMerged[], 62 tesseract::PROTOTYPE *Prototype); 64 void MakeNewFromOld(tesseract::PROTO_STRUCT *New, tesseract::PROTOTYPE *Old); 66 float SubfeatureEvidence(tesseract::FEATURE Feature, tesseract::PROTO_STRUCT *Proto); 70 bool DummyFastMatch(tesseract::FEATURE Feature, tesseract::PROTO_STRUCT *Proto); 72 void ComputePaddedBoundingBox(tesseract::PROTO_STRUCT *Proto, float TangentPad, float OrthogonalPad,
|
H A D | wordlist2dawg.cpp | 31 using namespace tesseract; 34 tesseract::CheckSharedLibraryVersion(); in main() 37 printf("%s\n", tesseract::TessBaseAPI::Version()); in main() 48 tesseract::Classify classify; in main() 53 tesseract::Trie::RTLReversePolicy reverse_policy = tesseract::Trie::RRP_DO_NO_REVERSE; in main() 58 reverse_policy = static_cast<tesseract::Trie::RTLReversePolicy>(tmp_int); in main() 71 tesseract::Trie trie( in main() 73 tesseract::DAWG_TYPE_WORD, "", SYSTEM_DAWG_PERM, unicharset.size(), in main() 81 std::unique_ptr<tesseract::SquishedDawg> dawg(trie.trie_to_dawg()); in main() 90 tesseract::SquishedDawg words(dawg_filename, in main() [all …]
|
H A D | combine_lang_model.cpp | 25 using namespace tesseract; 50 tesseract::CheckSharedLibraryVersion(); in main() 51 tesseract::ParseCommandLineFlags(argv[0], &argc, &argv, true); in main() 54 std::vector<std::string> words = split(tesseract::ReadFile(FLAGS_words.c_str()), '\n'); in main() 55 std::vector<std::string> puncs = split(tesseract::ReadFile(FLAGS_puncs.c_str()), '\n'); in main() 56 std::vector<std::string> numbers = split(tesseract::ReadFile(FLAGS_numbers.c_str()), '\n'); in main() 68 tesseract::SetupBasicProperties(/*report_errors*/ true, in main() 71 tesseract::SetScriptProperties(FLAGS_script_dir.c_str(), &unicharset); in main() 73 return tesseract::CombineLangModel(unicharset, FLAGS_script_dir.c_str(), in main()
|
H A D | ambiguous_words.cpp | 31 tesseract::CheckSharedLibraryVersion(); in main() 35 printf("%s\n", tesseract::TessBaseAPI::Version()); in main() 57 tesseract::TessBaseAPI api; in main() 62 api.Init(tessdata_dir, lang.c_str(), tesseract::OEM_TESSERACT_ONLY, nullptr, 0, &vars_vec, in main() 64 tesseract::Dict &dict = api.tesseract()->getDict(); in main() 67 tesseract::tprintf("Failed to open input wordlist file %s\n", input_file_str); in main() 75 tesseract::chomp_string(str); // remove newline in main() 76 tesseract::WERD_CHOICE word(str, dict.getUnicharset()); in main()
|
H A D | combine_tessdata.cpp | 27 using namespace tesseract; 44 tesseract::TFile fp; in list_network() 45 if (tm.GetComponent(tesseract::TESSDATA_LSTM, &fp)) { in list_network() 46 tesseract::LSTMRecognizer recognizer; in list_network() 118 tesseract::CheckSharedLibraryVersion(); in main() 121 tesseract::TessdataManager tm; in main() 123 printf("%s\n", tesseract::TessBaseAPI::Version()); in main() 170 filename += tesseract::kTessdataFileSuffixes[i]; in main() 202 tesseract::TFile fp; in main() 203 if (!tm.GetComponent(tesseract::TESSDATA_LSTM, &fp)) { in main() [all …]
|
H A D | dawg2wordlist.cpp | 26 using namespace tesseract; 28 static std::unique_ptr<tesseract::Dawg> LoadSquishedDawg(const UNICHARSET &unicharset, const char *… in LoadSquishedDawg() 30 tesseract::TFile dawg_file; in LoadSquishedDawg() 36 auto retval = std::make_unique<tesseract::SquishedDawg>(tesseract::DAWG_TYPE_WORD, "eng", in LoadSquishedDawg() 58 static int WriteDawgAsWordlist(const UNICHARSET &unicharset, const tesseract::Dawg *dawg, in WriteDawgAsWordlist() 72 tesseract::CheckSharedLibraryVersion(); in main() 75 printf("%s\n", tesseract::TessBaseAPI::Version()); in main()
|
/dports/graphics/tesseract/tesseract-5.0.0/.github/workflows/ |
H A D | vcpkg.yml | 45 D:\a\tesseract\tesseract\build\bin\Release\tesseract.exe --version 85 D:\a\tesseract\tesseract\test\Release\basicapitest.exe 89 …D:\a\tesseract\tesseract\build\bin\Release\tesseract.exe test\testing\phototest.tif - --oem 1 --… 90 …D:\a\tesseract\tesseract\build\bin\Release\tesseract.exe test\testing\raaj.tif - -l hin --oem 1 … 91 …D:\a\tesseract\tesseract\build\bin\Release\tesseract.exe test\testing\viet.tif - -l vie --oem 1 … 92 …D:\a\tesseract\tesseract\build\bin\Release\tesseract.exe test\testing\hebrew.png - -l heb --oem 1… 93 …D:\a\tesseract\tesseract\build\bin\Release\tesseract.exe test\testing\eurotext.tif - -l fra --oem… 94 …D:\a\tesseract\tesseract\build\bin\Release\tesseract.exe test\testing\arabic.tif - -l ara --oem 1… 98 … D:\a\tesseract\tesseract\build\bin\Release\tesseract.exe --list-langs --tessdata-dir ..\tessdata 99 …D:\a\tesseract\tesseract\build\bin\Release\tesseract.exe --list-langs --tessdata-dir ..\tessdata_… [all …]
|
H A D | autotools-macos.yml | 2 # autotools build of tesseract and training tools on macos homebrew and macports. 69 - name: Display Version for tesseract, lstmtraining, text2image 71 tesseract -v 78 tesseract --list-langs --tessdata-dir ../tessdata 79 tesseract --list-langs --tessdata-dir ../tessdata_best 80 tesseract --list-langs --tessdata-dir ../tessdata_fast 166 - name: Display Version for tesseract, lstmtraining, text2image 168 tesseract -v 175 tesseract --list-langs --tessdata-dir ../tessdata 176 tesseract --list-langs --tessdata-dir ../tessdata_best [all …]
|
/dports/www/mattermost-server/mattermost-server-6.0.2/vendor/github.com/otiai10/gosseract/v2/ |
H A D | tessbridge.cpp | 14 tesseract::TessBaseAPI* api = new tesseract::TessBaseAPI(); in Create() 19 tesseract::TessBaseAPI* api = (tesseract::TessBaseAPI*)a; in Free() 27 tesseract::TessBaseAPI* api = (tesseract::TessBaseAPI*)a; in Clear() 34 tesseract::TessBaseAPI* api = (tesseract::TessBaseAPI*)a; in ClearPersistentCache() 39 tesseract::TessBaseAPI* api = (tesseract::TessBaseAPI*)a; in Init() 44 tesseract::TessBaseAPI* api = (tesseract::TessBaseAPI*)a; in Init() 74 tesseract::TessBaseAPI* api = (tesseract::TessBaseAPI*)a; in SetVariable() 79 tesseract::TessBaseAPI* api = (tesseract::TessBaseAPI*)a; in SetPixImage() 88 tesseract::TessBaseAPI* api = (tesseract::TessBaseAPI*)a; in SetPageSegMode() 89 tesseract::PageSegMode mode = (tesseract::PageSegMode)m; in SetPageSegMode() [all …]
|
/dports/graphics/mupdf/mupdf-1.18.0-source/ |
H A D | Makethird | 628 -Iscripts/tesseract \ 805 THIRD_CFLAGS += -Ithirdparty/tesseract/include -Iscripts/tesseract 831 -Iscripts/tesseract \ 856 $(OUT)/thirdparty/tesseract/src/api/%.o: thirdparty/tesseract/src/api/%.cpp 859 $(OUT)/thirdparty/tesseract/src/arch/%.o: thirdparty/tesseract/src/arch/%.cpp 862 $(OUT)/thirdparty/tesseract/src/ccmain/%.o: thirdparty/tesseract/src/ccmain/%.cpp 868 $(OUT)/thirdparty/tesseract/src/ccutil/%.o: thirdparty/tesseract/src/ccutil/%.cpp 874 $(OUT)/thirdparty/tesseract/src/dict/%.o: thirdparty/tesseract/src/dict/%.cpp 877 $(OUT)/thirdparty/tesseract/src/lstm/%.o: thirdparty/tesseract/src/lstm/%.cpp 883 $(OUT)/thirdparty/tesseract/src/viewer/%.o: thirdparty/tesseract/src/viewer/%.cpp [all …]
|
/dports/graphics/tesseract/tesseract-5.0.0/unittest/ |
H A D | resultiterator_test.cc | 11 namespace tesseract { namespace 40 api_.SetPageSegMode(tesseract::PSM_AUTO); in SetImage() 64 im_level = tesseract::RIL_BLOCK; in VerifyRebuild() 116 if ((level == tesseract::RIL_WORD || level == tesseract::RIL_SYMBOL) && in VerifyIteratorText() 138 if (maxlevel == tesseract::RIL_SYMBOL) { in VerifyRebuilds() 212 tesseract::TessBaseAPI api_; 343 } while (r_it->Next(tesseract::RIL_WORD)); in TEST_F() 407 while (s_it.Next(tesseract::RIL_SYMBOL) && !s_it.IsAtBeginningOf(tesseract::RIL_WORD)) { in TEST_F() 417 } while (r_it->Next(tesseract::RIL_WORD)); in TEST_F() 560 } while (!s_it.IsAtFinalElement(tesseract::RIL_WORD, tesseract::RIL_SYMBOL) && in TEST_F() [all …]
|
H A D | pagesegmode_test.cc | 25 namespace tesseract { namespace 52 api_.Init(TESSDATA_DIR, "eng", tesseract::OEM_TESSERACT_ONLY); in SetImage() 82 tesseract::TessBaseAPI api_; 95 VerifyRectText(tesseract::PSM_SINGLE_WORD, "183", 1419, 264, 69, 34); in TEST_F() 96 VerifyRectText(tesseract::PSM_SINGLE_WORD, "183", 1411, 252, 78, 62); in TEST_F() 97 VerifyRectText(tesseract::PSM_SINGLE_WORD, "183", 1396, 218, 114, 102); in TEST_F() 99 VerifyRectText(tesseract::PSM_SINGLE_LINE, "What should", 237, 393, 256, 36); in TEST_F() 105 VerifyRectText(tesseract::PSM_SINGLE_WORD, "Whatshould", 237, 393, 256, 36); in TEST_F() 108 VerifyRectText(tesseract::PSM_SINGLE_BLOCK, "both the\nfrom the", 237, 450, 172, 94); in TEST_F() 110 NotRectText(tesseract::PSM_SINGLE_LINE, "both the\nfrom the", 237, 450, 172, 94); in TEST_F() [all …]
|
H A D | baseapi_test.cc | 29 namespace tesseract { namespace 67 static tesseract::TessBaseAPI api; in TEST_F() 73 tesseract::TessBaseAPI api; in TEST_F() 94 tesseract::TessBaseAPI api; in TEST_F() 123 tesseract::TessBaseAPI api; in TEST_F() 142 tesseract::TessBaseAPI api; in TEST_F() 176 tesseract::TessBaseAPI api; in TEST_F() 212 tesseract::TessBaseAPI api; in TEST_F() 331 tesseract::TessBaseAPI tess; in TEST() 341 tesseract::TessBaseAPI tess1, tess2; in TEST() [all …]
|
H A D | layout_test.cc | 28 namespace tesseract { namespace 75 api_.SetPageSegMode(tesseract::PSM_AUTO); in SetImage() 90 char *block_text = it->GetUTF8Text(tesseract::RIL_BLOCK); in VerifyBlockTextOrder() 111 } while (it->Next(tesseract::RIL_BLOCK)); in VerifyBlockTextOrder() 144 } while (it->Next(tesseract::RIL_BLOCK)); in VerifyRoughBlockOrder() 179 } while (word_it.Next(tesseract::RIL_WORD) && in VerifyTotalContainment() 180 !word_it.IsAtBeginningOf(tesseract::RIL_BLOCK)); in VerifyTotalContainment() 182 } while (it->Next(tesseract::RIL_BLOCK)); in VerifyTotalContainment() 187 tesseract::TessBaseAPI api_; 206 tesseract::ResultIterator *it = api_.GetIterator(); in TEST_F() [all …]
|
H A D | mastertrainer_test.cc | 39 using namespace tesseract; 268 EXPECT_EQ(tesseract::CT_SIZE + 1, results.size()); in TEST_F() 269 int result_values[tesseract::CT_SIZE]; in TEST_F() 270 for (int i = 0; i < tesseract::CT_SIZE; ++i) { in TEST_F() 276 EXPECT_EQ(kNumCorrect, result_values[tesseract::CT_UNICHAR_TOP_OK]); in TEST_F() 277 EXPECT_EQ(1, result_values[tesseract::CT_FONT_ATTR_ERR]); in TEST_F() 278 EXPECT_EQ(kNumTopTopErrs, result_values[tesseract::CT_UNICHAR_TOPTOP_ERR]); in TEST_F() 279 EXPECT_EQ(kNumTop1Errs, result_values[tesseract::CT_UNICHAR_TOP1_ERR]); in TEST_F() 280 EXPECT_EQ(kNumTop2Errs, result_values[tesseract::CT_UNICHAR_TOP2_ERR]); in TEST_F() 281 EXPECT_EQ(kNumTopNErrs, result_values[tesseract::CT_UNICHAR_TOPN_ERR]); in TEST_F() [all …]
|
/dports/graphics/tesseract/tesseract-5.0.0/src/ |
H A D | tesseract.cpp | 99 using namespace tesseract; 354 static void FixPageSegMode(tesseract::TessBaseAPI &api, tesseract::PageSegMode pagesegmode) { in FixPageSegMode() 373 tesseract::PageSegMode *pagesegmode, tesseract::OcrEngineMode *enginemode) { in ParseArgs() 650 tesseract::PageSegMode pagesegmode = tesseract::PSM_AUTO; in main() 654 tesseract::OcrEngineMode enginemode = tesseract::OEM_DEFAULT; in main() 692 tesseract::Dict::GlobalDawgCache(); in main() 706 tesseract::SIMDDetect::Update(); in main() 754 tesseract::Orientation orientation; in main() 755 tesseract::WritingDirection direction; in main() 756 tesseract::TextlineOrder order; in main() [all …]
|
/dports/graphics/py-pyocr/pyocr-0.8/tests/ |
H A D | tests_tesseract.py | 12 from pyocr import tesseract 38 self.assertTrue(tesseract.is_available()) 47 tesseract.get_version() 133 tesseract.get_version() 146 tesseract.get_version() 232 tesseract.CharBoxBuilder, 838 builder = tesseract.CharBoxBuilder() 849 builder = tesseract.CharBoxBuilder() 855 builder = tesseract.CharBoxBuilder() 860 builder = tesseract.CharBoxBuilder() [all …]
|
/dports/graphics/tesseract/tesseract-5.0.0/src/ccmain/ |
H A D | paramsd.h | 29 namespace tesseract { 57 explicit ParamContent(tesseract::StringParam *it); 58 explicit ParamContent(tesseract::IntParam *it); 59 explicit ParamContent(tesseract::BoolParam *it); 60 explicit ParamContent(tesseract::DoubleParam *it); 84 tesseract::StringParam *sIt; 85 tesseract::IntParam *iIt; 86 tesseract::BoolParam *bIt; 87 tesseract::DoubleParam *dIt; 101 explicit ParamsEditor(tesseract::Tesseract *, ScrollView *sv = nullptr); in ELISTIZEH() [all …]
|
/dports/graphics/mupdf/mupdf-1.18.0-source/source/fitz/ |
H A D | tessocr.cpp | 147 tesseract::TessBaseAPI *api; 151 api = new tesseract::TessBaseAPI(); 166 tesseract::OcrEngineMode::OEM_DEFAULT, 183 tesseract::TessBaseAPI *api = (tesseract::TessBaseAPI *)api_; 256 tesseract::TessBaseAPI *api = (tesseract::TessBaseAPI *)api_; 299 while (!res_it->Empty(tesseract::RIL_BLOCK)) 301 if (res_it->Empty(tesseract::RIL_WORD)) 303 res_it->Next(tesseract::RIL_WORD); 307 res_it->BoundingBox(tesseract::RIL_TEXTLINE, 310 res_it->BoundingBox(tesseract::RIL_WORD, [all …]
|
/dports/textproc/py-ocrmypdf/ocrmypdf-12.7.2/tests/ |
H A D | test_tesseract.py | 17 from ocrmypdf._exec import tesseract 67 tesseract.get_languages() 74 monkeypatch.setattr(tesseract, 'run', dummy_run) 75 tesseract.generate_hocr( 94 monkeypatch.setattr(tesseract, 'run', dummy_run) 95 tesseract.generate_pdf( 113 tesseract.page_timedout(5) 135 tesseract.tesseract_log_output(in_) 143 with pytest.raises(tesseract.TesseractConfigError): 144 tesseract.tesseract_log_output(b'parameter not found: moo')
|
/dports/graphics/tesseract-data/tessdata-4.1.0/ |
H A D | README.md | 6 [tesseract-ocr/langdata](https://github.com/tesseract-ocr/langdata) on GitHub. 9 These have models for legacy tesseract engine (--oem 0) as well as the new LSTM neural net based en… 13 [tessdata_best](https://github.com/tesseract-ocr/tessdata_best) on GitHub. 16 [tessdata_fast](https://github.com/tesseract-ocr/tessdata_fast) on GitHub 20 The legacy tesseract models (--oem 0) have been removed for Indic and 27 [3.04 tree](https://github.com/tesseract-ocr/tessdata/tree/3.04.00). 30 [Tesseract wiki](https://github.com/tesseract-ocr/tesseract/wiki/Data-Files).
|
/dports/graphics/tesseract/tesseract-5.0.0/src/ccstruct/ |
H A D | ocrpara.h | 26 namespace tesseract { 120 ParagraphModel(tesseract::ParagraphJustification justification, int margin, int first_indent, in ELISTIZEH() 138 : justification_(tesseract::JUSTIFICATION_UNKNOWN) in ELISTIZEH() 166 tesseract::ParagraphJustification justification() const { in ELISTIZEH() 182 return (justification_ == tesseract::JUSTIFICATION_LEFT || in ELISTIZEH() 183 justification_ == tesseract::JUSTIFICATION_RIGHT) && in ELISTIZEH() 194 tesseract::ParagraphJustification justification_; in ELISTIZEH()
|