tesseract
5.0.0-alpha-619-ge9db
|
Typedefs | |
using | DictFunc = int(Dict::*)(void *, const UNICHARSET &, UNICHAR_ID, bool) const |
using | ProbabilityInContextFunc = double(Dict::*)(const char *, const char *, int, const char *, int) |
using | ParamsModelClassifyFunc = float(Dict::*)(const char *, void *) |
using | FillLatticeFunc = void(Wordrec::*)(const MATRIX &, const WERD_CHOICE_LIST &, const UNICHARSET &, BlamerBundle *) |
using | TruthCallback = std::function< void(const UNICHARSET &, int, PageIterator *, Pix *)> |
using | FileReader = bool(*)(const char *filename, GenericVector< char > *data) |
using | FileWriter = bool(*)(const GenericVector< char > &data, const char *filename) |
using | char32 = signed int |
using | DotProductFunction = double(*)(const double *, const double *, int) |
using | SetOfModels = GenericVectorEqEq< const ParagraphModel * > |
using | WordRecognizer = void(Tesseract::*)(const WordData &, WERD_RES **, PointerVector< WERD_RES > *) |
using | ParamsTrainingHypothesisList = GenericVector< ParamsTrainingHypothesis > |
using | UnicharIdVector = GenericVector< UNICHAR_ID > |
using | UnicharAmbigsVector = GenericVector< AmbigSpec_LIST * > |
using | IntKDPair = KDPairInc< int, int > |
using | RSMap = std::unordered_map< int, std::unique_ptr< std::vector< int > >> |
using | RSCounts = std::unordered_map< int, int > |
using | ShapeQueue = GenericHeap< ShapeQueueEntry > |
using | NodeChildVector = GenericVector< NodeChild > |
using | SuccessorList = GenericVector< int > |
using | SuccessorListsVector = GenericVector< SuccessorList * > |
using | DawgVector = GenericVector< Dawg * > |
using | RecodePair = KDPairInc< double, RecodeNode > |
using | RecodeHeap = GenericHeap< RecodePair > |
using | BlobGridSearch = GridSearch< BLOBNBOX, BLOBNBOX_CLIST, BLOBNBOX_C_IT > |
using | ColPartitionGridSearch = GridSearch< ColPartition, ColPartition_CLIST, ColPartition_C_IT > |
using | PartSetVector = GenericVector< ColPartitionSet * > |
using | WidthCallback = std::function< bool(int)> |
using | ColSegmentGrid = BBGrid< ColSegment, ColSegment_CLIST, ColSegment_C_IT > |
using | ColSegmentGridSearch = GridSearch< ColSegment, ColSegment_CLIST, ColSegment_C_IT > |
using | WordGrid = BBGrid< WordWithBox, WordWithBox_CLIST, WordWithBox_C_IT > |
using | WordSearch = GridSearch< WordWithBox, WordWithBox_CLIST, WordWithBox_C_IT > |
using | LigHash = std::unordered_map< std::string, std::string, StringHash > |
using | TestCallback = std::function< STRING(int, const double *, const TessdataManager &, int)> |
using | PainPointHeap = GenericHeap< MatrixCoordPair > |
using | LanguageModelFlagsType = unsigned char |
Used for expressing various language model flags. More... | |
Functions | |
STRING | HOcrEscape (const char *text) |
bool | LoadDataFromFile (const char *filename, GenericVector< char > *data) |
bool | SaveDataToFile (const GenericVector< char > &data, const char *filename) |
template<typename T > | |
bool | cmp_eq (T const &t1, T const &t2) |
template<typename T > | |
int | sort_cmp (const void *t1, const void *t2) |
template<typename T > | |
int | sort_ptr_cmp (const void *t1, const void *t2) |
bool | PSM_OSD_ENABLED (int pageseg_mode) |
bool | PSM_ORIENTATION_ENABLED (int pageseg_mode) |
bool | PSM_COL_FIND_ENABLED (int pageseg_mode) |
bool | PSM_SPARSE (int pageseg_mode) |
bool | PSM_BLOCK_FIND_ENABLED (int pageseg_mode) |
bool | PSM_LINE_FIND_ENABLED (int pageseg_mode) |
bool | PSM_WORD_FIND_ENABLED (int pageseg_mode) |
template<typename T , size_t N> | |
constexpr size_t | countof (T const (&)[N]) noexcept |
bool | DeSerialize (FILE *fp, char *data, size_t n=1) |
bool | DeSerialize (FILE *fp, float *data, size_t n=1) |
bool | DeSerialize (FILE *fp, int8_t *data, size_t n=1) |
bool | DeSerialize (FILE *fp, int16_t *data, size_t n=1) |
bool | DeSerialize (FILE *fp, int32_t *data, size_t n=1) |
bool | DeSerialize (FILE *fp, uint8_t *data, size_t n=1) |
bool | DeSerialize (FILE *fp, uint16_t *data, size_t n=1) |
bool | DeSerialize (FILE *fp, uint32_t *data, size_t n=1) |
bool | Serialize (FILE *fp, const char *data, size_t n=1) |
bool | Serialize (FILE *fp, const float *data, size_t n=1) |
bool | Serialize (FILE *fp, const int8_t *data, size_t n=1) |
bool | Serialize (FILE *fp, const int16_t *data, size_t n=1) |
bool | Serialize (FILE *fp, const int32_t *data, size_t n=1) |
bool | Serialize (FILE *fp, const uint8_t *data, size_t n=1) |
bool | Serialize (FILE *fp, const uint16_t *data, size_t n=1) |
bool | Serialize (FILE *fp, const uint32_t *data, size_t n=1) |
double | DotProductNative (const double *u, const double *v, int n) |
double | DotProductAVX (const double *u, const double *v, int n) |
double | DotProductFMA (const double *u, const double *v, int n) |
double | DotProductSSE (const double *u, const double *v, int n) |
bool | IsTextOrEquationType (PolyBlockType type) |
bool | IsLeftIndented (const EquationDetect::IndentType type) |
bool | IsRightIndented (const EquationDetect::IndentType type) |
bool | AsciiLikelyListItem (const STRING &word) |
int | UnicodeFor (const UNICHARSET *u, const WERD_CHOICE *werd, int pos) |
void | LeftWordAttributes (const UNICHARSET *unicharset, const WERD_CHOICE *werd, const STRING &utf8, bool *is_list, bool *starts_idea, bool *ends_idea) |
void | RightWordAttributes (const UNICHARSET *unicharset, const WERD_CHOICE *werd, const STRING &utf8, bool *is_list, bool *starts_idea, bool *ends_idea) |
bool | ValidFirstLine (const GenericVector< RowScratchRegisters > *rows, int row, const ParagraphModel *model) |
bool | ValidBodyLine (const GenericVector< RowScratchRegisters > *rows, int row, const ParagraphModel *model) |
bool | CrownCompatible (const GenericVector< RowScratchRegisters > *rows, int a, int b, const ParagraphModel *model) |
void | RecomputeMarginsAndClearHypotheses (GenericVector< RowScratchRegisters > *rows, int start, int end, int percentile) |
int | InterwordSpace (const GenericVector< RowScratchRegisters > &rows, int row_start, int row_end) |
bool | FirstWordWouldHaveFit (const RowScratchRegisters &before, const RowScratchRegisters &after, tesseract::ParagraphJustification justification) |
bool | FirstWordWouldHaveFit (const RowScratchRegisters &before, const RowScratchRegisters &after) |
bool | RowsFitModel (const GenericVector< RowScratchRegisters > *rows, int start, int end, const ParagraphModel *model) |
void | CanonicalizeDetectionResults (GenericVector< PARA * > *row_owners, PARA_LIST *paragraphs) |
void | DetectParagraphs (int debug_level, GenericVector< RowInfo > *row_infos, GenericVector< PARA * > *row_owners, PARA_LIST *paragraphs, GenericVector< ParagraphModel * > *models) |
void | DetectParagraphs (int debug_level, bool after_text_recognition, const MutableIterator *block_start, GenericVector< ParagraphModel * > *models) |
bool | StrongModel (const ParagraphModel *model) |
bool | CompareFontInfo (const FontInfo &fi1, const FontInfo &fi2) |
bool | CompareFontSet (const FontSet &fs1, const FontSet &fs2) |
void | FontInfoDeleteCallback (FontInfo f) |
void | FontSetDeleteCallback (FontSet fs) |
bool | read_info (TFile *f, FontInfo *fi) |
bool | write_info (FILE *f, const FontInfo &fi) |
bool | read_spacing_info (TFile *f, FontInfo *fi) |
bool | write_spacing_info (FILE *f, const FontInfo &fi) |
bool | read_set (TFile *f, FontSet *fs) |
bool | write_set (FILE *f, const FontSet &fs) |
int | OtsuThreshold (Pix *src_pix, int left, int top, int width, int height, int **thresholds, int **hi_values) |
void | HistogramRect (Pix *src_pix, int channel, int left, int top, int width, int height, int *histogram) |
int | OtsuStats (const int *histogram, int *H_out, int *omega0_out) |
int | ParamsTrainingFeatureByName (const char *name) |
const char * | ScriptPosToString (enum ScriptPos script_pos) |
void | ExtractFontName (const STRING &filename, STRING *fontname) |
TrainingSample * | BlobToTrainingSample (const TBLOB &blob, bool nonlinear_norm, INT_FX_RESULT_STRUCT *fx_info, GenericVector< INT_FEATURE_STRUCT > *bl_features) |
void | ClearFeatureSpaceWindow (NORM_METHOD norm_method, ScrollView *window) |
double | Tanh (double x) |
double | Logistic (double x) |
template<class Func > | |
void | FuncInplace (int n, double *inout) |
template<class Func > | |
void | FuncMultiply (const double *u, const double *v, int n, double *out) |
template<typename T > | |
void | SoftmaxInPlace (int n, T *inout) |
void | CopyVector (int n, const double *src, double *dest) |
void | AccumulateVector (int n, const double *src, double *dest) |
void | MultiplyVectorsInPlace (int n, const double *src, double *inout) |
void | MultiplyAccumulate (int n, const double *u, const double *v, double *out) |
void | SumVectors (int n, const double *v1, const double *v2, const double *v3, const double *v4, const double *v5, double *sum) |
template<typename T > | |
void | ZeroVector (int n, T *vec) |
template<typename T > | |
void | ClipVector (int n, T lower, T upper, T *vec) |
void | CodeInBinary (int n, int nf, double *vec) |
Pix * | TraceOutlineOnReducedPix (C_OUTLINE *outline, int gridsize, ICOORD bleft, int *left, int *bottom) |
Pix * | TraceBlockOnReducedPix (BLOCK *block, int gridsize, ICOORD bleft, int *left, int *bottom) |
template<class BBC > | |
int | SortByBoxLeft (const void *void1, const void *void2) |
template<class BBC > | |
int | SortRightToLeft (const void *void1, const void *void2) |
template<class BBC > | |
int | SortByBoxBottom (const void *void1, const void *void2) |
template<typename T > | |
void | DeleteObject (T *object) |
void | SetBlobStrokeWidth (Pix *pix, BLOBNBOX *blob) |
void | assign_blobs_to_blocks2 (Pix *pix, BLOCK_LIST *blocks, TO_BLOCK_LIST *port_blocks) |
void | ParseCommandLineFlags (const char *usage, int *argc, char ***argv, const bool remove_flags) |
ShapeTable * | LoadShapeTable (const STRING &file_prefix) |
void | WriteShapeTable (const STRING &file_prefix, const ShapeTable &shape_table) |
MasterTrainer * | LoadTrainingData (int argc, const char *const *argv, bool replication, ShapeTable **shape_table, STRING *file_prefix) |
Pix * | DegradeImage (Pix *input, int exposure, TRand *randomizer, float *rotation) |
Pix * | PrepareDistortedPix (const Pix *pix, bool perspective, bool invert, bool white_noise, bool smooth_noise, bool blur, int box_reduction, TRand *randomizer, GenericVector< TBOX > *boxes) |
void | GeneratePerspectiveDistortion (int width, int height, TRand *randomizer, Pix **pix, GenericVector< TBOX > *boxes) |
int | ProjectiveCoeffs (int width, int height, TRand *randomizer, float **im_coeffs, float **box_coeffs) |
bool | LoadFileLinesToStrings (const char *filename, GenericVector< STRING > *lines) |
bool | WriteFile (const std::string &output_dir, const std::string &lang, const std::string &suffix, const GenericVector< char > &data, FileWriter writer) |
STRING | ReadFile (const std::string &filename, FileReader reader) |
bool | WriteUnicharset (const UNICHARSET &unicharset, const std::string &output_dir, const std::string &lang, FileWriter writer, TessdataManager *traineddata) |
bool | WriteRecoder (const UNICHARSET &unicharset, bool pass_through, const std::string &output_dir, const std::string &lang, FileWriter writer, STRING *radical_table_data, TessdataManager *traineddata) |
int | CombineLangModel (const UNICHARSET &unicharset, const std::string &script_dir, const std::string &version_str, const std::string &output_dir, const std::string &lang, bool pass_through_recoder, const GenericVector< STRING > &words, const GenericVector< STRING > &puncs, const GenericVector< STRING > &numbers, bool lang_is_rtl, FileReader reader, FileWriter writer) |
bool | NormalizeUTF8String (UnicodeNormMode u_mode, OCRNorm ocr_normalize, GraphemeNorm grapheme_normalize, const char *str8, std::string *normalized) |
bool | NormalizeCleanAndSegmentUTF8 (UnicodeNormMode u_mode, OCRNorm ocr_normalize, GraphemeNormMode g_mode, bool report_errors, const char *str8, std::vector< std::string > *graphemes) |
char32 | OCRNormalize (char32 ch) |
bool | IsOCREquivalent (char32 ch1, char32 ch2) |
bool | IsValidCodepoint (const char32 ch) |
bool | IsWhitespace (const char32 ch) |
bool | IsUTF8Whitespace (const char *text) |
unsigned int | SpanUTF8Whitespace (const char *text) |
unsigned int | SpanUTF8NotWhitespace (const char *text) |
bool | IsInterchangeValid (const char32 ch) |
bool | IsInterchangeValid7BitAscii (const char32 ch) |
char32 | FullwidthToHalfwidth (const char32 ch) |
void | SetupBasicProperties (bool report_errors, bool decompose, UNICHARSET *unicharset) |
void | SetScriptProperties (const std::string &script_dir, UNICHARSET *unicharset) |
std::string | GetXheightString (const std::string &script_dir, const UNICHARSET &unicharset) |
void | SetPropertiesForInputFile (const std::string &script_dir, const std::string &input_unicharset_file, const std::string &output_unicharset_file, const std::string &output_xheights_file) |
void | SetupBasicProperties (bool report_errors, UNICHARSET *unicharset) |
template<class BLOB_CHOICE > | |
int | SortByUnicharID (const void *void1, const void *void2) |
template<class BLOB_CHOICE > | |
int | SortByRating (const void *void1, const void *void2) |
TEST_F (EquationFinderTest, IdentifySpecialText) | |
TEST_F (EquationFinderTest, EstimateTypeForUnichar) | |
TEST_F (EquationFinderTest, IsIndented) | |
TEST_F (EquationFinderTest, IsNearSmallNeighbor) | |
TEST_F (EquationFinderTest, CheckSeedBlobsCount) | |
TEST_F (EquationFinderTest, ComputeForegroundDensity) | |
TEST_F (EquationFinderTest, CountAlignment) | |
TEST_F (EquationFinderTest, ComputeCPsSuperBBox) | |
TEST_F (EquationFinderTest, SplitCPHorLite) | |
TEST_F (EquationFinderTest, SplitCPHor) | |
TEST_F (HeapTest, SortTest) | |
TEST_F (HeapTest, MixedTest) | |
TEST_F (HeapTest, PopWorstTest) | |
TEST_F (HeapTest, RevalueTest) | |
TEST_F (HeapTest, DoublePtrTest) | |
TEST_F (LSTMTrainerTest, RecodeTestKorBase) | |
TEST_F (LSTMTrainerTest, RecodeTestKor) | |
TEST_F (LSTMTrainerTest, EncodeDecodeBothTestKor) | |
TEST_F (LSTMTrainerTest, TestSquashed) | |
TEST_F (LSTMTrainerTest, BasicTest) | |
TEST_F (LSTMTrainerTest, ColorTest) | |
TEST_F (LSTMTrainerTest, BidiTest) | |
TEST_F (LSTMTrainerTest, Test2D) | |
TEST_F (LSTMTrainerTest, TestAdam) | |
TEST_F (LSTMTrainerTest, SpeedTest) | |
TEST_F (LSTMTrainerTest, DeterminismTest) | |
TEST_F (LSTMTrainerTest, SoftmaxBaselineTest) | |
TEST_F (LSTMTrainerTest, SoftmaxTest) | |
TEST_F (LSTMTrainerTest, EncodedSoftmaxTest) | |
TEST_F (LSTMTrainerTest, TestLayerAccess) | |
std::string | CodepointList (const std::vector< char32 > &str32) |
std::string | PrintString32WithUnicodes (const std::string &str) |
std::string | PrintStringVectorWithUnicodes (const std::vector< std::string > &glyphs) |
void | ExpectGraphemeModeResults (const std::string &str, UnicodeNormMode u_mode, int unicode_count, int glyph_count, int grapheme_count, const std::string &target_str) |
TEST_F (NthItemTest, GeneralTest) | |
TEST_F (NthItemTest, BoringTest) | |
TEST_F (NthItemTest, UniqueTest) | |
TEST_F (NthItemTest, EqualTest) | |
Variables | |
const int | kMinRectSize = 10 |
const char | kTesseractReject = '~' |
const char | kUNLVReject = '~' |
const char | kUNLVSuspect = '^' |
const int | kMaxIntSize = 22 |
const int | kNumbersPerBlob = 5 |
const int | kBytesPerNumber = 5 |
const int | kBytesPerBoxFileLine = (kBytesPerNumber + 1) * kNumbersPerBlob + 1 |
const int | kBytesPer64BitNumber = 20 |
const int | kMaxBytesPerLine |
const int | kUniChs [] |
const int | kLatinChs [] |
constexpr int | kNumOutputsPerRegister = 8 |
constexpr int | kMaxOutputRegisters = 8 |
constexpr int | kNumInputsPerRegister = 32 |
constexpr int | kNumInputsPerGroup = 4 |
constexpr int | kNumInputGroups = kNumInputsPerRegister / kNumInputsPerGroup |
DotProductFunction | DotProduct |
const float | kMathDigitDensityTh1 = 0.25 |
const float | kMathDigitDensityTh2 = 0.1 |
const float | kMathItalicDensityTh = 0.5 |
const float | kUnclearDensityTh = 0.25 |
const int | kSeedBlobsCountTh = 10 |
const int | kLeftIndentAlignmentCountTh = 1 |
const int | kMaxCharTopRange = 48 |
const float | kCertaintyScale = 7.0f |
const float | kWorstDictCertainty = -25.0f |
const int | kMaxCircleErosions = 8 |
const ParagraphModel * | kCrownLeft = reinterpret_cast<ParagraphModel *>(static_cast<uintptr_t>(0xDEAD111F)) |
const ParagraphModel * | kCrownRight = reinterpret_cast<ParagraphModel *>(static_cast<uintptr_t>(0xDEAD888F)) |
const int16_t | kMaxBoxEdgeDiff = 2 |
const int | kBoxClipTolerance = 2 |
const int | kNumEndPoints = 3 |
const int | kMinPointsForErrorCount = 16 |
const int | kMaxRealDistance = 2.0 |
const int | kFeaturePadding = 2 |
const int | kImagePadding = 4 |
const int | kHistogramSize = 256 |
const int | kMaxAmbigStringSize = UNICHAR_LEN * (MAX_AMBIG_SIZE + 1) |
const int | kRadicalRadix = 29 |
const char *const | kLRM = "\u200E" |
Left-to-Right Mark. More... | |
const char *const | kRLM = "\u200F" |
Right-to-Left Mark. More... | |
const char *const | kRLE = "\u202A" |
Right-to-Left Embedding. More... | |
const char *const | kPDF = "\u202C" |
Pop Directional Formatting. More... | |
const char | kUniversalAmbigsFile [] |
const int | ksizeofUniversalAmbigsFile = sizeof(kUniversalAmbigsFile) |
const int | kRandomizingCenter = 128 |
const int | case_state_table [6][4] |
const char | kDoNotReverse [] = "RRP_DO_NO_REVERSE" |
const char | kReverseIfHasRTL [] = "RRP_REVERSE_IF_HAS_RTL" |
const char | kForceReverse [] = "RRP_FORCE_REVERSE" |
const char *const | RTLReversePolicyNames [] |
const double | TanhTable [] |
const double | LogisticTable [] |
constexpr int | kTableSize = 4096 |
constexpr double | kScaleFactor = 256.0 |
const int | kMaxInputHeight = 48 |
const double | kStateClip = 100.0 |
const double | kErrClip = 1.0f |
const double | kDictRatio = 2.25 |
const double | kCertOffset = -0.085 |
const int | kMinWinSize = 500 |
const int | kMaxWinSize = 2000 |
const int | kXWinFrameSize = 30 |
const int | kYWinFrameSize = 80 |
const float | kMinCertainty = -20.0f |
const float | kMinProb = exp(kMinCertainty) |
class tesseract::TFNetworkModelDefaultTypeInternal | _TFNetworkModel_default_instance_ |
const int | kAdamCorrectionIterations = 200000 |
const double | kAdamEpsilon = 1e-8 |
const int | kInt8Flag = 1 |
const int | kAdamFlag = 4 |
const int | kDoubleFlag = 128 |
const int | kHistogramBuckets = 16 |
const double | kAlignedFraction = 0.03125 |
const double | kRaggedFraction = 2.5 |
const double | kAlignedGapFraction = 0.75 |
const double | kRaggedGapFraction = 1.0 |
const int | kVLineAlignment = 3 |
const int | kVLineGutter = 1 |
const int | kVLineSearchSize = 150 |
const int | kMinRaggedTabs = 5 |
const int | kMinAlignedTabs = 4 |
const int | kVLineMinLength = 500 |
const double | kMinTabGradient = 4.0 |
const int | kMaxSkewFactor = 15 |
const double | kMaxSmallNeighboursPerPix = 1.0 / 32 |
const int | kMaxLargeOverlapsWithSmall = 3 |
const int | kMaxMediumOverlapsWithSmall = 12 |
const int | kMaxLargeOverlapsWithMedium = 12 |
const int | kOriginalNoiseMultiple = 8 |
const int | kNoisePadding = 4 |
const double | kPhotoOffsetFraction = 0.375 |
const double | kMinGoodTextPARatio = 1.5 |
const int | kMaxIncompatibleColumnCount = 2 |
const double | kHorizontalGapMergeFraction = 0.5 |
const double | kMinGutterWidthGrid = 0.5 |
const double | kMaxDistToPartSizeRatio = 1.5 |
const double | kMaxSpacingDrift = 1.0 / 72 |
const double | kMaxTopSpacingFraction = 0.25 |
const double | kMaxSameBlockLineSpacing = 3 |
const double | kMaxSizeRatio = 1.5 |
const double | kMaxLeaderGapFractionOfMax = 0.25 |
const double | kMaxLeaderGapFractionOfMin = 0.5 |
const int | kMinLeaderCount = 5 |
const int | kMinStrongTextValue = 6 |
const int | kMinChainTextValue = 3 |
const int | kHorzStrongTextlineCount = 8 |
const int | kHorzStrongTextlineHeight = 10 |
const int | kHorzStrongTextlineAspect = 5 |
const double | kMaxBaselineError = 0.4375 |
const double | kMinBaselineCoverage = 0.5 |
const int | kMaxRMSColorNoise = 128 |
const int | kMaxColorDistance = 900 |
const int | kRGBRMSColors = 4 |
const int | kMaxPadFactor = 6 |
const int | kMaxNeighbourDistFactor = 4 |
const int | kMaxCaptionLines = 7 |
const double | kMinCaptionGapRatio = 2.0 |
const double | kMinCaptionGapHeightRatio = 0.5 |
const double | kMarginOverlapFraction = 0.25 |
const double | kBigPartSizeRatio = 1.75 |
const double | kTinyEnoughTextlineOverlapFraction = 0.25 |
const double | kMaxPartitionSpacing = 1.75 |
const int | kSmoothDecisionMargin = 4 |
const double | kMinColumnWidth = 2.0 / 3 |
const double | kMinRectangularFraction = 0.125 |
const double | kMaxRectangularFraction = 0.75 |
const double | kMaxRectangularGradient = 0.1 |
const int | kMinImageFindSize = 100 |
const double | kRMSFitScaling = 8.0 |
const int | kMinColorDifference = 16 |
const int | kThinLineFraction = 20 |
Denominator of resolution makes max pixel width to allow thin lines. More... | |
const int | kMinLineLengthFraction = 4 |
Denominator of resolution makes min pixels to demand line lengths to be. More... | |
const int | kCrackSpacing = 100 |
Spacing of cracks across the page to break up tall vertical lines. More... | |
const int | kLineFindGridSize = 50 |
Grid size used by line finder. Not very critical. More... | |
const int | kMinThickLineWidth = 12 |
const int | kMaxLineResidue = 6 |
const double | kThickLengthMultiple = 0.75 |
const double | kMaxNonLineDensity = 0.25 |
const double | kMaxStaveHeight = 1.0 |
const double | kMinMusicPixelFraction = 0.75 |
const double | kStrokeWidthFractionTolerance = 0.125 |
const double | kStrokeWidthTolerance = 1.5 |
const double | kStrokeWidthFractionCJK = 0.25 |
const double | kStrokeWidthCJK = 2.0 |
const int | kCJKRadius = 2 |
const double | kCJKBrokenDistanceFraction = 0.25 |
const int | kCJKMaxComponents = 8 |
const double | kCJKAspectRatio = 1.25 |
const double | kCJKAspectRatioIncrease = 1.0625 |
const int | kMaxCJKSizeRatio = 5 |
const double | kBrokenCJKIterationFraction = 0.125 |
const double | kDiacriticXPadRatio = 7.0 |
const double | kDiacriticYPadRatio = 1.75 |
const double | kMinDiacriticSizeRatio = 1.0625 |
const double | kMaxDiacriticDistanceRatio = 1.25 |
const double | kMaxDiacriticGapToBaseCharHeight = 1.0 |
const int | kLineTrapLongest = 4 |
const int | kLineTrapShortest = 2 |
const int | kMostlyOneDirRatio = 3 |
const double | kLineResidueAspectRatio = 8.0 |
const int | kLineResiduePadRatio = 3 |
const double | kLineResidueSizeRatio = 1.75 |
const float | kSizeRatioToReject = 2.0 |
const double | kNeighbourSearchFactor = 2.5 |
const double | kNoiseOverlapGrowthFactor = 4.0 |
const double | kNoiseOverlapAreaFactor = 1.0 / 512 |
const int | kTabRadiusFactor = 5 |
const int | kMinVerticalSearch = 3 |
const int | kMaxVerticalSearch = 12 |
const int | kMaxRaggedSearch = 25 |
const int | kMinLinesInColumn = 10 |
const double | kMinFractionalLinesInColumn = 0.125 |
const double | kMaxGutterWidthAbsolute = 2.00 |
const int | kRaggedGutterMultiple = 5 |
const double | kLineFragmentAspectRatio = 10.0 |
const int | kMinEvaluatedTabs = 3 |
const double | kCosMaxSkewAngle = 0.866025 |
const int | kColumnWidthFactor = 20 |
const int | kMaxVerticalSpacing = 500 |
const int | kMaxBlobWidth = 500 |
const double | kSplitPartitionSize = 2.0 |
const double | kAllowTextHeight = 0.5 |
const double | kAllowTextWidth = 0.6 |
const double | kAllowTextArea = 0.8 |
const double | kAllowBlobHeight = 0.3 |
const double | kAllowBlobWidth = 0.4 |
const double | kAllowBlobArea = 0.05 |
const int | kMinBoxesInTextPartition = 10 |
const int | kMaxBoxesInDataPartition = 20 |
const double | kMaxGapInTextPartition = 4.0 |
const double | kMinMaxGapInTextPartition = 0.5 |
const double | kMaxBlobOverlapFactor = 4.0 |
const double | kMaxTableCellXheight = 2.0 |
const int | kMaxColumnHeaderDistance = 4 |
const double | kTableColumnThreshold = 3.0 |
const double | kMinOverlapWithTable = 0.6 |
const int | kSideSpaceMargin = 10 |
const double | kSmallTableProjectionThreshold = 0.35 |
const double | kLargeTableProjectionThreshold = 0.45 |
const int | kLargeTableRowCount = 6 |
const int | kMinRowsInTable = 3 |
const int | kAdjacentLeaderSearchPadding = 2 |
const double | kParagraphEndingPreviousLineRatio = 1.3 |
const double | kMaxParagraphEndingLeftSpaceMultiple = 3.0 |
const double | kMinParagraphEndingTextToWhitespaceRatio = 3.0 |
const double | kMaxXProjectionGapFactor = 2.0 |
const double | kStrokeWidthFractionalTolerance = 0.25 |
const double | kStrokeWidthConstantTolerance = 2.0 |
const double | kHorizontalSpacing = 0.30 |
const double | kVerticalSpacing = -0.2 |
const int | kCellSplitRowThreshold = 0 |
const int | kCellSplitColumnThreshold = 0 |
const int | kLinedTableMinVerticalLines = 3 |
const int | kLinedTableMinHorizontalLines = 3 |
const double | kRequiredColumns = 0.7 |
const double | kMarginFactor = 1.1 |
const double | kMaxRowSize = 2.5 |
const double | kGoodRowNumberOfColumnsSmall [] = { 2, 2, 2, 2, 2, 3, 3 } |
const int | kGoodRowNumberOfColumnsSmallSize |
const double | kGoodRowNumberOfColumnsLarge = 0.7 |
const double | kMinFilledArea = 0.35 |
const int | kGutterMultiple = 4 |
const int | kGutterToNeighbourRatio = 3 |
const int | kSimilarVectorDist = 10 |
const int | kSimilarRaggedDist = 50 |
const int | kMaxFillinMultiple = 11 |
const double | kMinGutterFraction = 0.5 |
const double | kLineCountReciprocal = 4.0 |
const double | kMinAlignedGutter = 0.25 |
const double | kMinRaggedGutter = 1.5 |
double | textord_tabvector_vertical_gap_fraction = 0.5 |
double | textord_tabvector_vertical_box_ratio = 0.5 |
const int | kMaxLineLength = 1024 |
const float | kRotationRange = 0.02f |
const int | kExposureFactor = 16 |
const int | kSaltnPepper = 5 |
const int | kMinRampSize = 1000 |
const double | kRatingEpsilon = 1.0 / 32 |
const int | kMaxOffsetDist = 32 |
const int | kMinLigature = 0xfb00 |
const int | kMaxLigature = 0xfb17 |
const double | kMinDivergenceRate = 50.0 |
const int | kMinStallIterations = 10000 |
const double | kSubTrainerMarginFraction = 3.0 / 128 |
const double | kLearningRateDecay = M_SQRT1_2 |
const int | kNumAdjustmentIterations = 100 |
const int | kErrorGraphInterval = 1000 |
const int | kNumPagesPerBatch = 100 |
const int | kMinStartedErrorRate = 75 |
const double | kStageTransitionThreshold = 10.0 |
const double | kHighConfidence = 0.9375 |
const double | kImprovementFraction = 15.0 / 16.0 |
const double | kBestCheckpointFraction = 31.0 / 32.0 |
const int | kTargetXScale = 5 |
const int | kTargetYScale = 100 |
const int | kMinClusteredShapes = 1 |
const int | kMaxUnicharsPerCluster = 2000 |
const float | kFontMergeDistance = 0.025 |
const float | kInfiniteDist = 999.0f |
const int | kDefaultResolution = 300 |
const int | kTestChar = -1 |
const int | kSquareLimit = 25 |
const int | kPrime1 = 17 |
const int | kPrime2 = 13 |
int | test_data [] = {8, 1, 2, -4, 7, 9, 65536, 4, 9, 0} |
const int | kTrainerIterations = 600 |
const int | kBatchIterations = 100 |
The box file is assumed to contain box definitions, one per line, of the following format for blob-level boxes:
* <UTF8 str> <left> <bottom> <right> <top> <page id> *
and for word/line-level boxes:
* WordStr <left> <bottom> <right> <top> <page id> #<space-delimited word str> *
NOTES: The boxes use tesseract coordinates, i.e. 0,0 is at BOTTOM-LEFT.
<page id> is 0-based, and the page number is used for multipage input (tiff).
In the blob-level form, each line represents a recognizable unit, which may be several UTF-8 bytes, but there is a bounding box around each recognizable unit, and no classifier is needed to train in this mode (bootstrapping.)
In the word/line-level form, the line begins with the literal "WordStr", and the bounding box bounds either a whole line or a whole word. The recognizable units in the word/line are listed after the # at the end of the line and are space delimited, ignoring any original spaces on the line. Eg.
* word -> #w o r d
* multi word line -> #m u l t i w o r d l i n e
The recognizable units must be space-delimited in order to allow multiple unicodes to be used for a single recognizable unit, eg Hindi.
In this mode, the classifier must have been pre-trained with the desired character set, or it will not be able to find the character segmentations.
Make a word from the selected blobs and run Tess on them.
page_res | recognise blobs |
selection_box | within this box |
fp_eval_word_spacing() Evaluation function for fixed pitch word lists.
Basically, count the number of "nice" characters - those which are in tess-acceptable words or in dict words and are not rejected. Penalise any potential noise chars.
build_menu()
Construct the menu tree used by the command window
process_cmd_win_event()
Process a command returned from the command window (just call the appropriate command handler).
word_blank_and_set_display() Word processor
Blank display of word then redisplay word according to current display mode settings
using tesseract::BlobGridSearch = typedef GridSearch<BLOBNBOX, BLOBNBOX_CLIST, BLOBNBOX_C_IT> |
Definition at line 31 of file blobgrid.h.
using tesseract::char32 = typedef signed int |
using tesseract::ColPartitionGridSearch = typedef GridSearch<ColPartition, ColPartition_CLIST, ColPartition_C_IT> |
Definition at line 935 of file colpartition.h.
using tesseract::ColSegmentGrid = typedef BBGrid<ColSegment, ColSegment_CLIST, ColSegment_C_IT> |
Definition at line 117 of file tablefind.h.
using tesseract::ColSegmentGridSearch = typedef GridSearch<ColSegment, ColSegment_CLIST, ColSegment_C_IT> |
Definition at line 120 of file tablefind.h.
using tesseract::DawgVector = typedef GenericVector<Dawg *> |
using tesseract::DictFunc = typedef int (Dict::*)(void*, const UNICHARSET&, UNICHAR_ID, bool) const |
using tesseract::DotProductFunction = typedef double (*)(const double*, const double*, int) |
Definition at line 25 of file simddetect.h.
using tesseract::FileReader = typedef bool (*)(const char* filename, GenericVector<char>* data) |
Definition at line 47 of file serialis.h.
using tesseract::FileWriter = typedef bool (*)(const GenericVector<char>& data, const char* filename) |
Definition at line 51 of file serialis.h.
using tesseract::FillLatticeFunc = typedef void (Wordrec::*)(const MATRIX&, const WERD_CHOICE_LIST&, const UNICHARSET&, BlamerBundle*) |
using tesseract::IntKDPair = typedef KDPairInc<int, int> |
using tesseract::LanguageModelFlagsType = typedef unsigned char |
Used for expressing various language model flags.
Definition at line 37 of file lm_state.h.
using tesseract::LigHash = typedef std::unordered_map<std::string, std::string, StringHash> |
Definition at line 53 of file ligature_table.h.
using tesseract::NodeChildVector = typedef GenericVector<NodeChild> |
using tesseract::PainPointHeap = typedef GenericHeap<MatrixCoordPair> |
Definition at line 37 of file lm_pain_points.h.
using tesseract::ParamsModelClassifyFunc = typedef float (Dict::*)(const char*, void*) |
using tesseract::ParamsTrainingHypothesisList = typedef GenericVector<ParamsTrainingHypothesis> |
Definition at line 127 of file params_training_featdef.h.
using tesseract::PartSetVector = typedef GenericVector<ColPartitionSet*> |
Definition at line 33 of file colpartitionset.h.
using tesseract::ProbabilityInContextFunc = typedef double (Dict::*)(const char*, const char*, int, const char*, int) |
using tesseract::RecodeHeap = typedef GenericHeap<RecodePair> |
Definition at line 177 of file recodebeam.h.
using tesseract::RecodePair = typedef KDPairInc<double, RecodeNode> |
Definition at line 176 of file recodebeam.h.
using tesseract::RSCounts = typedef std::unordered_map<int, int> |
Definition at line 48 of file unicharcompress.cpp.
using tesseract::RSMap = typedef std::unordered_map<int, std::unique_ptr<std::vector<int> >> |
Definition at line 46 of file unicharcompress.cpp.
using tesseract::SetOfModels = typedef GenericVectorEqEq<const ParagraphModel *> |
Definition at line 98 of file paragraphs_internal.h.
using tesseract::ShapeQueue = typedef GenericHeap<ShapeQueueEntry> |
Definition at line 155 of file shapetable.h.
using tesseract::SuccessorList = typedef GenericVector<int> |
using tesseract::SuccessorListsVector = typedef GenericVector<SuccessorList *> |
using tesseract::TestCallback = typedef std::function<STRING(int, const double*, const TessdataManager&, int)> |
Definition at line 73 of file lstmtrainer.h.
using tesseract::TruthCallback = typedef std::function<void(const UNICHARSET&, int, PageIterator*, Pix*)> |
using tesseract::UnicharAmbigsVector = typedef GenericVector<AmbigSpec_LIST *> |
using tesseract::UnicharIdVector = typedef GenericVector<UNICHAR_ID> |
using tesseract::WidthCallback = typedef std::function<bool(int)> |
using tesseract::WordGrid = typedef BBGrid<WordWithBox, WordWithBox_CLIST, WordWithBox_C_IT> |
using tesseract::WordRecognizer = typedef void (Tesseract::*)(const WordData&, WERD_RES**, PointerVector<WERD_RES>*) |
Definition at line 170 of file tesseractclass.h.
using tesseract::WordSearch = typedef GridSearch<WordWithBox, WordWithBox_CLIST, WordWithBox_C_IT> |
enum tesseract::AmbigType |
Enumerator | |
---|---|
ACTION_1_CMD_EVENT | |
RECOG_WERDS | |
RECOG_PSEUDO | |
ACTION_2_CMD_EVENT |
Definition at line 486 of file tessedit.cpp.
Enumerator | |
---|---|
COL_UNKNOWN | |
COL_TEXT | |
COL_TABLE | |
COL_MIXED | |
COL_COUNT |
Definition at line 29 of file tablefind.h.
Enumerator | |
---|---|
CST_NOISE | |
CST_FLOWING | |
CST_HEADING | |
CST_PULLOUT | |
CST_COUNT |
Definition at line 47 of file colpartition.h.
Definition at line 69 of file errorcounter.h.
enum tesseract::DawgType |
Enumerator | |
---|---|
ET_RMS | |
ET_DELTA | |
ET_WORD_RECERR | |
ET_CHAR_ERROR | |
ET_SKIP_RATIO | |
ET_COUNT |
Definition at line 37 of file lstmtrainer.h.
Enumerator | |
---|---|
FN_INCOLOR | |
FN_Y0 | |
FN_Y1 | |
FN_Y2 | |
FN_Y3 | |
FN_X0 | |
FN_X1 | |
FN_SHEAR | |
FN_NUM_FACTORS |
Definition at line 58 of file degradeimage.cpp.
|
strong |
Enumerator | |
---|---|
kNone | |
kNormalize |
Definition at line 65 of file normstrngs.h.
|
strong |
Enumerator | |
---|---|
kSingleString | |
kCombined | |
kGlyphSplit | |
kIndividualUnicodes |
Definition at line 48 of file validator.h.
Definition at line 39 of file params_training_featdef.h.
Enumerator | |
---|---|
LR_LEFT | |
LR_RIGHT |
Definition at line 39 of file strokewidth.h.
enum tesseract::LineType |
Enumerator | |
---|---|
LT_START | |
LT_BODY | |
LT_UNKNOWN | |
LT_MULTIPLE |
Definition at line 49 of file paragraphs_internal.h.
Enumerator | |
---|---|
LM_PPTYPE_BLAMER | |
LM_PPTYPE_AMBIG | |
LM_PPTYPE_PATH | |
LM_PPTYPE_SHAPE | |
LM_PPTYPE_NUM |
Definition at line 40 of file lm_pain_points.h.
enum tesseract::LossType |
Enumerator | |
---|---|
NPT_HTEXT | |
NPT_VTEXT | |
NPT_WEAK_HTEXT | |
NPT_WEAK_VTEXT | |
NPT_IMAGE | |
NPT_COUNT |
Definition at line 1501 of file colpartitiongrid.cpp.
Definition at line 43 of file network.h.
Enumerator | |
---|---|
NM_BASELINE | |
NM_CHAR_ISOTROPIC | |
NM_CHAR_ANISOTROPIC |
Definition at line 41 of file normalis.h.
When Tesseract/Cube is initialized we can choose to instantiate/load/run only the Tesseract part, only the Cube part or both along with the combiner. The preference of which engine to use is stored in tessedit_ocr_engine_mode.
ATTENTION: When modifying this enum, please make sure to make the appropriate changes to all the enums mirroring it (e.g. OCREngine in cityblock/workflow/detection/detection_storage.proto). Such enums will mention the connection to OcrEngineMode in the comments.
Enumerator | |
---|---|
OEM_TESSERACT_ONLY | |
OEM_LSTM_ONLY | |
OEM_TESSERACT_LSTM_COMBINED | |
OEM_DEFAULT | |
OEM_COUNT |
Definition at line 265 of file publictypes.h.
|
strong |
Enumerator | |
---|---|
kNone | |
kNormalize |
Definition at line 57 of file normstrngs.h.
```
+------------------+  Orientation Example:
| 1 Aaaa Aaaa Aaaa |  ====================
| Aaa aa aaa aa    |  To left is a diagram of some (1) English and
| aaaaaa A aa aaa. |  (2) Chinese text and a (3) photo credit.
|                2 |
|   #######  c c C |  Upright Latin characters are represented as A and a.
|   #######  c c c |  '<' represents a Latin character rotated
| < #######  c c c |      anti-clockwise 90 degrees.
| < #######  c   c |
| < #######  .   c |  Upright Chinese characters are represented C and c.
| 3 #######      c |
+------------------+  NOTA BENE: enum values here should match goodoc.proto
```
If you orient your head so that "up" aligns with Orientation, then the characters will appear "right side up" and readable.
In the example above, both the English and Chinese paragraphs are oriented so their "up" is the top of the page (page up). The photo credit is read with one's head turned leftward ("up" is to page left).
The values of this enum match the convention of Tesseract's osdetect.h
Enumerator | |
---|---|
ORIENTATION_PAGE_UP | |
ORIENTATION_PAGE_RIGHT | |
ORIENTATION_PAGE_DOWN | |
ORIENTATION_PAGE_LEFT |
Definition at line 116 of file publictypes.h.
enum of the elements of the page hierarchy, used in ResultIterator to provide functions that operate on each level without having to have 5x as many functions.
Enumerator | |
---|---|
RIL_BLOCK | |
RIL_PARA | |
RIL_TEXTLINE | |
RIL_WORD | |
RIL_SYMBOL |
Definition at line 216 of file publictypes.h.
Possible modes for page layout analysis. These must be kept in order of decreasing amount of layout analysis to be done, except for OSD_ONLY, so that the inequality test macros below work.
Definition at line 159 of file publictypes.h.
JUSTIFICATION_UNKNOWN The alignment is not clearly one of the other options. This could happen for example if there are only one or two lines of text or the text looks like source code or poetry.
NOTA BENE: Fully justified paragraphs (text aligned to both left and right margins) are marked by Tesseract with JUSTIFICATION_LEFT if their text is written with a left-to-right script and with JUSTIFICATION_RIGHT if their text is written in a right-to-left script.
Interpretation for text read in vertical lines: "Left" is wherever the starting reading position is.
JUSTIFICATION_LEFT Each line, except possibly the first, is flush to the same left tab stop.
JUSTIFICATION_CENTER The text lines of the paragraph are centered about a line going down through the middle of the text lines.
JUSTIFICATION_RIGHT Each line, except possibly the first, is flush to the same right tab stop.
Enumerator | |
---|---|
JUSTIFICATION_UNKNOWN | |
JUSTIFICATION_LEFT | |
JUSTIFICATION_CENTER | |
JUSTIFICATION_RIGHT |
Definition at line 248 of file publictypes.h.
Enumerator | |
---|---|
PFR_OK | |
PFR_SKEW | |
PFR_NOISE |
Definition at line 46 of file strokewidth.h.
enum tesseract::ScriptPos |
Enumerator | |
---|---|
TA_LEFT_ALIGNED | |
TA_LEFT_RAGGED | |
TA_CENTER_JUSTIFIED | |
TA_RIGHT_ALIGNED | |
TA_RIGHT_RAGGED | |
TA_SEPARATOR | |
TA_COUNT |
Definition at line 44 of file tabvector.h.
Definition at line 56 of file tessdatamanager.h.
The text lines are read in the given sequence.
In English, the order is top-to-bottom. In Chinese, vertical text lines are read right-to-left. Mongolian is written in vertical columns top to bottom like Chinese, but the lines are ordered left-to-right.
Note that only some combinations make sense. For example, WRITING_DIRECTION_LEFT_TO_RIGHT implies TEXTLINE_ORDER_TOP_TO_BOTTOM.
Enumerator | |
---|---|
TEXTLINE_ORDER_LEFT_TO_RIGHT | |
TEXTLINE_ORDER_RIGHT_TO_LEFT | |
TEXTLINE_ORDER_TOP_TO_BOTTOM |
Definition at line 148 of file publictypes.h.
enum tesseract::TopNState |
Enumerator | |
---|---|
TRAINABLE | |
PERFECT | |
UNENCODABLE | |
HI_PRECISION_ERR | |
NOT_BOXED |
Definition at line 47 of file lstmtrainer.h.
Enumerator | |
---|---|
TF_INT_MODE | |
TF_COMPRESS_UNICHARSET |
Definition at line 46 of file lstmrecognizer.h.
|
strong |
Enumerator | |
---|---|
kNFD | |
kNFC | |
kNFKD | |
kNFKC |
Definition at line 48 of file normstrngs.h.
|
strong |
Enumerator | |
---|---|
kNonVirama | |
kDevanagari | |
kBengali | |
kGurmukhi | |
kGujarati | |
kOriya | |
kTamil | |
kTelugu | |
kKannada | |
kMalayalam | |
kSinhala | |
kMyanmar | |
kKhmer | |
kJavanese |
Definition at line 67 of file validator.h.
The grapheme clusters within a line of text are laid out logically in this direction, judged when looking at the text line rotated so that its Orientation is "page up".
For English text, the writing direction is left-to-right. For the Chinese text in the above example, the writing direction is top-to-bottom.
Enumerator | |
---|---|
WRITING_DIRECTION_LEFT_TO_RIGHT | |
WRITING_DIRECTION_RIGHT_TO_LEFT | |
WRITING_DIRECTION_TOP_TO_BOTTOM |
Definition at line 131 of file publictypes.h.
|
inline |
Definition at line 174 of file functions.h.
bool tesseract::AsciiLikelyListItem | ( | const STRING & | word | ) |
Definition at line 296 of file paragraphs.cpp.
void tesseract::assign_blobs_to_blocks2 | ( | Pix * | pix, |
BLOCK_LIST * | blocks, | ||
TO_BLOCK_LIST * | port_blocks | ||
) |
Definition at line 165 of file tordmain.cpp.
TrainingSample * tesseract::BlobToTrainingSample | ( | const TBLOB & | blob, |
bool | nonlinear_norm, | ||
INT_FX_RESULT_STRUCT * | fx_info, | ||
GenericVector< INT_FEATURE_STRUCT > * | bl_features | ||
) |
void tesseract::CanonicalizeDetectionResults | ( | GenericVector< PARA * > * | row_owners, |
PARA_LIST * | paragraphs | ||
) |
Definition at line 2252 of file paragraphs.cpp.
void tesseract::ClearFeatureSpaceWindow | ( | NORM_METHOD | norm_method, |
ScrollView * | window | ||
) |
Clears the given window and draws the featurespace guides for the appropriate normalization method.
Definition at line 987 of file intproto.cpp.
|
inline |
Definition at line 208 of file functions.h.
bool tesseract::cmp_eq | ( | T const & | t1, |
T const & | t2 | ||
) |
Definition at line 375 of file genericvector.h.
|
inline |
Definition at line 214 of file functions.h.
|
inline |
Definition at line 24 of file normstrngs_test.h.
int tesseract::CombineLangModel | ( | const UNICHARSET & | unicharset, |
const std::string & | script_dir, | ||
const std::string & | version_str, | ||
const std::string & | output_dir, | ||
const std::string & | lang, | ||
bool | pass_through_recoder, | ||
const GenericVector< STRING > & | words, | ||
const GenericVector< STRING > & | puncs, | ||
const GenericVector< STRING > & | numbers, | ||
bool | lang_is_rtl, | ||
FileReader | reader, | ||
FileWriter | writer | ||
) |
Definition at line 185 of file lang_model_helpers.cpp.
Definition at line 122 of file fontinfo.cpp.
Definition at line 130 of file fontinfo.cpp.
|
inline |
Definition at line 169 of file functions.h.
|
constexpr noexcept |
Definition at line 41 of file serialis.h.
bool tesseract::CrownCompatible | ( | const GenericVector< RowScratchRegisters > * | rows, |
int | a, | ||
int | b, | ||
const ParagraphModel * | model | ||
) |
Definition at line 1314 of file paragraphs.cpp.
struct Pix * tesseract::DegradeImage | ( | Pix * | input, |
int | exposure, | ||
TRand * | randomizer, | ||
float * | rotation | ||
) |
Definition at line 108 of file degradeimage.cpp.
void tesseract::DeleteObject | ( | T * | object | ) |
Definition at line 155 of file tablefind.cpp.
bool tesseract::DeSerialize | ( | FILE * | fp, |
char * | data, | ||
size_t | n = 1 |
||
) |
Definition at line 41 of file serialis.cpp.
bool tesseract::DeSerialize | ( | FILE * | fp, |
float * | data, | ||
size_t | n = 1 |
||
) |
Definition at line 45 of file serialis.cpp.
bool tesseract::DeSerialize | ( | FILE * | fp, |
int16_t * | data, | ||
size_t | n = 1 |
||
) |
Definition at line 53 of file serialis.cpp.
bool tesseract::DeSerialize | ( | FILE * | fp, |
int32_t * | data, | ||
size_t | n = 1 |
||
) |
Definition at line 57 of file serialis.cpp.
bool tesseract::DeSerialize | ( | FILE * | fp, |
int8_t * | data, | ||
size_t | n = 1 |
||
) |
Definition at line 49 of file serialis.cpp.
bool tesseract::DeSerialize | ( | FILE * | fp, |
uint16_t * | data, | ||
size_t | n = 1 |
||
) |
Definition at line 65 of file serialis.cpp.
bool tesseract::DeSerialize | ( | FILE * | fp, |
uint32_t * | data, | ||
size_t | n = 1 |
||
) |
Definition at line 69 of file serialis.cpp.
bool tesseract::DeSerialize | ( | FILE * | fp, |
uint8_t * | data, | ||
size_t | n = 1 |
||
) |
Definition at line 61 of file serialis.cpp.
void tesseract::DetectParagraphs | ( | int | debug_level, |
bool | after_text_recognition, | ||
const MutableIterator * | block_start, | ||
GenericVector< ParagraphModel * > * | models | ||
) |
Definition at line 2527 of file paragraphs.cpp.
void tesseract::DetectParagraphs | ( | int | debug_level, |
GenericVector< RowInfo > * | row_infos, | ||
GenericVector< PARA * > * | row_owners, | ||
PARA_LIST * | paragraphs, | ||
GenericVector< ParagraphModel * > * | models | ||
) |
Definition at line 2284 of file paragraphs.cpp.
double tesseract::DotProductAVX | ( | const double * | u, |
const double * | v, | ||
int | n | ||
) |
Definition at line 30 of file dotproductavx.cpp.
double tesseract::DotProductFMA | ( | const double * | u, |
const double * | v, | ||
int | n | ||
) |
Definition at line 30 of file dotproductfma.cpp.
double tesseract::DotProductNative | ( | const double * | u, |
const double * | v, | ||
int | n | ||
) |
Definition at line 22 of file dotproduct.cpp.
double tesseract::DotProductSSE | ( | const double * | u, |
const double * | v, | ||
int | n | ||
) |
Definition at line 31 of file dotproductsse.cpp.
|
inline |
Definition at line 48 of file normstrngs_test.h.
bool tesseract::FirstWordWouldHaveFit | ( | const RowScratchRegisters & | before, |
const RowScratchRegisters & | after | ||
) |
Definition at line 1671 of file paragraphs.cpp.
bool tesseract::FirstWordWouldHaveFit | ( | const RowScratchRegisters & | before, |
const RowScratchRegisters & | after, | ||
tesseract::ParagraphJustification | justification | ||
) |
Definition at line 1646 of file paragraphs.cpp.
void tesseract::FontInfoDeleteCallback | ( | FontInfo | f | ) |
Definition at line 141 of file fontinfo.cpp.
void tesseract::FontSetDeleteCallback | ( | FontSet | fs | ) |
Definition at line 150 of file fontinfo.cpp.
Definition at line 298 of file normstrngs.cpp.
|
inline |
Definition at line 129 of file functions.h.
|
inline |
Definition at line 138 of file functions.h.
void tesseract::GeneratePerspectiveDistortion | ( | int | width, |
int | height, | ||
TRand * | randomizer, | ||
Pix ** | pix, | ||
GenericVector< TBOX > * | boxes | ||
) |
Definition at line 237 of file degradeimage.cpp.
std::string tesseract::GetXheightString | ( | const std::string & | script_dir, |
const UNICHARSET & | unicharset | ||
) |
Definition at line 164 of file unicharset_training_utils.cpp.
void tesseract::HistogramRect | ( | Pix * | src_pix, |
int | channel, | ||
int | left, | ||
int | top, | ||
int | width, | ||
int | height, | ||
int * | histogram | ||
) |
Definition at line 166 of file otsuthr.cpp.
STRING tesseract::HOcrEscape | ( | const char * | text | ) |
Escape a char string - replace &<>"' with HTML codes.
Definition at line 2307 of file baseapi.cpp.
int tesseract::InterwordSpace | ( | const GenericVector< RowScratchRegisters > & | rows, |
int | row_start, | ||
int | row_end | ||
) |
Definition at line 1623 of file paragraphs.cpp.
bool tesseract::IsInterchangeValid | ( | const char32 | ch | ) |
Definition at line 269 of file normstrngs.cpp.
bool tesseract::IsInterchangeValid7BitAscii | ( | const char32 | ch | ) |
Definition at line 292 of file normstrngs.cpp.
|
inline |
Definition at line 92 of file equationdetect.cpp.
Definition at line 230 of file normstrngs.cpp.
|
inline |
Definition at line 97 of file equationdetect.cpp.
|
inline |
Definition at line 88 of file equationdetect.cpp.
bool tesseract::IsUTF8Whitespace | ( | const char * | text | ) |
Definition at line 245 of file normstrngs.cpp.
bool tesseract::IsValidCodepoint | ( | const char32 | ch | ) |
Definition at line 234 of file normstrngs.cpp.
bool tesseract::IsWhitespace | ( | const char32 | ch | ) |
Definition at line 239 of file normstrngs.cpp.
void tesseract::LeftWordAttributes | ( | const UNICHARSET * | unicharset, |
const WERD_CHOICE * | werd, | ||
const STRING & | utf8, | ||
bool * | is_list, | ||
bool * | starts_idea, | ||
bool * | ends_idea | ||
) |
Definition at line 423 of file paragraphs.cpp.
|
inline |
Definition at line 341 of file genericvector.h.
|
inline |
ShapeTable * tesseract::LoadShapeTable | ( | const STRING & | file_prefix | ) |
Definition at line 154 of file commontraining.cpp.
MasterTrainer * tesseract::LoadTrainingData | ( | int | argc, |
const char *const * | argv, | ||
bool | replication, | ||
ShapeTable ** | shape_table, | ||
STRING * | file_prefix | ||
) |
Creates a MasterTrainer and loads the training data into it: Initializes feature_defs and IntegerFX. Loads the shape_table if shape_table != nullptr. Loads initial unicharset from -U command-line option. If FLAGS_T is set, loads the majority of data from there, else:
Definition at line 211 of file commontraining.cpp.
|
inline |
Definition at line 54 of file functions.h.
|
inline |
Definition at line 184 of file functions.h.
|
inline |
Definition at line 179 of file functions.h.
bool tesseract::NormalizeCleanAndSegmentUTF8 | ( | UnicodeNormMode | u_mode, |
OCRNorm | ocr_normalize, | ||
GraphemeNormMode | g_mode, | ||
bool | report_errors, | ||
const char * | str8, | ||
std::vector< std::string > * | graphemes | ||
) |
Definition at line 188 of file normstrngs.cpp.
bool tesseract::NormalizeUTF8String | ( | UnicodeNormMode | u_mode, |
OCRNorm | ocr_normalize, | ||
GraphemeNorm | grapheme_normalize, | ||
const char * | str8, | ||
std::string * | normalized | ||
) |
Definition at line 163 of file normstrngs.cpp.
Definition at line 220 of file normstrngs.cpp.
int tesseract::OtsuStats | ( | const int * | histogram, |
int * | H_out, | ||
int * | omega0_out | ||
) |
Definition at line 187 of file otsuthr.cpp.
int tesseract::OtsuThreshold | ( | Pix * | src_pix, |
int | left, | ||
int | top, | ||
int | width, | ||
int | height, | ||
int ** | thresholds, | ||
int ** | hi_values | ||
) |
Definition at line 56 of file otsuthr.cpp.
int tesseract::ParamsTrainingFeatureByName | ( | const char * | name | ) |
Definition at line 26 of file params_training_featdef.cpp.
void tesseract::ParseCommandLineFlags | ( | const char * | usage, |
int * | argc, | ||
char *** | argv, | ||
const bool | remove_flags | ||
) |
Definition at line 166 of file commandlineflags.cpp.
Pix * tesseract::PrepareDistortedPix | ( | const Pix * | pix, |
bool | perspective, | ||
bool | invert, | ||
bool | white_noise, | ||
bool | smooth_noise, | ||
bool | blur, | ||
int | box_reduction, | ||
TRand * | randomizer, | ||
GenericVector< TBOX > * | boxes | ||
) |
Definition at line 196 of file degradeimage.cpp.
|
inline |
Definition at line 34 of file normstrngs_test.h.
|
inline |
Definition at line 39 of file normstrngs_test.h.
int tesseract::ProjectiveCoeffs | ( | int | width, |
int | height, | ||
TRand * | randomizer, | ||
float ** | im_coeffs, | ||
float ** | box_coeffs | ||
) |
Definition at line 283 of file degradeimage.cpp.
|
inline |
Definition at line 200 of file publictypes.h.
|
inline |
Definition at line 194 of file publictypes.h.
|
inline |
Definition at line 203 of file publictypes.h.
|
inline |
Definition at line 191 of file publictypes.h.
|
inline |
Inline functions that act on a PageSegMode to determine whether components of layout analysis are enabled. Depend critically on the order of elements of PageSegMode. NOTE that arg is an int for compatibility with INT_PARAM.
Definition at line 188 of file publictypes.h.
|
inline |
Definition at line 197 of file publictypes.h.
|
inline |
Definition at line 206 of file publictypes.h.
Definition at line 156 of file fontinfo.cpp.
Definition at line 229 of file fontinfo.cpp.
Definition at line 173 of file fontinfo.cpp.
STRING tesseract::ReadFile | ( | const std::string & | filename, |
FileReader | reader | ||
) |
Definition at line 57 of file lang_model_helpers.cpp.
void tesseract::RecomputeMarginsAndClearHypotheses | ( | GenericVector< RowScratchRegisters > * | rows, |
int | start, | ||
int | end, | ||
int | percentile | ||
) |
Definition at line 1583 of file paragraphs.cpp.
void tesseract::RightWordAttributes | ( | const UNICHARSET * | unicharset, |
const WERD_CHOICE * | werd, | ||
const STRING & | utf8, | ||
bool * | is_list, | ||
bool * | starts_idea, | ||
bool * | ends_idea | ||
) |
Definition at line 470 of file paragraphs.cpp.
bool tesseract::RowsFitModel | ( | const GenericVector< RowScratchRegisters > * | rows, |
int | start, | ||
int | end, | ||
const ParagraphModel * | model | ||
) |
Definition at line 1826 of file paragraphs.cpp.
|
inline |
Definition at line 362 of file genericvector.h.
const char * tesseract::ScriptPosToString | ( | enum ScriptPos | script_pos | ) |
Definition at line 202 of file ratngs.cpp.
bool tesseract::Serialize | ( | FILE * | fp, |
const char * | data, | ||
size_t | n = 1 |
||
) |
Definition at line 73 of file serialis.cpp.
bool tesseract::Serialize | ( | FILE * | fp, |
const float * | data, | ||
size_t | n = 1 |
||
) |
Definition at line 77 of file serialis.cpp.
bool tesseract::Serialize | ( | FILE * | fp, |
const int16_t * | data, | ||
size_t | n = 1 |
||
) |
Definition at line 85 of file serialis.cpp.
bool tesseract::Serialize | ( | FILE * | fp, |
const int32_t * | data, | ||
size_t | n = 1 |
||
) |
Definition at line 89 of file serialis.cpp.
bool tesseract::Serialize | ( | FILE * | fp, |
const int8_t * | data, | ||
size_t | n = 1 |
||
) |
Definition at line 81 of file serialis.cpp.
bool tesseract::Serialize | ( | FILE * | fp, |
const uint16_t * | data, | ||
size_t | n = 1 |
||
) |
Definition at line 97 of file serialis.cpp.
bool tesseract::Serialize | ( | FILE * | fp, |
const uint32_t * | data, | ||
size_t | n = 1 |
||
) |
Definition at line 101 of file serialis.cpp.
bool tesseract::Serialize | ( | FILE * | fp, |
const uint8_t * | data, | ||
size_t | n = 1 |
||
) |
Definition at line 93 of file serialis.cpp.
void tesseract::SetBlobStrokeWidth | ( | Pix * | pix, |
BLOBNBOX * | blob | ||
) |
Definition at line 67 of file tordmain.cpp.
void tesseract::SetPropertiesForInputFile | ( | const std::string & | script_dir, |
const std::string & | input_unicharset_file, | ||
const std::string & | output_unicharset_file, | ||
const std::string & | output_xheights_file | ||
) |
Definition at line 183 of file unicharset_training_utils.cpp.
void tesseract::SetScriptProperties | ( | const std::string & | script_dir, |
UNICHARSET * | unicharset | ||
) |
Definition at line 143 of file unicharset_training_utils.cpp.
void tesseract::SetupBasicProperties | ( | bool | report_errors, |
bool | decompose, | ||
UNICHARSET * | unicharset | ||
) |
Definition at line 40 of file unicharset_training_utils.cpp.
|
inline |
Definition at line 38 of file unicharset_training_utils.h.
|
inline |
Definition at line 146 of file functions.h.
int tesseract::sort_cmp | ( | const void * | t1, |
const void * | t2 | ||
) |
Definition at line 384 of file genericvector.h.
int tesseract::sort_ptr_cmp | ( | const void * | t1, |
const void * | t2 | ||
) |
Definition at line 401 of file genericvector.h.
int tesseract::SortByBoxBottom | ( | const void * | void1, |
const void * | void2 | ||
) |
int tesseract::SortByBoxLeft | ( | const void * | void1, |
const void * | void2 | ||
) |
int tesseract::SortByRating | ( | const void * | void1, |
const void * | void2 | ||
) |
Definition at line 81 of file pieces.cpp.
int tesseract::SortByUnicharID | ( | const void * | void1, |
const void * | void2 | ||
) |
Definition at line 73 of file pieces.cpp.
int tesseract::SortRightToLeft | ( | const void * | void1, |
const void * | void2 | ||
) |
unsigned int tesseract::SpanUTF8NotWhitespace | ( | const char * | text | ) |
Definition at line 259 of file normstrngs.cpp.
unsigned int tesseract::SpanUTF8Whitespace | ( | const char * | text | ) |
Definition at line 249 of file normstrngs.cpp.
|
inline |
Definition at line 70 of file paragraphs_internal.h.
|
inline |
Definition at line 192 of file functions.h.
|
inline |
Definition at line 43 of file functions.h.
tesseract::TEST_F | ( | EquationFinderTest | , |
CheckSeedBlobsCount | |||
) |
Definition at line 342 of file equationdetect_test.cc.
tesseract::TEST_F | ( | EquationFinderTest | , |
ComputeCPsSuperBBox | |||
) |
Definition at line 420 of file equationdetect_test.cc.
tesseract::TEST_F | ( | EquationFinderTest | , |
ComputeForegroundDensity | |||
) |
Definition at line 380 of file equationdetect_test.cc.
tesseract::TEST_F | ( | EquationFinderTest | , |
CountAlignment | |||
) |
Definition at line 395 of file equationdetect_test.cc.
tesseract::TEST_F | ( | EquationFinderTest | , |
EstimateTypeForUnichar | |||
) |
Definition at line 233 of file equationdetect_test.cc.
tesseract::TEST_F | ( | EquationFinderTest | , |
IdentifySpecialText | |||
) |
Definition at line 181 of file equationdetect_test.cc.
tesseract::TEST_F | ( | EquationFinderTest | , |
IsIndented | |||
) |
Definition at line 252 of file equationdetect_test.cc.
tesseract::TEST_F | ( | EquationFinderTest | , |
IsNearSmallNeighbor | |||
) |
Definition at line 313 of file equationdetect_test.cc.
tesseract::TEST_F | ( | EquationFinderTest | , |
SplitCPHor | |||
) |
Definition at line 506 of file equationdetect_test.cc.
tesseract::TEST_F | ( | EquationFinderTest | , |
SplitCPHorLite | |||
) |
Definition at line 471 of file equationdetect_test.cc.
tesseract::TEST_F | ( | HeapTest | , |
DoublePtrTest | |||
) |
Definition at line 187 of file heap_test.cc.
tesseract::TEST_F | ( | HeapTest | , |
MixedTest | |||
) |
Definition at line 95 of file heap_test.cc.
tesseract::TEST_F | ( | HeapTest | , |
PopWorstTest | |||
) |
Definition at line 114 of file heap_test.cc.
tesseract::TEST_F | ( | HeapTest | , |
RevalueTest | |||
) |
Definition at line 133 of file heap_test.cc.
tesseract::TEST_F | ( | HeapTest | , |
SortTest | |||
) |
Definition at line 82 of file heap_test.cc.
tesseract::TEST_F | ( | LSTMTrainerTest | , |
BasicTest | |||
) |
Definition at line 29 of file lstm_test.cc.
tesseract::TEST_F | ( | LSTMTrainerTest | , |
BidiTest | |||
) |
Definition at line 61 of file lstm_test.cc.
tesseract::TEST_F | ( | LSTMTrainerTest | , |
ColorTest | |||
) |
Definition at line 51 of file lstm_test.cc.
tesseract::TEST_F | ( | LSTMTrainerTest | , |
DeterminismTest | |||
) |
Definition at line 111 of file lstm_test.cc.
tesseract::TEST_F | ( | LSTMTrainerTest | , |
EncodeDecodeBothTestKor | |||
) |
Definition at line 41 of file lstm_recode_test.cc.
tesseract::TEST_F | ( | LSTMTrainerTest | , |
EncodedSoftmaxTest | |||
) |
Definition at line 178 of file lstm_test.cc.
tesseract::TEST_F | ( | LSTMTrainerTest | , |
RecodeTestKor | |||
) |
Definition at line 29 of file lstm_recode_test.cc.
tesseract::TEST_F | ( | LSTMTrainerTest | , |
RecodeTestKorBase | |||
) |
Definition at line 19 of file lstm_recode_test.cc.
tesseract::TEST_F | ( | LSTMTrainerTest | , |
SoftmaxBaselineTest | |||
) |
Definition at line 146 of file lstm_test.cc.
tesseract::TEST_F | ( | LSTMTrainerTest | , |
SoftmaxTest | |||
) |
Definition at line 166 of file lstm_test.cc.
tesseract::TEST_F | ( | LSTMTrainerTest | , |
SpeedTest | |||
) |
Definition at line 100 of file lstm_test.cc.
tesseract::TEST_F | ( | LSTMTrainerTest | , |
Test2D | |||
) |
Definition at line 74 of file lstm_test.cc.
tesseract::TEST_F | ( | LSTMTrainerTest | , |
TestAdam | |||
) |
Definition at line 89 of file lstm_test.cc.
tesseract::TEST_F | ( | LSTMTrainerTest | , |
TestLayerAccess | |||
) |
Definition at line 189 of file lstm_test.cc.
tesseract::TEST_F | ( | LSTMTrainerTest | , |
TestSquashed | |||
) |
Definition at line 18 of file lstm_squashed_test.cc.
tesseract::TEST_F | ( | NthItemTest | , |
BoringTest | |||
) |
Definition at line 69 of file nthitem_test.cc.
tesseract::TEST_F | ( | NthItemTest | , |
EqualTest | |||
) |
Definition at line 107 of file nthitem_test.cc.
tesseract::TEST_F | ( | NthItemTest | , |
GeneralTest | |||
) |
Definition at line 45 of file nthitem_test.cc.
tesseract::TEST_F | ( | NthItemTest | , |
UniqueTest | |||
) |
Definition at line 95 of file nthitem_test.cc.
Pix * tesseract::TraceBlockOnReducedPix | ( | BLOCK * | block, |
int | gridsize, | ||
ICOORD | bleft, | ||
int * | left, | ||
int * | bottom | ||
) |
Definition at line 254 of file bbgrid.cpp.
Pix * tesseract::TraceOutlineOnReducedPix | ( | C_OUTLINE * | outline, |
int | gridsize, | ||
ICOORD | bleft, | ||
int * | left, | ||
int * | bottom | ||
) |
Definition at line 228 of file bbgrid.cpp.
int tesseract::UnicodeFor | ( | const UNICHARSET * | u, |
const WERD_CHOICE * | werd, | ||
int | pos | ||
) |
Definition at line 303 of file paragraphs.cpp.
bool tesseract::ValidBodyLine | ( | const GenericVector< RowScratchRegisters > * | rows, |
int | row, | ||
const ParagraphModel * | model | ||
) |
Definition at line 1303 of file paragraphs.cpp.
bool tesseract::ValidFirstLine | ( | const GenericVector< RowScratchRegisters > * | rows, |
int | row, | ||
const ParagraphModel * | model | ||
) |
Definition at line 1292 of file paragraphs.cpp.
bool tesseract::write_info | ( | FILE * | f, |
const FontInfo & | fi | ||
) |
Definition at line 166 of file fontinfo.cpp.
bool tesseract::write_set | ( | FILE * | f, |
const FontSet & | fs | ||
) |
Definition at line 235 of file fontinfo.cpp.
bool tesseract::write_spacing_info | ( | FILE * | f, |
const FontInfo & | fi | ||
) |
Definition at line 201 of file fontinfo.cpp.
bool tesseract::WriteFile | ( | const std::string & | output_dir, |
const std::string & | lang, | ||
const std::string & | suffix, | ||
const GenericVector< char > & | data, | ||
FileWriter | writer | ||
) |
Definition at line 36 of file lang_model_helpers.cpp.
bool tesseract::WriteRecoder | ( | const UNICHARSET & | unicharset, |
bool | pass_through, | ||
const std::string & | output_dir, | ||
const std::string & | lang, | ||
FileWriter | writer, | ||
STRING * | radical_table_data, | ||
TessdataManager * | traineddata | ||
) |
Definition at line 85 of file lang_model_helpers.cpp.
void tesseract::WriteShapeTable | ( | const STRING & | file_prefix, |
const ShapeTable & | shape_table | ||
) |
Definition at line 179 of file commontraining.cpp.
bool tesseract::WriteUnicharset | ( | const UNICHARSET & | unicharset, |
const std::string & | output_dir, | ||
const std::string & | lang, | ||
FileWriter | writer, | ||
TessdataManager * | traineddata | ||
) |
Definition at line 71 of file lang_model_helpers.cpp.
|
inline |
Definition at line 202 of file functions.h.
TFNetworkModelDefaultTypeInternal tesseract::_TFNetworkModel_default_instance_ |
Definition at line 51 of file tfnetwork.pb.h.
const int tesseract::case_state_table[6][4] |
Definition at line 44 of file context.cpp.
DotProductFunction tesseract::DotProduct |
Definition at line 50 of file simddetect.cpp.
const int tesseract::kAdamCorrectionIterations = 200000 |
Definition at line 35 of file weightmatrix.cpp.
const double tesseract::kAdamEpsilon = 1e-8 |
Definition at line 37 of file weightmatrix.cpp.
const int tesseract::kAdamFlag = 4 |
Definition at line 165 of file weightmatrix.cpp.
const int tesseract::kAdjacentLeaderSearchPadding = 2 |
Definition at line 116 of file tablefind.cpp.
const double tesseract::kAlignedFraction = 0.03125 |
Definition at line 38 of file alignedblob.cpp.
const double tesseract::kAlignedGapFraction = 0.75 |
Definition at line 42 of file alignedblob.cpp.
const double tesseract::kAllowBlobArea = 0.05 |
Definition at line 57 of file tablefind.cpp.
const double tesseract::kAllowBlobHeight = 0.3 |
Definition at line 55 of file tablefind.cpp.
const double tesseract::kAllowBlobWidth = 0.4 |
Definition at line 56 of file tablefind.cpp.
const double tesseract::kAllowTextArea = 0.8 |
Definition at line 50 of file tablefind.cpp.
const double tesseract::kAllowTextHeight = 0.5 |
Definition at line 48 of file tablefind.cpp.
const double tesseract::kAllowTextWidth = 0.6 |
Definition at line 49 of file tablefind.cpp.
const int tesseract::kBatchIterations = 100 |
Definition at line 37 of file lstm_test.h.
const double tesseract::kBestCheckpointFraction = 31.0 / 32.0 |
Definition at line 69 of file lstmtrainer.cpp.
const double tesseract::kBigPartSizeRatio = 1.75 |
Definition at line 46 of file colpartitiongrid.cpp.
const int tesseract::kBoxClipTolerance = 2 |
Definition at line 31 of file boxword.cpp.
const double tesseract::kBrokenCJKIterationFraction = 0.125 |
Definition at line 67 of file strokewidth.cpp.
const int tesseract::kBytesPer64BitNumber = 20 |
Max bytes in the decimal representation of int64_t.
Definition at line 1501 of file baseapi.cpp.
const int tesseract::kBytesPerBoxFileLine = (kBytesPerNumber + 1) * kNumbersPerBlob + 1 |
Multiplier for max expected text length: assumes (kBytesPerNumber + space) * kNumbersPerBlob plus the newline.
Definition at line 1499 of file baseapi.cpp.
const int tesseract::kBytesPerNumber = 5 |
The number of bytes taken by each number. Since we use int16_t for ICOORD, assume only 5 digits max.
Definition at line 1493 of file baseapi.cpp.
const int tesseract::kCellSplitColumnThreshold = 0 |
Definition at line 42 of file tablerecog.cpp.
const int tesseract::kCellSplitRowThreshold = 0 |
Definition at line 41 of file tablerecog.cpp.
const float tesseract::kCertaintyScale = 7.0f |
Definition at line 35 of file linerec.cpp.
const double tesseract::kCertOffset = -0.085 |
Definition at line 50 of file lstmrecognizer.cpp.
const double tesseract::kCJKAspectRatio = 1.25 |
Definition at line 61 of file strokewidth.cpp.
const double tesseract::kCJKAspectRatioIncrease = 1.0625 |
Definition at line 63 of file strokewidth.cpp.
const double tesseract::kCJKBrokenDistanceFraction = 0.25 |
Definition at line 57 of file strokewidth.cpp.
const int tesseract::kCJKMaxComponents = 8 |
Definition at line 59 of file strokewidth.cpp.
const int tesseract::kCJKRadius = 2 |
Definition at line 55 of file strokewidth.cpp.
const int tesseract::kColumnWidthFactor = 20 |
const double tesseract::kCosMaxSkewAngle = 0.866025 |
Definition at line 60 of file tabfind.cpp.
const int tesseract::kCrackSpacing = 100 |
Spacing of cracks across the page to break up tall vertical lines.
Definition at line 45 of file linefind.cpp.
const ParagraphModel * tesseract::kCrownLeft = reinterpret_cast<ParagraphModel *>(static_cast<uintptr_t>(0xDEAD111F)) |
Definition at line 69 of file paragraphs.cpp.
const ParagraphModel * tesseract::kCrownRight = reinterpret_cast<ParagraphModel *>(static_cast<uintptr_t>(0xDEAD888F)) |
Definition at line 71 of file paragraphs.cpp.
const int tesseract::kDefaultResolution = 300 |
Definition at line 69 of file pango_font_info.cpp.
const double tesseract::kDiacriticXPadRatio = 7.0 |
Definition at line 70 of file strokewidth.cpp.
const double tesseract::kDiacriticYPadRatio = 1.75 |
Definition at line 73 of file strokewidth.cpp.
const double tesseract::kDictRatio = 2.25 |
Definition at line 48 of file lstmrecognizer.cpp.
const int tesseract::kDoubleFlag = 128 |
Definition at line 169 of file weightmatrix.cpp.
const int tesseract::kErrorGraphInterval = 1000 |
Definition at line 57 of file lstmtrainer.cpp.
const int tesseract::kExposureFactor = 16 |
Definition at line 75 of file degradeimage.cpp.
const int tesseract::kFeaturePadding = 2 |
Definition at line 36 of file imagedata.h.
const float tesseract::kFontMergeDistance = 0.025 |
Definition at line 48 of file mastertrainer.cpp.
const double tesseract::kGoodRowNumberOfColumnsLarge = 0.7 |
Definition at line 60 of file tablerecog.cpp.
const double tesseract::kGoodRowNumberOfColumnsSmall[] = { 2, 2, 2, 2, 2, 3, 3 } |
Definition at line 56 of file tablerecog.cpp.
const int tesseract::kGoodRowNumberOfColumnsSmallSize |
Definition at line 57 of file tablerecog.cpp.
const int tesseract::kGutterMultiple = 4 |
Definition at line 35 of file tabvector.cpp.
const int tesseract::kGutterToNeighbourRatio = 3 |
Definition at line 37 of file tabvector.cpp.
const double tesseract::kHighConfidence = 0.9375 |
Definition at line 65 of file lstmtrainer.cpp.
const int tesseract::kHistogramBuckets = 16 |
Definition at line 367 of file weightmatrix.cpp.
const double tesseract::kHorizontalGapMergeFraction = 0.5 |
Definition at line 49 of file colfind.cpp.
const double tesseract::kHorizontalSpacing = 0.30 |
Definition at line 35 of file tablerecog.cpp.
const int tesseract::kHorzStrongTextlineAspect = 5 |
Definition at line 67 of file colpartition.cpp.
const int tesseract::kHorzStrongTextlineCount = 8 |
Definition at line 63 of file colpartition.cpp.
const int tesseract::kHorzStrongTextlineHeight = 10 |
Definition at line 65 of file colpartition.cpp.
const int tesseract::kImagePadding = 4 |
Definition at line 38 of file imagedata.h.
const double tesseract::kImprovementFraction = 15.0 / 16.0 |
Definition at line 67 of file lstmtrainer.cpp.
const float tesseract::kInfiniteDist = 999.0f |
Definition at line 905 of file mastertrainer.cpp.
const int tesseract::kInt8Flag = 1 |
Definition at line 163 of file weightmatrix.cpp.
const double tesseract::kLargeTableProjectionThreshold = 0.45 |
Definition at line 106 of file tablefind.cpp.
const int tesseract::kLargeTableRowCount = 6 |
Definition at line 108 of file tablefind.cpp.
const int tesseract::kLatinChs[] |
Latin chars corresponding to the unicode chars above.
Definition at line 1562 of file baseapi.cpp.
const double tesseract::kLearningRateDecay = M_SQRT1_2 |
Definition at line 53 of file lstmtrainer.cpp.
const int tesseract::kLeftIndentAlignmentCountTh = 1 |
Definition at line 85 of file equationdetect.cpp.
const double tesseract::kLineCountReciprocal = 4.0 |
Definition at line 48 of file tabvector.cpp.
const int tesseract::kLinedTableMinHorizontalLines = 3 |
Definition at line 45 of file tablerecog.cpp.
const int tesseract::kLinedTableMinVerticalLines = 3 |
Definition at line 44 of file tablerecog.cpp.
const int tesseract::kLineFindGridSize = 50 |
Grid size used by line finder. Not very critical.
Definition at line 47 of file linefind.cpp.
const double tesseract::kLineFragmentAspectRatio = 10.0 |
Definition at line 54 of file tabfind.cpp.
const double tesseract::kLineResidueAspectRatio = 8.0 |
Definition at line 94 of file strokewidth.cpp.
const int tesseract::kLineResiduePadRatio = 3 |
Definition at line 96 of file strokewidth.cpp.
const double tesseract::kLineResidueSizeRatio = 1.75 |
Definition at line 98 of file strokewidth.cpp.
const int tesseract::kLineTrapLongest = 4 |
Definition at line 87 of file strokewidth.cpp.
const int tesseract::kLineTrapShortest = 2 |
Definition at line 89 of file strokewidth.cpp.
const char *const tesseract::kLRM = "\u200E" |
Left-to-Right Mark.
Definition at line 38 of file unicodes.cpp.
const double tesseract::kMarginFactor = 1.1 |
Definition at line 50 of file tablerecog.cpp.
const double tesseract::kMarginOverlapFraction = 0.25 |
Definition at line 44 of file colpartitiongrid.cpp.
const float tesseract::kMathDigitDensityTh1 = 0.25 |
Definition at line 80 of file equationdetect.cpp.
const float tesseract::kMathDigitDensityTh2 = 0.1 |
Definition at line 81 of file equationdetect.cpp.
const float tesseract::kMathItalicDensityTh = 0.5 |
Definition at line 82 of file equationdetect.cpp.
const int tesseract::kMaxAmbigStringSize = UNICHAR_LEN * (MAX_AMBIG_SIZE + 1) |
Definition at line 41 of file ambigs.cpp.
const double tesseract::kMaxBaselineError = 0.4375 |
Definition at line 70 of file colpartition.cpp.
const double tesseract::kMaxBlobOverlapFactor = 4.0 |
Definition at line 76 of file tablefind.cpp.
const int tesseract::kMaxBlobWidth = 500 |
Definition at line 39 of file tablefind.cpp.
const int16_t tesseract::kMaxBoxEdgeDiff = 2 |
Definition at line 32 of file recogtraining.cpp.
const int tesseract::kMaxBoxesInDataPartition = 20 |
Definition at line 65 of file tablefind.cpp.
const int tesseract::kMaxBytesPerLine |
A maximal single box could occupy kNumbersPerBlob numbers at kBytesPer64BitNumber digits (if someone sneaks in a 64 bit value) and a space plus the newline and the maximum length of a UNICHAR. Test against this on each iteration for safety.
Definition at line 1508 of file baseapi.cpp.
const int tesseract::kMaxCaptionLines = 7 |
Definition at line 38 of file colpartitiongrid.cpp.
const int tesseract::kMaxCharTopRange = 48 |
Definition at line 82 of file fixxht.cpp.
const int tesseract::kMaxCircleErosions = 8 |
Definition at line 66 of file pagesegmain.cpp.
const int tesseract::kMaxCJKSizeRatio = 5 |
Definition at line 65 of file strokewidth.cpp.
const int tesseract::kMaxColorDistance = 900 |
Definition at line 77 of file colpartition.cpp.
const int tesseract::kMaxColumnHeaderDistance = 4 |
Definition at line 84 of file tablefind.cpp.
const double tesseract::kMaxDiacriticDistanceRatio = 1.25 |
Definition at line 79 of file strokewidth.cpp.
const double tesseract::kMaxDiacriticGapToBaseCharHeight = 1.0 |
Definition at line 82 of file strokewidth.cpp.
const double tesseract::kMaxDistToPartSizeRatio = 1.5 |
Definition at line 54 of file colfind.cpp.
const int tesseract::kMaxFillinMultiple = 11 |
Definition at line 44 of file tabvector.cpp.
const double tesseract::kMaxGapInTextPartition = 4.0 |
Definition at line 68 of file tablefind.cpp.
const double tesseract::kMaxGutterWidthAbsolute = 2.00 |
Definition at line 49 of file tabfind.cpp.
const int tesseract::kMaxIncompatibleColumnCount = 2 |
Definition at line 46 of file colfind.cpp.
const int tesseract::kMaxIntSize = 22 |
Max string length of an int.
Definition at line 121 of file baseapi.cpp.
const int tesseract::kMaxLargeOverlapsWithMedium = 12 |
Definition at line 43 of file ccnontextdetect.cpp.
const int tesseract::kMaxLargeOverlapsWithSmall = 3 |
Definition at line 34 of file ccnontextdetect.cpp.
const double tesseract::kMaxLeaderGapFractionOfMax = 0.25 |
Definition at line 53 of file colpartition.cpp.
const double tesseract::kMaxLeaderGapFractionOfMin = 0.5 |
Definition at line 55 of file colpartition.cpp.
const int tesseract::kMaxLigature = 0xfb17 |
Definition at line 64 of file ligature_table.cpp.
const int tesseract::kMaxLineLength = 1024 |
Definition at line 318 of file boxchar.cpp.
const int tesseract::kMaxLineResidue = 6 |
Definition at line 53 of file linefind.cpp.
const int tesseract::kMaxMediumOverlapsWithSmall = 12 |
Definition at line 39 of file ccnontextdetect.cpp.
const int tesseract::kMaxNeighbourDistFactor = 4 |
Definition at line 36 of file colpartitiongrid.cpp.
const double tesseract::kMaxNonLineDensity = 0.25 |
Definition at line 58 of file linefind.cpp.
const int tesseract::kMaxOffsetDist = 32 |
Definition at line 32 of file intfeaturemap.cpp.
|
constexpr |
Definition at line 35 of file intsimdmatrixavx2.cpp.
const int tesseract::kMaxPadFactor = 6 |
Definition at line 33 of file colpartitiongrid.cpp.
const double tesseract::kMaxParagraphEndingLeftSpaceMultiple = 3.0 |
Definition at line 125 of file tablefind.cpp.
const double tesseract::kMaxPartitionSpacing = 1.75 |
Definition at line 61 of file colpartitiongrid.cpp.
const int tesseract::kMaxRaggedSearch = 25 |
Definition at line 39 of file tabfind.cpp.
const int tesseract::kMaxRealDistance = 2.0 |
Definition at line 39 of file detlinefit.cpp.
const double tesseract::kMaxRectangularFraction = 0.75 |
Definition at line 42 of file imagefind.cpp.
const double tesseract::kMaxRectangularGradient = 0.1 |
Definition at line 45 of file imagefind.cpp.
const int tesseract::kMaxRMSColorNoise = 128 |
Definition at line 74 of file colpartition.cpp.
const double tesseract::kMaxRowSize = 2.5 |
Definition at line 53 of file tablerecog.cpp.
const double tesseract::kMaxSameBlockLineSpacing = 3 |
Definition at line 49 of file colpartition.cpp.
const double tesseract::kMaxSizeRatio = 1.5 |
Definition at line 51 of file colpartition.cpp.
const int tesseract::kMaxSkewFactor = 15 |
Definition at line 64 of file alignedblob.cpp.
const double tesseract::kMaxSmallNeighboursPerPix = 1.0 / 32 |
Definition at line 31 of file ccnontextdetect.cpp.
const double tesseract::kMaxSpacingDrift = 1.0 / 72 |
Definition at line 43 of file colpartition.cpp.
const double tesseract::kMaxStaveHeight = 1.0 |
Definition at line 60 of file linefind.cpp.
const double tesseract::kMaxTableCellXheight = 2.0 |
Definition at line 80 of file tablefind.cpp.
const double tesseract::kMaxTopSpacingFraction = 0.25 |
Definition at line 46 of file colpartition.cpp.
const int tesseract::kMaxUnicharsPerCluster = 2000 |
Definition at line 46 of file mastertrainer.cpp.
const int tesseract::kMaxVerticalSearch = 12 |
Definition at line 38 of file tabfind.cpp.
const int tesseract::kMaxVerticalSpacing = 500 |
Definition at line 37 of file tablefind.cpp.
const int tesseract::kMaxWinSize = 2000 |
Definition at line 50 of file network.cpp.
const double tesseract::kMaxXProjectionGapFactor = 2.0 |
Definition at line 135 of file tablefind.cpp.
const double tesseract::kMinAlignedGutter = 0.25 |
Definition at line 50 of file tabvector.cpp.
const int tesseract::kMinAlignedTabs = 4 |
Definition at line 54 of file alignedblob.cpp.
const double tesseract::kMinBaselineCoverage = 0.5 |
Definition at line 72 of file colpartition.cpp.
const int tesseract::kMinBoxesInTextPartition = 10 |
Definition at line 62 of file tablefind.cpp.
const double tesseract::kMinCaptionGapHeightRatio = 0.5 |
Definition at line 42 of file colpartitiongrid.cpp.
const double tesseract::kMinCaptionGapRatio = 2.0 |
Definition at line 40 of file colpartitiongrid.cpp.
const float tesseract::kMinCertainty = -20.0f |
Definition at line 30 of file networkio.cpp.
const int tesseract::kMinChainTextValue = 3 |
Definition at line 61 of file colpartition.cpp.
const int tesseract::kMinClusteredShapes = 1 |
Definition at line 44 of file mastertrainer.cpp.
const int tesseract::kMinColorDifference = 16 |
Definition at line 51 of file imagefind.cpp.
const int tesseract::kMinColumnWidth = 2.0 / 3 |
Definition at line 31 of file colpartitionset.cpp.
const double tesseract::kMinDiacriticSizeRatio = 1.0625 |
Definition at line 76 of file strokewidth.cpp.
const double tesseract::kMinDivergenceRate = 50.0 |
Definition at line 46 of file lstmtrainer.cpp.
const int tesseract::kMinEvaluatedTabs = 3 |
Definition at line 56 of file tabfind.cpp.
const double tesseract::kMinFilledArea = 0.35 |
Definition at line 63 of file tablerecog.cpp.
const double tesseract::kMinFractionalLinesInColumn = 0.125 |
Definition at line 45 of file tabfind.cpp.
const double tesseract::kMinGoodTextPARatio = 1.5 |
Definition at line 59 of file ccnontextdetect.cpp.
const double tesseract::kMinGutterFraction = 0.5 |
Definition at line 46 of file tabvector.cpp.
const double tesseract::kMinGutterWidthGrid = 0.5 |
Definition at line 51 of file colfind.cpp.
const int tesseract::kMinImageFindSize = 100 |
Definition at line 47 of file imagefind.cpp.
const int tesseract::kMinLeaderCount = 5 |
Definition at line 57 of file colpartition.cpp.
const int tesseract::kMinLigature = 0xfb00 |
Definition at line 63 of file ligature_table.cpp.
const int tesseract::kMinLineLengthFraction = 4 |
Denominator of resolution giving the minimum length, in pixels, demanded of a line.
Definition at line 43 of file linefind.cpp.
const int tesseract::kMinLinesInColumn = 10 |
Definition at line 41 of file tabfind.cpp.
const double tesseract::kMinMaxGapInTextPartition = 0.5 |
Definition at line 72 of file tablefind.cpp.
const double tesseract::kMinMusicPixelFraction = 0.75 |
Definition at line 62 of file linefind.cpp.
const double tesseract::kMinOverlapWithTable = 0.6 |
Definition at line 96 of file tablefind.cpp.
const double tesseract::kMinParagraphEndingTextToWhitespaceRatio = 3.0 |
Definition at line 131 of file tablefind.cpp.
const int tesseract::kMinPointsForErrorCount = 16 |
Definition at line 36 of file detlinefit.cpp.
const float tesseract::kMinProb = exp(kMinCertainty) |
Definition at line 32 of file networkio.cpp.
const double tesseract::kMinRaggedGutter = 1.5 |
Definition at line 52 of file tabvector.cpp.
const int tesseract::kMinRaggedTabs = 5 |
Definition at line 52 of file alignedblob.cpp.
const int tesseract::kMinRampSize = 1000 |
Definition at line 79 of file degradeimage.cpp.
const double tesseract::kMinRectangularFraction = 0.125 |
Definition at line 40 of file imagefind.cpp.
const int tesseract::kMinRectSize = 10 |
Minimum sensible image size to be worth running tesseract.
Definition at line 104 of file baseapi.cpp.
const int tesseract::kMinRowsInTable = 3 |
Definition at line 111 of file tablefind.cpp.
const int tesseract::kMinStallIterations = 10000 |
Definition at line 48 of file lstmtrainer.cpp.
const int tesseract::kMinStartedErrorRate = 75 |
Definition at line 61 of file lstmtrainer.cpp.
const int tesseract::kMinStrongTextValue = 6 |
Definition at line 59 of file colpartition.cpp.
const double tesseract::kMinTabGradient = 4.0 |
Definition at line 60 of file alignedblob.cpp.
const int tesseract::kMinThickLineWidth = 12 |
Definition at line 49 of file linefind.cpp.
const int tesseract::kMinVerticalSearch = 3 |
Definition at line 37 of file tabfind.cpp.
const int tesseract::kMinWinSize = 500 |
Definition at line 49 of file network.cpp.
const int tesseract::kMostlyOneDirRatio = 3 |
Definition at line 92 of file strokewidth.cpp.
const double tesseract::kNeighbourSearchFactor = 2.5 |
Definition at line 102 of file strokewidth.cpp.
const double tesseract::kNoiseOverlapAreaFactor = 1.0 / 512 |
Definition at line 107 of file strokewidth.cpp.
const double tesseract::kNoiseOverlapGrowthFactor = 4.0 |
Definition at line 104 of file strokewidth.cpp.
const int tesseract::kNoisePadding = 4 |
Definition at line 50 of file ccnontextdetect.cpp.
const int tesseract::kNumAdjustmentIterations = 100 |
Definition at line 55 of file lstmtrainer.cpp.
const int tesseract::kNumbersPerBlob = 5 |
The 5 numbers output for each box (the usual 4 and a page number).
Definition at line 1488 of file baseapi.cpp.
const int tesseract::kNumEndPoints = 3 |
Definition at line 30 of file detlinefit.cpp.
|
constexpr |
Definition at line 41 of file intsimdmatrixavx2.cpp.
|
constexpr |
Definition at line 39 of file intsimdmatrixavx2.cpp.
|
constexpr |
Definition at line 37 of file intsimdmatrixavx2.cpp.
|
constexpr |
Definition at line 33 of file intsimdmatrixavx2.cpp.
const int tesseract::kNumPagesPerBatch = 100 |
Definition at line 59 of file lstmtrainer.cpp.
const int tesseract::kOriginalNoiseMultiple = 8 |
Definition at line 46 of file ccnontextdetect.cpp.
const double tesseract::kParagraphEndingPreviousLineRatio = 1.3 |
Definition at line 121 of file tablefind.cpp.
const char *const tesseract::kPDF = "\u202C" |
Pop Directional Formatting.
Definition at line 41 of file unicodes.cpp.
const double tesseract::kPhotoOffsetFraction = 0.375 |
Definition at line 53 of file ccnontextdetect.cpp.
const int tesseract::kPrime1 = 17 |
Definition at line 36 of file trainingsampleset.cpp.
const int tesseract::kPrime2 = 13 |
Definition at line 37 of file trainingsampleset.cpp.
const int tesseract::kRadicalRadix = 29 |
Definition at line 31 of file unicharcompress.cpp.
const double tesseract::kRaggedFraction = 2.5 |
Definition at line 40 of file alignedblob.cpp.
const double tesseract::kRaggedGapFraction = 1.0 |
Definition at line 44 of file alignedblob.cpp.
const int tesseract::kRaggedGutterMultiple = 5 |
Definition at line 51 of file tabfind.cpp.
const int tesseract::kRandomizingCenter = 128 |
Definition at line 36 of file trainingsample.cpp.
const double tesseract::kRatingEpsilon = 1.0 / 32 |
Definition at line 31 of file errorcounter.cpp.
const double tesseract::kRequiredColumns = 0.7 |
Definition at line 48 of file tablerecog.cpp.
const char tesseract::kReverseIfHasRTL[] = "RRP_REVERSE_IF_HAS_RTL" |
const int tesseract::kRGBRMSColors = 4 |
Definition at line 36 of file colpartition.h.
const char *const tesseract::kRLE = "\u202A" |
Right-to-Left Embedding.
Definition at line 40 of file unicodes.cpp.
const char *const tesseract::kRLM = "\u200F" |
Right-to-Left Mark.
Definition at line 39 of file unicodes.cpp.
const double tesseract::kRMSFitScaling = 8.0 |
Definition at line 49 of file imagefind.cpp.
const float tesseract::kRotationRange = 0.02f |
Definition at line 73 of file degradeimage.cpp.
const int tesseract::kSaltnPepper = 5 |
Definition at line 77 of file degradeimage.cpp.
|
constexpr |
Definition at line 36 of file functions.h.
const int tesseract::kSeedBlobsCountTh = 10 |
Definition at line 84 of file equationdetect.cpp.
const int tesseract::kSideSpaceMargin = 10 |
Definition at line 101 of file tablefind.cpp.
const int tesseract::kSimilarRaggedDist = 50 |
Definition at line 42 of file tabvector.cpp.
const int tesseract::kSimilarVectorDist = 10 |
Definition at line 39 of file tabvector.cpp.
const int tesseract::ksizeofUniversalAmbigsFile = sizeof(kUniversalAmbigsFile) |
Definition at line 19036 of file universalambigs.cpp.
const float tesseract::kSizeRatioToReject = 2.0 |
Definition at line 100 of file strokewidth.cpp.
const double tesseract::kSmallTableProjectionThreshold = 0.35 |
Definition at line 105 of file tablefind.cpp.
const int tesseract::kSmoothDecisionMargin = 4 |
Definition at line 64 of file colpartitiongrid.cpp.
const double tesseract::kSplitPartitionSize = 2.0 |
Definition at line 43 of file tablefind.cpp.
const int tesseract::kSquareLimit = 25 |
Definition at line 34 of file trainingsampleset.cpp.
const double tesseract::kStageTransitionThreshold = 10.0 |
Definition at line 63 of file lstmtrainer.cpp.
const double tesseract::kStrokeWidthCJK = 2.0 |
Definition at line 52 of file strokewidth.cpp.
const double tesseract::kStrokeWidthConstantTolerance = 2.0 |
Definition at line 140 of file tablefind.cpp.
const double tesseract::kStrokeWidthFractionalTolerance = 0.25 |
Definition at line 139 of file tablefind.cpp.
const double tesseract::kStrokeWidthFractionCJK = 0.25 |
Definition at line 51 of file strokewidth.cpp.
const double tesseract::kStrokeWidthFractionTolerance = 0.125 |
Allowed proportional change in stroke width to be the same font.
Definition at line 44 of file strokewidth.cpp.
const double tesseract::kStrokeWidthTolerance = 1.5 |
Allowed constant change in stroke width to be the same font. Really 1.5 pixels.
Definition at line 49 of file strokewidth.cpp.
const double tesseract::kSubTrainerMarginFraction = 3.0 / 128 |
Definition at line 51 of file lstmtrainer.cpp.
const double tesseract::kTableColumnThreshold = 3.0 |
Definition at line 88 of file tablefind.cpp.
|
constexpr |
Definition at line 34 of file functions.h.
const int tesseract::kTabRadiusFactor = 5 |
Definition at line 35 of file tabfind.cpp.
const int tesseract::kTargetXScale = 5 |
Definition at line 71 of file lstmtrainer.cpp.
const int tesseract::kTargetYScale = 100 |
Definition at line 72 of file lstmtrainer.cpp.
const char tesseract::kTesseractReject = '~' |
Character returned when Tesseract couldn't recognize the input as anything.
Definition at line 106 of file baseapi.cpp.
const int tesseract::kTestChar = -1 |
Definition at line 32 of file trainingsampleset.cpp.
const double tesseract::kThickLengthMultiple = 0.75 |
Definition at line 56 of file linefind.cpp.
const int tesseract::kThinLineFraction = 20 |
Denominator of resolution giving the maximum width, in pixels, allowed for thin lines.
Definition at line 41 of file linefind.cpp.
const double tesseract::kTinyEnoughTextlineOverlapFraction = 0.25 |
Definition at line 48 of file colpartitiongrid.cpp.
const int tesseract::kTrainerIterations = 600 |
Definition at line 35 of file lstm_test.h.
const float tesseract::kUnclearDensityTh = 0.25 |
Definition at line 83 of file equationdetect.cpp.
const int tesseract::kUniChs[] |
Conversion table for non-latin characters. Maps characters out of the latin set into the latin set. TODO(rays) incorporate this translation into unicharset.
Definition at line 1558 of file baseapi.cpp.
const char tesseract::kUniversalAmbigsFile |
Definition at line 24 of file universalambigs.cpp.
const char tesseract::kUNLVReject = '~' |
Character used by UNLV error counter as a reject.
Definition at line 108 of file baseapi.cpp.
const char tesseract::kUNLVSuspect = '^' |
Character used by UNLV as a suspect marker.
Definition at line 110 of file baseapi.cpp.
const double tesseract::kVerticalSpacing = -0.2 |
Definition at line 38 of file tablerecog.cpp.
const int tesseract::kVLineAlignment = 3 |
Definition at line 46 of file alignedblob.cpp.
const int tesseract::kVLineGutter = 1 |
Definition at line 48 of file alignedblob.cpp.
const int tesseract::kVLineMinLength = 500 |
Definition at line 56 of file alignedblob.cpp.
const int tesseract::kVLineSearchSize = 150 |
Definition at line 50 of file alignedblob.cpp.
const float tesseract::kWorstDictCertainty = -25.0f |
Definition at line 37 of file linerec.cpp.
const int tesseract::kXWinFrameSize = 30 |
Definition at line 52 of file network.cpp.
const int tesseract::kYWinFrameSize = 80 |
Definition at line 53 of file network.cpp.
const double tesseract::LogisticTable |
Definition at line 4102 of file functions.cpp.
const char* const tesseract::RTLReversePolicyNames[] |
const double tesseract::TanhTable |
Definition at line 4 of file functions.cpp.
int tesseract::test_data = {8, 1, 2, -4, 7, 9, 65536, 4, 9, 0} |
Definition at line 24 of file heap_test.cc.
double tesseract::textord_tabvector_vertical_box_ratio = 0.5 |
"Fraction of box matches required to declare a line vertical"
Definition at line 58 of file tabvector.cpp.
double tesseract::textord_tabvector_vertical_gap_fraction = 0.5 |
"Max fraction of mean blob width allowed for vertical gaps in vertical text"
Definition at line 55 of file tabvector.cpp.