tesseract
4.0.0-1-g2a2b
|
Typedefs | |
typedef int(Dict::* | DictFunc) (void *void_dawg_args, const UNICHARSET &unicharset, UNICHAR_ID unichar_id, bool word_end) const |
typedef double(Dict::* | ProbabilityInContextFunc) (const char *lang, const char *context, int context_bytes, const char *character, int character_bytes) |
typedef float(Dict::* | ParamsModelClassifyFunc) (const char *lang, void *path) |
typedef void(Wordrec::* | FillLatticeFunc) (const MATRIX &ratings, const WERD_CHOICE_LIST &best_choices, const UNICHARSET &unicharset, BlamerBundle *blamer_bundle) |
typedef TessCallback4< const UNICHARSET &, int, PageIterator *, Pix * > | TruthCallback |
using | SetOfModels = GenericVectorEqEq< const ParagraphModel * > |
typedef void(Tesseract::* | WordRecognizer) (const WordData &word_data, WERD_RES **in_word, PointerVector< WERD_RES > *out_words) |
using | ParamsTrainingHypothesisList = GenericVector< ParamsTrainingHypothesis > |
using | UnicharIdVector = GenericVector< UNICHAR_ID > |
using | UnicharAmbigsVector = GenericVector< AmbigSpec_LIST * > |
typedef bool(* | FileReader) (const STRING &filename, GenericVector< char > *data) |
typedef bool(* | FileWriter) (const GenericVector< char > &data, const STRING &filename) |
using | IntKDPair = KDPairInc< int, int > |
using | char32 = signed int |
using | RSMap = std::unordered_map< int, std::unique_ptr< std::vector< int > >> |
using | RSCounts = std::unordered_map< int, int > |
using | ShapeQueue = GenericHeap< ShapeQueueEntry > |
using | NodeChildVector = GenericVector< NodeChild > |
using | SuccessorList = GenericVector< int > |
using | SuccessorListsVector = GenericVector< SuccessorList * > |
using | DawgVector = GenericVector< Dawg * > |
typedef TessResultCallback2< bool, const GenericVector< char > &, LSTMTrainer * > * | CheckPointReader |
typedef TessResultCallback3< bool, SerializeAmount, const LSTMTrainer *, GenericVector< char > * > * | CheckPointWriter |
typedef TessResultCallback4< STRING, int, const double *, const TessdataManager &, int > * | TestCallback |
using | RecodePair = KDPairInc< double, RecodeNode > |
using | RecodeHeap = GenericHeap< RecodePair > |
using | BlobGridSearch = GridSearch< BLOBNBOX, BLOBNBOX_CLIST, BLOBNBOX_C_IT > |
using | ColPartitionGridSearch = GridSearch< ColPartition, ColPartition_CLIST, ColPartition_C_IT > |
using | PartSetVector = GenericVector< ColPartitionSet * > |
using | WidthCallback = TessResultCallback1< bool, int > |
using | ColSegmentGrid = BBGrid< ColSegment, ColSegment_CLIST, ColSegment_C_IT > |
using | ColSegmentGridSearch = GridSearch< ColSegment, ColSegment_CLIST, ColSegment_C_IT > |
using | WordGrid = BBGrid< WordWithBox, WordWithBox_CLIST, WordWithBox_C_IT > |
using | WordSearch = GridSearch< WordWithBox, WordWithBox_CLIST, WordWithBox_C_IT > |
using | LigHash = std::unordered_map< std::string, std::string, StringHash > |
using | PainPointHeap = GenericHeap< MatrixCoordPair > |
using | LanguageModelFlagsType = unsigned char |
Used for expressing various language model flags. More... | |
Functions | |
STRING | HOcrEscape (const char *text) |
double | DotProductAVX (const double *u, const double *v, int n) |
double | DotProductSSE (const double *u, const double *v, int n) |
int32_t | IntDotProductSSE (const int8_t *u, const int8_t *v, int n) |
bool | IsTextOrEquationType (PolyBlockType type) |
bool | IsLeftIndented (const EquationDetect::IndentType type) |
bool | IsRightIndented (const EquationDetect::IndentType type) |
bool | AsciiLikelyListItem (const STRING &word) |
int | UnicodeFor (const UNICHARSET *u, const WERD_CHOICE *werd, int pos) |
void | LeftWordAttributes (const UNICHARSET *unicharset, const WERD_CHOICE *werd, const STRING &utf8, bool *is_list, bool *starts_idea, bool *ends_idea) |
void | RightWordAttributes (const UNICHARSET *unicharset, const WERD_CHOICE *werd, const STRING &utf8, bool *is_list, bool *starts_idea, bool *ends_idea) |
bool | ValidFirstLine (const GenericVector< RowScratchRegisters > *rows, int row, const ParagraphModel *model) |
bool | ValidBodyLine (const GenericVector< RowScratchRegisters > *rows, int row, const ParagraphModel *model) |
bool | CrownCompatible (const GenericVector< RowScratchRegisters > *rows, int a, int b, const ParagraphModel *model) |
void | RecomputeMarginsAndClearHypotheses (GenericVector< RowScratchRegisters > *rows, int start, int end, int percentile) |
int | InterwordSpace (const GenericVector< RowScratchRegisters > &rows, int row_start, int row_end) |
bool | FirstWordWouldHaveFit (const RowScratchRegisters &before, const RowScratchRegisters &after, tesseract::ParagraphJustification justification) |
bool | FirstWordWouldHaveFit (const RowScratchRegisters &before, const RowScratchRegisters &after) |
bool | RowsFitModel (const GenericVector< RowScratchRegisters > *rows, int start, int end, const ParagraphModel *model) |
void | CanonicalizeDetectionResults (GenericVector< PARA *> *row_owners, PARA_LIST *paragraphs) |
void | DetectParagraphs (int debug_level, GenericVector< RowInfo > *row_infos, GenericVector< PARA *> *row_owners, PARA_LIST *paragraphs, GenericVector< ParagraphModel *> *models) |
void | DetectParagraphs (int debug_level, bool after_text_recognition, const MutableIterator *block_start, GenericVector< ParagraphModel *> *models) |
bool | StrongModel (const ParagraphModel *model) |
bool | CompareFontInfo (const FontInfo &fi1, const FontInfo &fi2) |
bool | CompareFontSet (const FontSet &fs1, const FontSet &fs2) |
void | FontInfoDeleteCallback (FontInfo f) |
void | FontSetDeleteCallback (FontSet fs) |
bool | read_info (TFile *f, FontInfo *fi) |
bool | write_info (FILE *f, const FontInfo &fi) |
bool | read_spacing_info (TFile *f, FontInfo *fi) |
bool | write_spacing_info (FILE *f, const FontInfo &fi) |
bool | read_set (TFile *f, FontSet *fs) |
bool | write_set (FILE *f, const FontSet &fs) |
void * | ReCachePagesFunc (void *data) |
int | OtsuThreshold (Pix *src_pix, int left, int top, int width, int height, int **thresholds, int **hi_values) |
void | HistogramRect (Pix *src_pix, int channel, int left, int top, int width, int height, int *histogram) |
int | OtsuStats (const int *histogram, int *H_out, int *omega0_out) |
int | ParamsTrainingFeatureByName (const char *name) |
bool | PSM_OSD_ENABLED (int pageseg_mode) |
bool | PSM_ORIENTATION_ENABLED (int pageseg_mode) |
bool | PSM_COL_FIND_ENABLED (int pageseg_mode) |
bool | PSM_SPARSE (int pageseg_mode) |
bool | PSM_BLOCK_FIND_ENABLED (int pageseg_mode) |
bool | PSM_LINE_FIND_ENABLED (int pageseg_mode) |
bool | PSM_WORD_FIND_ENABLED (int pageseg_mode) |
const char * | ScriptPosToString (enum ScriptPos script_pos) |
bool | LoadDataFromFile (const char *filename, GenericVector< char > *data) |
bool | LoadDataFromFile (const STRING &filename, GenericVector< char > *data) |
bool | SaveDataToFile (const GenericVector< char > &data, const STRING &filename) |
bool | LoadFileLinesToStrings (const STRING &filename, GenericVector< STRING > *lines) |
template<typename T > | |
bool | cmp_eq (T const &t1, T const &t2) |
template<typename T > | |
int | sort_cmp (const void *t1, const void *t2) |
template<typename T > | |
int | sort_ptr_cmp (const void *t1, const void *t2) |
bool | DeSerialize (FILE *fp, char *data, size_t n) |
bool | DeSerialize (FILE *fp, float *data, size_t n) |
bool | DeSerialize (FILE *fp, int8_t *data, size_t n) |
bool | DeSerialize (FILE *fp, int16_t *data, size_t n) |
bool | DeSerialize (FILE *fp, int32_t *data, size_t n) |
bool | DeSerialize (FILE *fp, uint8_t *data, size_t n) |
bool | DeSerialize (FILE *fp, uint16_t *data, size_t n) |
bool | DeSerialize (FILE *fp, uint32_t *data, size_t n) |
bool | Serialize (FILE *fp, const char *data, size_t n) |
bool | Serialize (FILE *fp, const float *data, size_t n) |
bool | Serialize (FILE *fp, const int8_t *data, size_t n) |
bool | Serialize (FILE *fp, const int16_t *data, size_t n) |
bool | Serialize (FILE *fp, const int32_t *data, size_t n) |
bool | Serialize (FILE *fp, const uint8_t *data, size_t n) |
bool | Serialize (FILE *fp, const uint16_t *data, size_t n) |
bool | Serialize (FILE *fp, const uint32_t *data, size_t n) |
template<typename T , size_t N> | |
constexpr size_t | countof (T const (&)[N]) noexcept |
void | ExtractFontName (const STRING &filename, STRING *fontname) |
TrainingSample * | BlobToTrainingSample (const TBLOB &blob, bool nonlinear_norm, INT_FX_RESULT_STRUCT *fx_info, GenericVector< INT_FEATURE_STRUCT > *bl_features) |
void | ClearFeatureSpaceWindow (NORM_METHOD norm_method, ScrollView *window) |
double | Tanh (double x) |
double | Logistic (double x) |
template<class Func > | |
void | FuncInplace (int n, double *inout) |
template<class Func > | |
void | FuncMultiply (const double *u, const double *v, int n, double *out) |
template<typename T > | |
void | SoftmaxInPlace (int n, T *inout) |
void | CopyVector (int n, const double *src, double *dest) |
void | AccumulateVector (int n, const double *src, double *dest) |
void | MultiplyVectorsInPlace (int n, const double *src, double *inout) |
void | MultiplyAccumulate (int n, const double *u, const double *v, double *out) |
void | SumVectors (int n, const double *v1, const double *v2, const double *v3, const double *v4, const double *v5, double *sum) |
template<typename T > | |
void | ZeroVector (int n, T *vec) |
template<typename T > | |
void | ClipVector (int n, T lower, T upper, T *vec) |
void | CodeInBinary (int n, int nf, double *vec) |
Pix * | TraceOutlineOnReducedPix (C_OUTLINE *outline, int gridsize, ICOORD bleft, int *left, int *bottom) |
Pix * | TraceBlockOnReducedPix (BLOCK *block, int gridsize, ICOORD bleft, int *left, int *bottom) |
template<class BBC > | |
int | SortByBoxLeft (const void *void1, const void *void2) |
template<class BBC > | |
int | SortRightToLeft (const void *void1, const void *void2) |
template<class BBC > | |
int | SortByBoxBottom (const void *void1, const void *void2) |
template<typename T > | |
void | DeleteObject (T *object) |
void | SetBlobStrokeWidth (Pix *pix, BLOBNBOX *blob) |
void | assign_blobs_to_blocks2 (Pix *pix, BLOCK_LIST *blocks, TO_BLOCK_LIST *port_blocks) |
void | ParseCommandLineFlags (const char *usage, int *argc, char ***argv, const bool remove_flags) |
ShapeTable * | LoadShapeTable (const STRING &file_prefix) |
void | WriteShapeTable (const STRING &file_prefix, const ShapeTable &shape_table) |
MasterTrainer * | LoadTrainingData (int argc, const char *const *argv, bool replication, ShapeTable **shape_table, STRING *file_prefix) |
Pix * | DegradeImage (Pix *input, int exposure, TRand *randomizer, float *rotation) |
Pix * | PrepareDistortedPix (const Pix *pix, bool perspective, bool invert, bool white_noise, bool smooth_noise, bool blur, int box_reduction, TRand *randomizer, GenericVector< TBOX > *boxes) |
void | GeneratePerspectiveDistortion (int width, int height, TRand *randomizer, Pix **pix, GenericVector< TBOX > *boxes) |
int | ProjectiveCoeffs (int width, int height, TRand *randomizer, float **im_coeffs, float **box_coeffs) |
bool | WriteFile (const std::string &output_dir, const std::string &lang, const std::string &suffix, const GenericVector< char > &data, FileWriter writer) |
STRING | ReadFile (const std::string &filename, FileReader reader) |
bool | WriteUnicharset (const UNICHARSET &unicharset, const std::string &output_dir, const std::string &lang, FileWriter writer, TessdataManager *traineddata) |
bool | WriteRecoder (const UNICHARSET &unicharset, bool pass_through, const std::string &output_dir, const std::string &lang, FileWriter writer, STRING *radical_table_data, TessdataManager *traineddata) |
int | CombineLangModel (const UNICHARSET &unicharset, const std::string &script_dir, const std::string &version_str, const std::string &output_dir, const std::string &lang, bool pass_through_recoder, const GenericVector< STRING > &words, const GenericVector< STRING > &puncs, const GenericVector< STRING > &numbers, bool lang_is_rtl, FileReader reader, FileWriter writer) |
bool | NormalizeUTF8String (UnicodeNormMode u_mode, OCRNorm ocr_normalize, GraphemeNorm grapheme_normalize, const char *str8, std::string *normalized) |
bool | NormalizeCleanAndSegmentUTF8 (UnicodeNormMode u_mode, OCRNorm ocr_normalize, GraphemeNormMode g_mode, bool report_errors, const char *str8, std::vector< std::string > *graphemes) |
char32 | OCRNormalize (char32 ch) |
bool | IsOCREquivalent (char32 ch1, char32 ch2) |
bool | IsValidCodepoint (const char32 ch) |
bool | IsWhitespace (const char32 ch) |
bool | IsUTF8Whitespace (const char *text) |
unsigned int | SpanUTF8Whitespace (const char *text) |
unsigned int | SpanUTF8NotWhitespace (const char *text) |
bool | IsInterchangeValid (const char32 ch) |
bool | IsInterchangeValid7BitAscii (const char32 ch) |
char32 | FullwidthToHalfwidth (const char32 ch) |
void | SetupBasicProperties (bool report_errors, bool decompose, UNICHARSET *unicharset) |
void | SetScriptProperties (const std::string &script_dir, UNICHARSET *unicharset) |
std::string | GetXheightString (const std::string &script_dir, const UNICHARSET &unicharset) |
void | SetPropertiesForInputFile (const std::string &script_dir, const std::string &input_unicharset_file, const std::string &output_unicharset_file, const std::string &output_xheights_file) |
void | SetupBasicProperties (bool report_errors, UNICHARSET *unicharset) |
template<class BLOB_CHOICE > | |
int | SortByUnicharID (const void *void1, const void *void2) |
template<class BLOB_CHOICE > | |
int | SortByRating (const void *void1, const void *void2) |
Variables | |
const int | kMinRectSize = 10 |
const char | kTesseractReject = '~' |
const char | kUNLVReject = '~' |
const char | kUNLVSuspect = '^' |
const char * | kInputFile = "noname.tif" |
const char * | kOldVarsFile = "failed_vars.txt" |
const int | kMaxIntSize = 22 |
const int | kNumbersPerBlob = 5 |
const int | kBytesPerNumber = 5 |
const int | kBytesPerBoxFileLine = (kBytesPerNumber + 1) * kNumbersPerBlob + 1 |
const int | kBytesPer64BitNumber = 20 |
const int | kMaxBytesPerLine |
const int | kUniChs [] |
const int | kLatinChs [] |
const float | kMathDigitDensityTh1 = 0.25 |
const float | kMathDigitDensityTh2 = 0.1 |
const float | kMathItalicDensityTh = 0.5 |
const float | kUnclearDensityTh = 0.25 |
const int | kSeedBlobsCountTh = 10 |
const int | kLeftIndentAlignmentCountTh = 1 |
const int | kMaxCharTopRange = 48 |
const float | kCertaintyScale = 7.0f |
const float | kWorstDictCertainty = -25.0f |
const int | kMaxCircleErosions = 8 |
const ParagraphModel * | kCrownLeft = reinterpret_cast<ParagraphModel *>(0xDEAD111F) |
const ParagraphModel * | kCrownRight = reinterpret_cast<ParagraphModel *>(0xDEAD888F) |
const int16_t | kMaxBoxEdgeDiff = 2 |
const int | kBoxClipTolerance = 2 |
const int | kNumEndPoints = 3 |
const int | kMinPointsForErrorCount = 16 |
const int | kMaxRealDistance = 2.0 |
const int | kFeaturePadding = 2 |
const int | kImagePadding = 4 |
const int | kHistogramSize = 256 |
const int | kMaxAmbigStringSize = UNICHAR_LEN * (MAX_AMBIG_SIZE + 1) |
CCUtilMutex | tprintfMutex |
const char * | kNullChar = "<nul>" |
const int | kRadicalRadix = 29 |
const char * | kUTF8LineSeparator = "\u2028" |
const char * | kUTF8ParagraphSeparator = "\u2029" |
const char * | kLRM = "\u200E" |
const char * | kRLM = "\u200F" |
const char * | kRLE = "\u202A" |
const char * | kPDF = "\u202C" |
const char * | kHyphenLikeUTF8 [] |
const char * | kApostropheLikeUTF8 [] |
const char | kUniversalAmbigsFile [] |
const int | ksizeofUniversalAmbigsFile = sizeof(kUniversalAmbigsFile) |
const double | kRatingEpsilon = 1.0 / 32 |
const int | kMaxOffsetDist = 32 |
const int | kMinClusteredShapes = 1 |
const int | kMaxUnicharsPerCluster = 2000 |
const float | kFontMergeDistance = 0.025 |
const float | kInfiniteDist = 999.0f |
const int | kRandomizingCenter = 128 |
const int | kTestChar = -1 |
const int | kSquareLimit = 25 |
const int | kPrime1 = 17 |
const int | kPrime2 = 13 |
const int | case_state_table [6][4] |
const char | kDoNotReverse [] = "RRP_DO_NO_REVERSE" |
const char | kReverseIfHasRTL [] = "RRP_REVERSE_IF_HAS_RTL" |
const char | kForceReverse [] = "RRP_FORCE_REVERSE" |
const char *const | RTLReversePolicyNames [] |
double | TanhTable [kTableSize] |
double | LogisticTable [kTableSize] |
const int | kTableSize = 4096 |
const double | kScaleFactor = 256.0 |
const int | kMaxInputHeight = 48 |
const double | kStateClip = 100.0 |
const double | kErrClip = 1.0f |
const double | kDictRatio = 2.25 |
const double | kCertOffset = -0.085 |
const double | kMinDivergenceRate = 50.0 |
const int | kMinStallIterations = 10000 |
const double | kSubTrainerMarginFraction = 3.0 / 128 |
const double | kLearningRateDecay = sqrt(0.5) |
const int | kNumAdjustmentIterations = 100 |
const int | kErrorGraphInterval = 1000 |
const int | kNumPagesPerBatch = 100 |
const int | kMinStartedErrorRate = 75 |
const double | kStageTransitionThreshold = 10.0 |
const double | kHighConfidence = 0.9375 |
const double | kImprovementFraction = 15.0 / 16.0 |
const double | kBestCheckpointFraction = 31.0 / 32.0 |
const int | kTargetXScale = 5 |
const int | kTargetYScale = 100 |
const int | kMinWinSize = 500 |
const int | kMaxWinSize = 2000 |
const int | kXWinFrameSize = 30 |
const int | kYWinFrameSize = 80 |
const float | kMinCertainty = -20.0f |
const float | kMinProb = exp(kMinCertainty) |
const char * | kNodeContNames [] = {"Anything", "OnlyDup", "NoDup"} |
const int | kAdamCorrectionIterations = 200000 |
const double | kAdamEpsilon = 1e-8 |
const int | kInt8Flag = 1 |
const int | kAdamFlag = 4 |
const int | kDoubleFlag = 128 |
const int | kHistogramBuckets = 16 |
const double | kAlignedFraction = 0.03125 |
const double | kRaggedFraction = 2.5 |
const double | kAlignedGapFraction = 0.75 |
const double | kRaggedGapFraction = 1.0 |
const int | kVLineAlignment = 3 |
const int | kVLineGutter = 1 |
const int | kVLineSearchSize = 150 |
const int | kMinRaggedTabs = 5 |
const int | kMinAlignedTabs = 4 |
const int | kVLineMinLength = 500 |
const double | kMinTabGradient = 4.0 |
const int | kMaxSkewFactor = 15 |
const double | kMaxSmallNeighboursPerPix = 1.0 / 32 |
const int | kMaxLargeOverlapsWithSmall = 3 |
const int | kMaxMediumOverlapsWithSmall = 12 |
const int | kMaxLargeOverlapsWithMedium = 12 |
const int | kOriginalNoiseMultiple = 8 |
const int | kNoisePadding = 4 |
const double | kPhotoOffsetFraction = 0.375 |
const double | kMinGoodTextPARatio = 1.5 |
const int | kMaxIncompatibleColumnCount = 2 |
const double | kHorizontalGapMergeFraction = 0.5 |
const double | kMinGutterWidthGrid = 0.5 |
const double | kMaxDistToPartSizeRatio = 1.5 |
bool | textord_tabfind_show_initial_partitions = false |
bool | textord_tabfind_show_reject_blobs = false |
int | textord_tabfind_show_partitions = 0 |
bool | textord_tabfind_show_columns = false |
bool | textord_tabfind_show_blocks = false |
bool | textord_tabfind_find_tables = true |
const double | kMaxSpacingDrift = 1.0 / 72 |
const double | kMaxTopSpacingFraction = 0.25 |
const double | kMaxSameBlockLineSpacing = 3 |
const double | kMaxSizeRatio = 1.5 |
const double | kMaxLeaderGapFractionOfMax = 0.25 |
const double | kMaxLeaderGapFractionOfMin = 0.5 |
const int | kMinLeaderCount = 5 |
const int | kMinStrongTextValue = 6 |
const int | kMinChainTextValue = 3 |
const int | kHorzStrongTextlineCount = 8 |
const int | kHorzStrongTextlineHeight = 10 |
const int | kHorzStrongTextlineAspect = 5 |
const double | kMaxBaselineError = 0.4375 |
const double | kMinBaselineCoverage = 0.5 |
const int | kMaxRMSColorNoise = 128 |
const int | kMaxColorDistance = 900 |
const int | kRGBRMSColors = 4 |
bool | textord_tabfind_show_color_fit = false |
const int | kMaxPadFactor = 6 |
const int | kMaxNeighbourDistFactor = 4 |
const int | kMaxCaptionLines = 7 |
const double | kMinCaptionGapRatio = 2.0 |
const double | kMinCaptionGapHeightRatio = 0.5 |
const double | kMarginOverlapFraction = 0.25 |
const double | kBigPartSizeRatio = 1.75 |
const double | kTinyEnoughTextlineOverlapFraction = 0.25 |
const double | kMaxPartitionSpacing = 1.75 |
const int | kSmoothDecisionMargin = 4 |
const double | kMinColumnWidth = 2.0 / 3 |
const double | kMinRectangularFraction = 0.125 |
const double | kMaxRectangularFraction = 0.75 |
const double | kMaxRectangularGradient = 0.1 |
const int | kMinImageFindSize = 100 |
const double | kRMSFitScaling = 8.0 |
const int | kMinColorDifference = 16 |
const int | kThinLineFraction = 20 |
Denominator of resolution makes max pixel width to allow thin lines. More... | |
const int | kMinLineLengthFraction = 4 |
Denominator of resolution makes min pixels to demand line lengths to be. More... | |
const int | kCrackSpacing = 100 |
Spacing of cracks across the page to break up tall vertical lines. More... | |
const int | kLineFindGridSize = 50 |
Grid size used by line finder. Not very critical. More... | |
const int | kMinThickLineWidth = 12 |
const int | kMaxLineResidue = 6 |
const double | kThickLengthMultiple = 0.75 |
const double | kMaxNonLineDensity = 0.25 |
const double | kMaxStaveHeight = 1.0 |
const double | kMinMusicPixelFraction = 0.75 |
int | textord_tabfind_show_strokewidths = 0 |
bool | textord_tabfind_only_strokewidths = false |
const double | kStrokeWidthFractionTolerance = 0.125 |
const double | kStrokeWidthTolerance = 1.5 |
const double | kStrokeWidthFractionCJK = 0.25 |
const double | kStrokeWidthCJK = 2.0 |
const int | kCJKRadius = 2 |
const double | kCJKBrokenDistanceFraction = 0.25 |
const int | kCJKMaxComponents = 8 |
const double | kCJKAspectRatio = 1.25 |
const double | kCJKAspectRatioIncrease = 1.0625 |
const int | kMaxCJKSizeRatio = 5 |
const double | kBrokenCJKIterationFraction = 0.125 |
const double | kDiacriticXPadRatio = 7.0 |
const double | kDiacriticYPadRatio = 1.75 |
const double | kMinDiacriticSizeRatio = 1.0625 |
const double | kMaxDiacriticDistanceRatio = 1.25 |
const double | kMaxDiacriticGapToBaseCharHeight = 1.0 |
const int | kLineTrapLongest = 4 |
const int | kLineTrapShortest = 2 |
const int | kMostlyOneDirRatio = 3 |
const double | kLineResidueAspectRatio = 8.0 |
const int | kLineResiduePadRatio = 3 |
const double | kLineResidueSizeRatio = 1.75 |
const float | kSizeRatioToReject = 2.0 |
const double | kNeighbourSearchFactor = 2.5 |
const double | kNoiseOverlapGrowthFactor = 4.0 |
const double | kNoiseOverlapAreaFactor = 1.0 / 512 |
const int | kTabRadiusFactor = 5 |
const int | kMinVerticalSearch = 3 |
const int | kMaxVerticalSearch = 12 |
const int | kMaxRaggedSearch = 25 |
const int | kMinLinesInColumn = 10 |
const double | kMinFractionalLinesInColumn = 0.125 |
const double | kMaxGutterWidthAbsolute = 2.00 |
const int | kRaggedGutterMultiple = 5 |
const double | kLineFragmentAspectRatio = 10.0 |
const int | kMinEvaluatedTabs = 3 |
const double | kCosMaxSkewAngle = 0.866025 |
bool | textord_tabfind_show_initialtabs = false |
bool | textord_tabfind_show_finaltabs = false |
const int | kColumnWidthFactor = 20 |
const int | kMaxVerticalSpacing = 500 |
const int | kMaxBlobWidth = 500 |
const double | kSplitPartitionSize = 2.0 |
const double | kAllowTextHeight = 0.5 |
const double | kAllowTextWidth = 0.6 |
const double | kAllowTextArea = 0.8 |
const double | kAllowBlobHeight = 0.3 |
const double | kAllowBlobWidth = 0.4 |
const double | kAllowBlobArea = 0.05 |
const int | kMinBoxesInTextPartition = 10 |
const int | kMaxBoxesInDataPartition = 20 |
const double | kMaxGapInTextPartition = 4.0 |
const double | kMinMaxGapInTextPartition = 0.5 |
const double | kMaxBlobOverlapFactor = 4.0 |
const double | kMaxTableCellXheight = 2.0 |
const int | kMaxColumnHeaderDistance = 4 |
const double | kTableColumnThreshold = 3.0 |
const int | kRulingVerticalMargin = 3 |
const double | kMinOverlapWithTable = 0.6 |
const int | kSideSpaceMargin = 10 |
const double | kSmallTableProjectionThreshold = 0.35 |
const double | kLargeTableProjectionThreshold = 0.45 |
const int | kLargeTableRowCount = 6 |
const int | kMinRowsInTable = 3 |
const int | kAdjacentLeaderSearchPadding = 2 |
const double | kParagraphEndingPreviousLineRatio = 1.3 |
const double | kMaxParagraphEndingLeftSpaceMultiple = 3.0 |
const double | kMinParagraphEndingTextToWhitespaceRatio = 3.0 |
const double | kMaxXProjectionGapFactor = 2.0 |
const double | kStrokeWidthFractionalTolerance = 0.25 |
const double | kStrokeWidthConstantTolerance = 2.0 |
bool | textord_show_tables = false |
bool | textord_tablefind_show_mark = false |
bool | textord_tablefind_show_stats = false |
bool | textord_tablefind_recognize_tables = false |
const double | kHorizontalSpacing = 0.30 |
const double | kVerticalSpacing = -0.2 |
const int | kCellSplitRowThreshold = 0 |
const int | kCellSplitColumnThreshold = 0 |
const int | kLinedTableMinVerticalLines = 3 |
const int | kLinedTableMinHorizontalLines = 3 |
const double | kRequiredColumns = 0.7 |
const double | kMarginFactor = 1.1 |
const double | kMaxRowSize = 2.5 |
const double | kGoodRowNumberOfColumnsSmall [] = { 2, 2, 2, 2, 2, 3, 3 } |
const int | kGoodRowNumberOfColumnsSmallSize |
const double | kGoodRowNumberOfColumnsLarge = 0.7 |
const double | kMinFilledArea = 0.35 |
const int | kGutterMultiple = 4 |
const int | kGutterToNeighbourRatio = 3 |
const int | kSimilarVectorDist = 10 |
const int | kSimilarRaggedDist = 50 |
const int | kMaxFillinMultiple = 11 |
const double | kMinGutterFraction = 0.5 |
const double | kLineCountReciprocal = 4.0 |
const double | kMinAlignedGutter = 0.25 |
const double | kMinRaggedGutter = 1.5 |
double | textord_tabvector_vertical_gap_fraction = 0.5 |
double | textord_tabvector_vertical_box_ratio = 0.5 |
const char * | kAlignmentNames [] |
const int | kMaxLineLength = 1024 |
const float | kRotationRange = 0.02f |
const int | kExposureFactor = 16 |
const int | kSaltnPepper = 5 |
const int | kMinRampSize = 1000 |
const int | kMinLigature = 0xfb00 |
const int | kMaxLigature = 0xfb17 |
const int | kDefaultResolution = 300 |
Make a word from the selected blobs and run Tess on them.
page_res | recognise blobs |
selection_box | within this box |
fp_eval_word_spacing() Evaluation function for fixed pitch word lists.
Basically, count the number of "nice" characters: those which are in Tesseract-acceptable words or in dictionary words and are not rejected. Penalise any potential noise characters.
build_menu()
Construct the menu tree used by the command window.
process_cmd_win_event()
Process a command returned from the command window (just call the appropriate command handler).
word_blank_and_set_display() Word processor
Blank the display of the word, then redisplay the word according to the current display mode settings.
using tesseract::BlobGridSearch = typedef GridSearch<BLOBNBOX, BLOBNBOX_CLIST, BLOBNBOX_C_IT> |
Definition at line 31 of file blobgrid.h.
using tesseract::char32 = typedef signed int |
typedef TessResultCallback2<bool, const GenericVector<char>&, LSTMTrainer*>* tesseract::CheckPointReader |
Definition at line 69 of file lstmtrainer.h.
typedef TessResultCallback3<bool, SerializeAmount, const LSTMTrainer*, GenericVector<char>*>* tesseract::CheckPointWriter |
Definition at line 78 of file lstmtrainer.h.
using tesseract::ColPartitionGridSearch = typedef GridSearch<ColPartition, ColPartition_CLIST, ColPartition_C_IT> |
Definition at line 936 of file colpartition.h.
using tesseract::ColSegmentGrid = typedef BBGrid<ColSegment, ColSegment_CLIST, ColSegment_C_IT> |
Definition at line 118 of file tablefind.h.
using tesseract::ColSegmentGridSearch = typedef GridSearch<ColSegment, ColSegment_CLIST, ColSegment_C_IT> |
Definition at line 121 of file tablefind.h.
using tesseract::DawgVector = typedef GenericVector<Dawg *> |
typedef int(Dict::* tesseract::DictFunc) (void *void_dawg_args, const UNICHARSET &unicharset, UNICHAR_ID unichar_id, bool word_end) const |
typedef bool(* tesseract::FileReader)(const STRING &filename, GenericVector< char > *data) |
Definition at line 360 of file genericvector.h.
typedef bool(* tesseract::FileWriter)(const GenericVector< char > &data, const STRING &filename) |
Definition at line 363 of file genericvector.h.
typedef void(Wordrec::* tesseract::FillLatticeFunc) (const MATRIX &ratings, const WERD_CHOICE_LIST &best_choices, const UNICHARSET &unicharset, BlamerBundle *blamer_bundle) |
using tesseract::IntKDPair = typedef KDPairInc<int, int> |
using tesseract::LanguageModelFlagsType = typedef unsigned char |
Used for expressing various language model flags.
Definition at line 39 of file lm_state.h.
using tesseract::LigHash = typedef std::unordered_map<std::string, std::string, StringHash> |
Definition at line 36 of file ligature_table.h.
using tesseract::NodeChildVector = typedef GenericVector<NodeChild> |
using tesseract::PainPointHeap = typedef GenericHeap<MatrixCoordPair> |
Definition at line 38 of file lm_pain_points.h.
typedef float(Dict::* tesseract::ParamsModelClassifyFunc) (const char *lang, void *path) |
using tesseract::ParamsTrainingHypothesisList = typedef GenericVector<ParamsTrainingHypothesis> |
Definition at line 127 of file params_training_featdef.h.
using tesseract::PartSetVector = typedef GenericVector<ColPartitionSet*> |
Definition at line 34 of file colpartitionset.h.
typedef double(Dict::* tesseract::ProbabilityInContextFunc) (const char *lang, const char *context, int context_bytes, const char *character, int character_bytes) |
using tesseract::RecodeHeap = typedef GenericHeap<RecodePair> |
Definition at line 176 of file recodebeam.h.
using tesseract::RecodePair = typedef KDPairInc<double, RecodeNode> |
Definition at line 175 of file recodebeam.h.
using tesseract::RSCounts = typedef std::unordered_map<int, int> |
Definition at line 49 of file unicharcompress.cpp.
using tesseract::RSMap = typedef std::unordered_map<int, std::unique_ptr<std::vector<int> >> |
Definition at line 47 of file unicharcompress.cpp.
using tesseract::SetOfModels = typedef GenericVectorEqEq<const ParagraphModel *> |
Definition at line 99 of file paragraphs_internal.h.
using tesseract::ShapeQueue = typedef GenericHeap<ShapeQueueEntry> |
Definition at line 156 of file shapetable.h.
using tesseract::SuccessorList = typedef GenericVector<int> |
using tesseract::SuccessorListsVector = typedef GenericVector<SuccessorList *> |
typedef TessResultCallback4<STRING, int, const double*, const TessdataManager&, int>* tesseract::TestCallback |
Definition at line 83 of file lstmtrainer.h.
typedef TessCallback4<const UNICHARSET &, int, PageIterator *, Pix *> tesseract::TruthCallback |
using tesseract::UnicharAmbigsVector = typedef GenericVector<AmbigSpec_LIST *> |
using tesseract::UnicharIdVector = typedef GenericVector<UNICHAR_ID> |
using tesseract::WidthCallback = typedef TessResultCallback1<bool, int> |
using tesseract::WordGrid = typedef BBGrid<WordWithBox, WordWithBox_CLIST, WordWithBox_C_IT> |
typedef void(Tesseract::* tesseract::WordRecognizer) (const WordData &word_data, WERD_RES **in_word, PointerVector< WERD_RES > *out_words) |
Definition at line 169 of file tesseractclass.h.
using tesseract::WordSearch = typedef GridSearch<WordWithBox, WordWithBox_CLIST, WordWithBox_C_IT> |
enum tesseract::AmbigType |
Enumerator | |
---|---|
NOT_AMBIG | |
REPLACE_AMBIG | |
DEFINITE_AMBIG | |
SIMILAR_AMBIG | |
CASE_AMBIG | |
AMBIG_TYPE_COUNT |
Definition at line 44 of file ambigs.h.
Enumerator | |
---|---|
CS_SEQUENTIAL | |
CS_ROUND_ROBIN |
Definition at line 42 of file imagedata.h.
Enumerator | |
---|---|
CST_FRAGMENT | |
CST_WHOLE | |
CST_IMPROPER | |
CST_NGRAM |
Definition at line 96 of file classify.h.
Enumerator | |
---|---|
ACTION_1_CMD_EVENT | |
RECOG_WERDS | |
RECOG_PSEUDO | |
ACTION_2_CMD_EVENT |
Definition at line 481 of file tessedit.cpp.
Enumerator | |
---|---|
COL_UNKNOWN | |
COL_TEXT | |
COL_TABLE | |
COL_MIXED | |
COL_COUNT |
Definition at line 30 of file tablefind.h.
Enumerator | |
---|---|
CST_NOISE | |
CST_FLOWING | |
CST_HEADING | |
CST_PULLOUT | |
CST_COUNT |
Definition at line 48 of file colpartition.h.
Definition at line 69 of file errorcounter.h.
enum tesseract::DawgType |
Enumerator | |
---|---|
ET_RMS | |
ET_DELTA | |
ET_WORD_RECERR | |
ET_CHAR_ERROR | |
ET_SKIP_RATIO | |
ET_COUNT |
Definition at line 37 of file lstmtrainer.h.
Enumerator | |
---|---|
FN_INCOLOR | |
FN_Y0 | |
FN_Y1 | |
FN_Y2 | |
FN_Y3 | |
FN_X0 | |
FN_X1 | |
FN_SHEAR | |
FN_NUM_FACTORS |
Definition at line 41 of file degradeimage.cpp.
Enumerator | |
---|---|
FD_BATCH | |
FD_HEIGHT | |
FD_WIDTH | |
FD_DIMSIZE |
Definition at line 34 of file stridemap.h.
|
strong |
Enumerator | |
---|---|
kNone | |
kNormalize |
Definition at line 49 of file normstrngs.h.
|
strong |
Enumerator | |
---|---|
kSingleString | |
kCombined | |
kGlyphSplit | |
kIndividualUnicodes |
Definition at line 34 of file validator.h.
Definition at line 39 of file params_training_featdef.h.
Enumerator | |
---|---|
LR_LEFT | |
LR_RIGHT |
Definition at line 39 of file strokewidth.h.
enum tesseract::LineType |
Enumerator | |
---|---|
LT_START | |
LT_BODY | |
LT_UNKNOWN | |
LT_MULTIPLE |
Definition at line 50 of file paragraphs_internal.h.
Enumerator | |
---|---|
LM_PPTYPE_BLAMER | |
LM_PPTYPE_AMBIG | |
LM_PPTYPE_PATH | |
LM_PPTYPE_SHAPE | |
LM_PPTYPE_NUM |
Definition at line 41 of file lm_pain_points.h.
enum tesseract::LossType |
Enumerator | |
---|---|
LT_NONE | |
LT_CTC | |
LT_SOFTMAX | |
LT_LOGISTIC |
Definition at line 29 of file static_shape.h.
Enumerator | |
---|---|
NPT_HTEXT | |
NPT_VTEXT | |
NPT_WEAK_HTEXT | |
NPT_WEAK_VTEXT | |
NPT_IMAGE | |
NPT_COUNT |
Definition at line 1508 of file colpartitiongrid.cpp.
Enumerator | |
---|---|
NF_LAYER_SPECIFIC_LR | |
NF_ADAM |
Definition at line 85 of file network.h.
Definition at line 43 of file network.h.
Enumerator | |
---|---|
NC_ANYTHING | |
NC_ONLY_DUP | |
NC_NO_DUP | |
NC_COUNT |
Definition at line 72 of file recodebeam.h.
Enumerator | |
---|---|
NM_BASELINE | |
NM_CHAR_ISOTROPIC | |
NM_CHAR_ANISOTROPIC |
Definition at line 42 of file normalis.h.
When Tesseract/Cube is initialized we can choose to instantiate/load/run only the Tesseract part, only the Cube part or both along with the combiner. The preference of which engine to use is stored in tessedit_ocr_engine_mode.
ATTENTION: When modifying this enum, please make sure to make the appropriate changes to all the enums mirroring it (e.g. OCREngine in cityblock/workflow/detection/detection_storage.proto). Such enums will mention the connection to OcrEngineMode in the comments.
Enumerator | |
---|---|
OEM_TESSERACT_ONLY | |
OEM_LSTM_ONLY | |
OEM_TESSERACT_LSTM_COMBINED | |
OEM_DEFAULT | |
OEM_COUNT |
Definition at line 268 of file publictypes.h.
|
strong |
Enumerator | |
---|---|
kNone | |
kNormalize |
Definition at line 41 of file normstrngs.h.
```
+------------------+  Orientation Example:
| 1 Aaaa Aaaa Aaaa |  ====================
| Aaa aa aaa aa    |  To left is a diagram of some (1) English and
| aaaaaa A aa aaa. |  (2) Chinese text and a (3) photo credit.
|                2 |
|   #######  c c C |  Upright Latin characters are represented as A and a.
|   #######  c c c |  '<' represents a latin character rotated
| < #######  c c c |      anti-clockwise 90 degrees.
| < #######  c   c |
| < #######  .   c |  Upright Chinese characters are represented C and c.
| 3 #######      c |
+------------------+  NOTA BENE: enum values here should match goodoc.proto
```
If you orient your head so that "up" aligns with Orientation, then the characters will appear "right side up" and readable.
In the example above, both the English and Chinese paragraphs are oriented so their "up" is the top of the page (page up). The photo credit is read with one's head turned leftward ("up" is to page left).
The values of this enum match the convention of Tesseract's osdetect.h
Enumerator | |
---|---|
ORIENTATION_PAGE_UP | |
ORIENTATION_PAGE_RIGHT | |
ORIENTATION_PAGE_DOWN | |
ORIENTATION_PAGE_LEFT |
Definition at line 120 of file publictypes.h.
Enum of the elements of the page hierarchy, used in ResultIterator to provide functions that operate on each level without having to have 5x as many functions.
Enumerator | |
---|---|
RIL_BLOCK | |
RIL_PARA | |
RIL_TEXTLINE | |
RIL_WORD | |
RIL_SYMBOL |
Definition at line 219 of file publictypes.h.
Possible modes for page layout analysis. These must be kept in order of decreasing amount of layout analysis to be done, except for OSD_ONLY, so that the inequality test macros below work.
Definition at line 163 of file publictypes.h.
JUSTIFICATION_UNKNOWN The alignment is not clearly one of the other options. This could happen for example if there are only one or two lines of text or the text looks like source code or poetry.
NOTA BENE: Fully justified paragraphs (text aligned to both left and right margins) are marked by Tesseract with JUSTIFICATION_LEFT if their text is written with a left-to-right script and with JUSTIFICATION_RIGHT if their text is written in a right-to-left script.
Interpretation for text read in vertical lines: "Left" is wherever the starting reading position is.
JUSTIFICATION_LEFT Each line, except possibly the first, is flush to the same left tab stop.
JUSTIFICATION_CENTER The text lines of the paragraph are centered about a line going down through the middle of the text lines.
JUSTIFICATION_RIGHT Each line, except possibly the first, is flush to the same right tab stop.
Enumerator | |
---|---|
JUSTIFICATION_UNKNOWN | |
JUSTIFICATION_LEFT | |
JUSTIFICATION_CENTER | |
JUSTIFICATION_RIGHT |
Definition at line 251 of file publictypes.h.
Enumerator | |
---|---|
PFR_OK | |
PFR_SKEW | |
PFR_NOISE |
Definition at line 46 of file strokewidth.h.
enum tesseract::ScriptPos |
Enumerator | |
---|---|
SP_NORMAL | |
SP_SUBSCRIPT | |
SP_SUPERSCRIPT | |
SP_DROPCAP |
Enumerator | |
---|---|
LIGHT | |
NO_BEST_TRAINER | |
FULL |
Definition at line 56 of file lstmtrainer.h.
Enumerator | |
---|---|
SET_PARAM_CONSTRAINT_NONE | |
SET_PARAM_CONSTRAINT_DEBUG_ONLY | |
SET_PARAM_CONSTRAINT_NON_DEBUG_ONLY | |
SET_PARAM_CONSTRAINT_NON_INIT_ONLY |
Definition at line 36 of file params.h.
Enumerator | |
---|---|
STR_NONE | |
STR_UPDATED | |
STR_REPLACED |
Definition at line 63 of file lstmtrainer.h.
Enumerator | |
---|---|
TA_LEFT_ALIGNED | |
TA_LEFT_RAGGED | |
TA_CENTER_JUSTIFIED | |
TA_RIGHT_ALIGNED | |
TA_RIGHT_RAGGED | |
TA_SEPARATOR | |
TA_COUNT |
Definition at line 45 of file tabvector.h.
Definition at line 56 of file tessdatamanager.h.
The text lines are read in the given sequence.
In English, the order is top-to-bottom. In Chinese, vertical text lines are read right-to-left. Mongolian is written in vertical columns top to bottom like Chinese, but the lines are ordered left-to-right.
Note that only some combinations make sense. For example, WRITING_DIRECTION_LEFT_TO_RIGHT implies TEXTLINE_ORDER_TOP_TO_BOTTOM.
Enumerator | |
---|---|
TEXTLINE_ORDER_LEFT_TO_RIGHT | |
TEXTLINE_ORDER_RIGHT_TO_LEFT | |
TEXTLINE_ORDER_TOP_TO_BOTTOM |
Definition at line 152 of file publictypes.h.
enum tesseract::TopNState |
Enumerator | |
---|---|
TN_TOP2 | |
TN_TOPN | |
TN_ALSO_RAN | |
TN_COUNT |
Definition at line 84 of file recodebeam.h.
Enumerator | |
---|---|
TRAINABLE | |
PERFECT | |
UNENCODABLE | |
HI_PRECISION_ERR | |
NOT_BOXED |
Definition at line 47 of file lstmtrainer.h.
Enumerator | |
---|---|
TF_INT_MODE | |
TF_COMPRESS_UNICHARSET |
Definition at line 46 of file lstmrecognizer.h.
Enumerator | |
---|---|
TS_DISABLED | |
TS_ENABLED | |
TS_TEMP_DISABLE | |
TS_RE_ENABLE |
|
strong |
Enumerator | |
---|---|
kNFD | |
kNFC | |
kNFKD | |
kNFKC |
Definition at line 32 of file normstrngs.h.
|
strong |
Enumerator | |
---|---|
kNonVirama | |
kDevanagari | |
kBengali | |
kGurmukhi | |
kGujarati | |
kOriya | |
kTamil | |
kTelugu | |
kKannada | |
kMalayalam | |
kSinhala | |
kMyanmar | |
kKhmer | |
kJavanese |
Definition at line 53 of file validator.h.
The grapheme clusters within a line of text are laid out logically in this direction, judged when looking at the text line rotated so that its Orientation is "page up".
For English text, the writing direction is left-to-right. For the Chinese text in the above example, the writing direction is top-to-bottom.
Enumerator | |
---|---|
WRITING_DIRECTION_LEFT_TO_RIGHT | |
WRITING_DIRECTION_RIGHT_TO_LEFT | |
WRITING_DIRECTION_TOP_TO_BOTTOM |
Definition at line 135 of file publictypes.h.
|
inline |
Definition at line 191 of file functions.h.
bool tesseract::AsciiLikelyListItem | ( | const STRING & | word | ) |
Definition at line 282 of file paragraphs.cpp.
void tesseract::assign_blobs_to_blocks2 | ( | Pix * | pix, |
BLOCK_LIST * | blocks, | ||
TO_BLOCK_LIST * | port_blocks | ||
) |
Definition at line 168 of file tordmain.cpp.
TrainingSample * tesseract::BlobToTrainingSample | ( | const TBLOB & | blob, |
bool | nonlinear_norm, | ||
INT_FX_RESULT_STRUCT * | fx_info, | ||
GenericVector< INT_FEATURE_STRUCT > * | bl_features | ||
) |
Definition at line 79 of file intfx.cpp.
void tesseract::CanonicalizeDetectionResults | ( | GenericVector< PARA *> * | row_owners, |
PARA_LIST * | paragraphs | ||
) |
Definition at line 2239 of file paragraphs.cpp.
void tesseract::ClearFeatureSpaceWindow | ( | NORM_METHOD | norm_method, |
ScrollView * | window | ||
) |
Clears the given window and draws the featurespace guides for the appropriate normalization method.
Definition at line 998 of file intproto.cpp.
|
inline |
Definition at line 225 of file functions.h.
bool tesseract::cmp_eq | ( | T const & | t1, |
T const & | t2 | ||
) |
Definition at line 415 of file genericvector.h.
|
inline |
Definition at line 231 of file functions.h.
int tesseract::CombineLangModel | ( | const UNICHARSET & | unicharset, |
const std::string & | script_dir, | ||
const std::string & | version_str, | ||
const std::string & | output_dir, | ||
const std::string & | lang, | ||
bool | pass_through_recoder, | ||
const GenericVector< STRING > & | words, | ||
const GenericVector< STRING > & | puncs, | ||
const GenericVector< STRING > & | numbers, | ||
bool | lang_is_rtl, | ||
FileReader | reader, | ||
FileWriter | writer | ||
) |
Definition at line 185 of file lang_model_helpers.cpp.
Definition at line 120 of file fontinfo.cpp.
Definition at line 128 of file fontinfo.cpp.
|
inline |
Definition at line 186 of file functions.h.
|
noexcept |
Definition at line 43 of file serialis.h.
bool tesseract::CrownCompatible | ( | const GenericVector< RowScratchRegisters > * | rows, |
int | a, | ||
int | b, | ||
const ParagraphModel * | model | ||
) |
Definition at line 1301 of file paragraphs.cpp.
struct Pix * tesseract::DegradeImage | ( | Pix * | input, |
int | exposure, | ||
TRand * | randomizer, | ||
float * | rotation | ||
) |
Definition at line 91 of file degradeimage.cpp.
void tesseract::DeleteObject | ( | T * | object | ) |
Definition at line 156 of file tablefind.cpp.
bool tesseract::DeSerialize | ( | FILE * | fp, |
char * | data, | ||
size_t | n | ||
) |
Definition at line 27 of file serialis.cpp.
bool tesseract::DeSerialize | ( | FILE * | fp, |
float * | data, | ||
size_t | n | ||
) |
Definition at line 31 of file serialis.cpp.
bool tesseract::DeSerialize | ( | FILE * | fp, |
int8_t * | data, | ||
size_t | n | ||
) |
Definition at line 35 of file serialis.cpp.
bool tesseract::DeSerialize | ( | FILE * | fp, |
int16_t * | data, | ||
size_t | n | ||
) |
Definition at line 39 of file serialis.cpp.
bool tesseract::DeSerialize | ( | FILE * | fp, |
int32_t * | data, | ||
size_t | n | ||
) |
Definition at line 43 of file serialis.cpp.
bool tesseract::DeSerialize | ( | FILE * | fp, |
uint8_t * | data, | ||
size_t | n | ||
) |
Definition at line 47 of file serialis.cpp.
bool tesseract::DeSerialize | ( | FILE * | fp, |
uint16_t * | data, | ||
size_t | n | ||
) |
Definition at line 51 of file serialis.cpp.
bool tesseract::DeSerialize | ( | FILE * | fp, |
uint32_t * | data, | ||
size_t | n | ||
) |
Definition at line 55 of file serialis.cpp.
void tesseract::DetectParagraphs | ( | int | debug_level, |
GenericVector< RowInfo > * | row_infos, | ||
GenericVector< PARA *> * | row_owners, | ||
PARA_LIST * | paragraphs, | ||
GenericVector< ParagraphModel *> * | models | ||
) |
Definition at line 2271 of file paragraphs.cpp.
void tesseract::DetectParagraphs | ( | int | debug_level, |
bool | after_text_recognition, | ||
const MutableIterator * | block_start, | ||
GenericVector< ParagraphModel *> * | models | ||
) |
Definition at line 2514 of file paragraphs.cpp.
double tesseract::DotProductAVX | ( | const double * | u, |
const double * | v, | ||
int | n | ||
) |
Definition at line 27 of file dotproductavx.cpp.
double tesseract::DotProductSSE | ( | const double * | u, |
const double * | v, | ||
int | n | ||
) |
Definition at line 27 of file dotproductsse.cpp.
bool tesseract::FirstWordWouldHaveFit | ( | const RowScratchRegisters & | before, |
const RowScratchRegisters & | after, | ||
tesseract::ParagraphJustification | justification | ||
) |
Definition at line 1633 of file paragraphs.cpp.
bool tesseract::FirstWordWouldHaveFit | ( | const RowScratchRegisters & | before, |
const RowScratchRegisters & | after | ||
) |
Definition at line 1658 of file paragraphs.cpp.
void tesseract::FontInfoDeleteCallback | ( | FontInfo | f | ) |
Definition at line 139 of file fontinfo.cpp.
void tesseract::FontSetDeleteCallback | ( | FontSet | fs | ) |
Definition at line 146 of file fontinfo.cpp.
Definition at line 282 of file normstrngs.cpp.
|
inline |
Definition at line 146 of file functions.h.
|
inline |
Definition at line 155 of file functions.h.
void tesseract::GeneratePerspectiveDistortion | ( | int | width, |
int | height, | ||
TRand * | randomizer, | ||
Pix ** | pix, | ||
GenericVector< TBOX > * | boxes | ||
) |
Definition at line 219 of file degradeimage.cpp.
std::string tesseract::GetXheightString | ( | const std::string & | script_dir, |
const UNICHARSET & | unicharset | ||
) |
Definition at line 164 of file unicharset_training_utils.cpp.
void tesseract::HistogramRect | ( | Pix * | src_pix, |
int | channel, | ||
int | left, | ||
int | top, | ||
int | width, | ||
int | height, | ||
int * | histogram | ||
) |
Definition at line 151 of file otsuthr.cpp.
STRING tesseract::HOcrEscape | ( | const char * | text | ) |
Escape a char string - replace <>&"' with HTML codes.
Escape a char string - replace &<>"' with HTML codes.
Definition at line 2632 of file baseapi.cpp.
int32_t tesseract::IntDotProductSSE | ( | const int8_t * | u, |
const int8_t * | v, | ||
int | n | ||
) |
Definition at line 31 of file dotproductsse.cpp.
int tesseract::InterwordSpace | ( | const GenericVector< RowScratchRegisters > & | rows, |
int | row_start, | ||
int | row_end | ||
) |
Definition at line 1610 of file paragraphs.cpp.
bool tesseract::IsInterchangeValid | ( | const char32 | ch | ) |
Definition at line 253 of file normstrngs.cpp.
bool tesseract::IsInterchangeValid7BitAscii | ( | const char32 | ch | ) |
Definition at line 276 of file normstrngs.cpp.
|
inline |
Definition at line 93 of file equationdetect.cpp.
Definition at line 214 of file normstrngs.cpp.
|
inline |
Definition at line 98 of file equationdetect.cpp.
|
inline |
Definition at line 89 of file equationdetect.cpp.
bool tesseract::IsUTF8Whitespace | ( | const char * | text | ) |
Definition at line 229 of file normstrngs.cpp.
bool tesseract::IsValidCodepoint | ( | const char32 | ch | ) |
Definition at line 218 of file normstrngs.cpp.
bool tesseract::IsWhitespace | ( | const char32 | ch | ) |
Definition at line 223 of file normstrngs.cpp.
void tesseract::LeftWordAttributes | ( | const UNICHARSET * | unicharset, |
const WERD_CHOICE * | werd, | ||
const STRING & | utf8, | ||
bool * | is_list, | ||
bool * | starts_idea, | ||
bool * | ends_idea | ||
) |
Definition at line 409 of file paragraphs.cpp.
|
inline |
Definition at line 367 of file genericvector.h.
|
inline |
Definition at line 386 of file genericvector.h.
|
inline |
Definition at line 403 of file genericvector.h.
ShapeTable * tesseract::LoadShapeTable | ( | const STRING & | file_prefix | ) |
Definition at line 162 of file commontraining.cpp.
MasterTrainer * tesseract::LoadTrainingData | ( | int | argc, |
const char *const * | argv, | ||
bool | replication, | ||
ShapeTable ** | shape_table, | ||
STRING * | file_prefix | ||
) |
Creates a MasterTrainer and loads the training data into it: Initializes feature_defs and IntegerFX. Loads the shape_table if shape_table != nullptr. Loads initial unicharset from -U command-line option. If FLAGS_T is set, loads the majority of data from there, else:
Definition at line 219 of file commontraining.cpp.
|
inline |
Definition at line 63 of file functions.h.
|
inline |
Definition at line 201 of file functions.h.
|
inline |
Definition at line 196 of file functions.h.
bool tesseract::NormalizeCleanAndSegmentUTF8 | ( | UnicodeNormMode | u_mode, |
OCRNorm | ocr_normalize, | ||
GraphemeNormMode | g_mode, | ||
bool | report_errors, | ||
const char * | str8, | ||
std::vector< std::string > * | graphemes | ||
) |
Definition at line 172 of file normstrngs.cpp.
bool tesseract::NormalizeUTF8String | ( | UnicodeNormMode | u_mode, |
OCRNorm | ocr_normalize, | ||
GraphemeNorm | grapheme_normalize, | ||
const char * | str8, | ||
std::string * | normalized | ||
) |
Definition at line 147 of file normstrngs.cpp.
Definition at line 204 of file normstrngs.cpp.
int tesseract::OtsuStats | ( | const int * | histogram, |
int * | H_out, | ||
int * | omega0_out | ||
) |
Definition at line 174 of file otsuthr.cpp.
int tesseract::OtsuThreshold | ( | Pix * | src_pix, |
int | left, | ||
int | top, | ||
int | width, | ||
int | height, | ||
int ** | thresholds, | ||
int ** | hi_values | ||
) |
Definition at line 39 of file otsuthr.cpp.
int tesseract::ParamsTrainingFeatureByName | ( | const char * | name | ) |
Definition at line 26 of file params_training_featdef.cpp.
void tesseract::ParseCommandLineFlags | ( | const char * | usage, |
int * | argc, | ||
char *** | argv, | ||
const bool | remove_flags | ||
) |
Definition at line 154 of file commandlineflags.cpp.
Pix * tesseract::PrepareDistortedPix | ( | const Pix * | pix, |
bool | perspective, | ||
bool | invert, | ||
bool | white_noise, | ||
bool | smooth_noise, | ||
bool | blur, | ||
int | box_reduction, | ||
TRand * | randomizer, | ||
GenericVector< TBOX > * | boxes | ||
) |
Definition at line 178 of file degradeimage.cpp.
int tesseract::ProjectiveCoeffs | ( | int | width, |
int | height, | ||
TRand * | randomizer, | ||
float ** | im_coeffs, | ||
float ** | box_coeffs | ||
) |
Definition at line 265 of file degradeimage.cpp.
|
inline |
Definition at line 203 of file publictypes.h.
|
inline |
Definition at line 197 of file publictypes.h.
|
inline |
Definition at line 206 of file publictypes.h.
|
inline |
Definition at line 194 of file publictypes.h.
|
inline |
Inline functions that act on a PageSegMode to determine whether components of layout analysis are enabled. Depend critically on the order of elements of PageSegMode. NOTE that arg is an int for compatibility with INT_PARAM.
Definition at line 191 of file publictypes.h.
|
inline |
Definition at line 200 of file publictypes.h.
|
inline |
Definition at line 152 of file fontinfo.cpp.
Definition at line 225 of file fontinfo.cpp.
Definition at line 169 of file fontinfo.cpp.
STRING tesseract::ReadFile | ( | const std::string & | filename, |
FileReader | reader | ||
) |
Definition at line 57 of file lang_model_helpers.cpp.
void* tesseract::ReCachePagesFunc | ( | void * | data | ) |
Definition at line 369 of file imagedata.cpp.
void tesseract::RecomputeMarginsAndClearHypotheses | ( | GenericVector< RowScratchRegisters > * | rows, |
int | start, | ||
int | end, | ||
int | percentile | ||
) |
Definition at line 1570 of file paragraphs.cpp.
void tesseract::RightWordAttributes | ( | const UNICHARSET * | unicharset, |
const WERD_CHOICE * | werd, | ||
const STRING & | utf8, | ||
bool * | is_list, | ||
bool * | starts_idea, | ||
bool * | ends_idea | ||
) |
Definition at line 456 of file paragraphs.cpp.
bool tesseract::RowsFitModel | ( | const GenericVector< RowScratchRegisters > * | rows, |
int | start, | ||
int | end, | ||
const ParagraphModel * | model | ||
) |
Definition at line 1813 of file paragraphs.cpp.
|
inline |
Definition at line 393 of file genericvector.h.
const char * tesseract::ScriptPosToString | ( | enum ScriptPos | script_pos | ) |
Definition at line 200 of file ratngs.cpp.
bool tesseract::Serialize | ( | FILE * | fp, |
const char * | data, | ||
size_t | n | ||
) |
Definition at line 59 of file serialis.cpp.
bool tesseract::Serialize | ( | FILE * | fp, |
const float * | data, | ||
size_t | n | ||
) |
Definition at line 63 of file serialis.cpp.
bool tesseract::Serialize | ( | FILE * | fp, |
const int8_t * | data, | ||
size_t | n | ||
) |
Definition at line 67 of file serialis.cpp.
bool tesseract::Serialize | ( | FILE * | fp, |
const int16_t * | data, | ||
size_t | n | ||
) |
Definition at line 71 of file serialis.cpp.
bool tesseract::Serialize | ( | FILE * | fp, |
const int32_t * | data, | ||
size_t | n | ||
) |
Definition at line 75 of file serialis.cpp.
bool tesseract::Serialize | ( | FILE * | fp, |
const uint8_t * | data, | ||
size_t | n | ||
) |
Definition at line 79 of file serialis.cpp.
bool tesseract::Serialize | ( | FILE * | fp, |
const uint16_t * | data, | ||
size_t | n | ||
) |
Definition at line 83 of file serialis.cpp.
bool tesseract::Serialize | ( | FILE * | fp, |
const uint32_t * | data, | ||
size_t | n | ||
) |
Definition at line 87 of file serialis.cpp.
void tesseract::SetBlobStrokeWidth | ( | Pix * | pix, |
BLOBNBOX * | blob | ||
) |
Definition at line 69 of file tordmain.cpp.
void tesseract::SetPropertiesForInputFile | ( | const std::string & | script_dir, |
const std::string & | input_unicharset_file, | ||
const std::string & | output_unicharset_file, | ||
const std::string & | output_xheights_file | ||
) |
Definition at line 183 of file unicharset_training_utils.cpp.
void tesseract::SetScriptProperties | ( | const std::string & | script_dir, |
UNICHARSET * | unicharset | ||
) |
Definition at line 143 of file unicharset_training_utils.cpp.
|
inline |
Definition at line 38 of file unicharset_training_utils.h.
void tesseract::SetupBasicProperties | ( | bool | report_errors, |
bool | decompose, | ||
UNICHARSET * | unicharset | ||
) |
Definition at line 40 of file unicharset_training_utils.cpp.
|
inline |
Definition at line 163 of file functions.h.
int tesseract::sort_cmp | ( | const void * | t1, |
const void * | t2 | ||
) |
Definition at line 424 of file genericvector.h.
int tesseract::sort_ptr_cmp | ( | const void * | t1, |
const void * | t2 | ||
) |
Definition at line 441 of file genericvector.h.
int tesseract::SortByBoxBottom | ( | const void * | void1, |
const void * | void2 | ||
) |
int tesseract::SortByBoxLeft | ( | const void * | void1, |
const void * | void2 | ||
) |
int tesseract::SortByRating | ( | const void * | void1, |
const void * | void2 | ||
) |
Definition at line 84 of file pieces.cpp.
int tesseract::SortByUnicharID | ( | const void * | void1, |
const void * | void2 | ||
) |
Definition at line 76 of file pieces.cpp.
int tesseract::SortRightToLeft | ( | const void * | void1, |
const void * | void2 | ||
) |
unsigned int tesseract::SpanUTF8NotWhitespace | ( | const char * | text | ) |
Definition at line 243 of file normstrngs.cpp.
unsigned int tesseract::SpanUTF8Whitespace | ( | const char * | text | ) |
Definition at line 233 of file normstrngs.cpp.
|
inline |
Definition at line 71 of file paragraphs_internal.h.
|
inline |
Definition at line 209 of file functions.h.
|
inline |
Definition at line 45 of file functions.h.
Pix * tesseract::TraceBlockOnReducedPix | ( | BLOCK * | block, |
int | gridsize, | ||
ICOORD | bleft, | ||
int * | left, | ||
int * | bottom | ||
) |
Definition at line 255 of file bbgrid.cpp.
Pix * tesseract::TraceOutlineOnReducedPix | ( | C_OUTLINE * | outline, |
int | gridsize, | ||
ICOORD | bleft, | ||
int * | left, | ||
int * | bottom | ||
) |
Definition at line 229 of file bbgrid.cpp.
int tesseract::UnicodeFor | ( | const UNICHARSET * | u, |
const WERD_CHOICE * | werd, | ||
int | pos | ||
) |
Definition at line 289 of file paragraphs.cpp.
bool tesseract::ValidBodyLine | ( | const GenericVector< RowScratchRegisters > * | rows, |
int | row, | ||
const ParagraphModel * | model | ||
) |
Definition at line 1290 of file paragraphs.cpp.
bool tesseract::ValidFirstLine | ( | const GenericVector< RowScratchRegisters > * | rows, |
int | row, | ||
const ParagraphModel * | model | ||
) |
Definition at line 1279 of file paragraphs.cpp.
bool tesseract::write_info | ( | FILE * | f, |
const FontInfo & | fi | ||
) |
Definition at line 162 of file fontinfo.cpp.
bool tesseract::write_set | ( | FILE * | f, |
const FontSet & | fs | ||
) |
Definition at line 231 of file fontinfo.cpp.
bool tesseract::write_spacing_info | ( | FILE * | f, |
const FontInfo & | fi | ||
) |
Definition at line 197 of file fontinfo.cpp.
bool tesseract::WriteFile | ( | const std::string & | output_dir, |
const std::string & | lang, | ||
const std::string & | suffix, | ||
const GenericVector< char > & | data, | ||
FileWriter | writer | ||
) |
Definition at line 36 of file lang_model_helpers.cpp.
bool tesseract::WriteRecoder | ( | const UNICHARSET & | unicharset, |
bool | pass_through, | ||
const std::string & | output_dir, | ||
const std::string & | lang, | ||
FileWriter | writer, | ||
STRING * | radical_table_data, | ||
TessdataManager * | traineddata | ||
) |
Definition at line 85 of file lang_model_helpers.cpp.
void tesseract::WriteShapeTable | ( | const STRING & | file_prefix, |
const ShapeTable & | shape_table | ||
) |
Definition at line 187 of file commontraining.cpp.
bool tesseract::WriteUnicharset | ( | const UNICHARSET & | unicharset, |
const std::string & | output_dir, | ||
const std::string & | lang, | ||
FileWriter | writer, | ||
TessdataManager * | traineddata | ||
) |
Definition at line 71 of file lang_model_helpers.cpp.
|
inline |
Definition at line 219 of file functions.h.
const int tesseract::case_state_table[6][4] |
Definition at line 35 of file context.cpp.
const int tesseract::kAdamCorrectionIterations = 200000 |
Definition at line 37 of file weightmatrix.cpp.
const double tesseract::kAdamEpsilon = 1e-8 |
Definition at line 39 of file weightmatrix.cpp.
const int tesseract::kAdamFlag = 4 |
Definition at line 144 of file weightmatrix.cpp.
const int tesseract::kAdjacentLeaderSearchPadding = 2 |
Definition at line 117 of file tablefind.cpp.
const double tesseract::kAlignedFraction = 0.03125 |
Definition at line 39 of file alignedblob.cpp.
const double tesseract::kAlignedGapFraction = 0.75 |
Definition at line 43 of file alignedblob.cpp.
const char* tesseract::kAlignmentNames[] |
Definition at line 510 of file tabvector.cpp.
const double tesseract::kAllowBlobArea = 0.05 |
Definition at line 58 of file tablefind.cpp.
const double tesseract::kAllowBlobHeight = 0.3 |
Definition at line 56 of file tablefind.cpp.
const double tesseract::kAllowBlobWidth = 0.4 |
Definition at line 57 of file tablefind.cpp.
const double tesseract::kAllowTextArea = 0.8 |
Definition at line 51 of file tablefind.cpp.
const double tesseract::kAllowTextHeight = 0.5 |
Definition at line 49 of file tablefind.cpp.
const double tesseract::kAllowTextWidth = 0.6 |
Definition at line 50 of file tablefind.cpp.
const char * tesseract::kApostropheLikeUTF8 |
Definition at line 48 of file unicodes.cpp.
const double tesseract::kBestCheckpointFraction = 31.0 / 32.0 |
Definition at line 68 of file lstmtrainer.cpp.
const double tesseract::kBigPartSizeRatio = 1.75 |
Definition at line 49 of file colpartitiongrid.cpp.
const int tesseract::kBoxClipTolerance = 2 |
Definition at line 31 of file boxword.cpp.
const double tesseract::kBrokenCJKIterationFraction = 0.125 |
Definition at line 68 of file strokewidth.cpp.
const int tesseract::kBytesPer64BitNumber = 20 |
Max bytes in the decimal representation of int64_t.
Definition at line 1828 of file baseapi.cpp.
const int tesseract::kBytesPerBoxFileLine = (kBytesPerNumber + 1) * kNumbersPerBlob + 1 |
Multiplier for max expected textlength: assumes (kBytesPerNumber + space) * kNumbersPerBlob, plus one more byte per box-file line (presumably the newline).
Definition at line 1826 of file baseapi.cpp.
const int tesseract::kBytesPerNumber = 5 |
The number of bytes taken by each number. Since we use int16_t for ICOORD, assume only 5 digits max.
Definition at line 1820 of file baseapi.cpp.
const int tesseract::kCellSplitColumnThreshold = 0 |
Definition at line 42 of file tablerecog.cpp.
const int tesseract::kCellSplitRowThreshold = 0 |
Definition at line 41 of file tablerecog.cpp.
const float tesseract::kCertaintyScale = 7.0f |
Definition at line 36 of file linerec.cpp.
const double tesseract::kCertOffset = -0.085 |
Definition at line 47 of file lstmrecognizer.cpp.
const double tesseract::kCJKAspectRatio = 1.25 |
Definition at line 62 of file strokewidth.cpp.
const double tesseract::kCJKAspectRatioIncrease = 1.0625 |
Definition at line 64 of file strokewidth.cpp.
const double tesseract::kCJKBrokenDistanceFraction = 0.25 |
Definition at line 58 of file strokewidth.cpp.
const int tesseract::kCJKMaxComponents = 8 |
Definition at line 60 of file strokewidth.cpp.
const int tesseract::kCJKRadius = 2 |
Definition at line 56 of file strokewidth.cpp.
const int tesseract::kColumnWidthFactor = 20 |
const double tesseract::kCosMaxSkewAngle = 0.866025 |
Definition at line 61 of file tabfind.cpp.
const int tesseract::kCrackSpacing = 100 |
Spacing of cracks across the page to break up tall vertical lines.
Definition at line 43 of file linefind.cpp.
const ParagraphModel * tesseract::kCrownLeft = reinterpret_cast<ParagraphModel *>(0xDEAD111F) |
Definition at line 55 of file paragraphs.cpp.
const ParagraphModel * tesseract::kCrownRight = reinterpret_cast<ParagraphModel *>(0xDEAD888F) |
Definition at line 57 of file paragraphs.cpp.
const int tesseract::kDefaultResolution = 300 |
Definition at line 71 of file pango_font_info.cpp.
const double tesseract::kDiacriticXPadRatio = 7.0 |
Definition at line 71 of file strokewidth.cpp.
const double tesseract::kDiacriticYPadRatio = 1.75 |
Definition at line 74 of file strokewidth.cpp.
const double tesseract::kDictRatio = 2.25 |
Definition at line 45 of file lstmrecognizer.cpp.
const int tesseract::kDoubleFlag = 128 |
Definition at line 148 of file weightmatrix.cpp.
const int tesseract::kErrorGraphInterval = 1000 |
Definition at line 56 of file lstmtrainer.cpp.
const int tesseract::kExposureFactor = 16 |
Definition at line 58 of file degradeimage.cpp.
const int tesseract::kFeaturePadding = 2 |
Definition at line 37 of file imagedata.h.
const float tesseract::kFontMergeDistance = 0.025 |
Definition at line 49 of file mastertrainer.cpp.
const double tesseract::kGoodRowNumberOfColumnsLarge = 0.7 |
Definition at line 60 of file tablerecog.cpp.
const double tesseract::kGoodRowNumberOfColumnsSmall[] = { 2, 2, 2, 2, 2, 3, 3 } |
Definition at line 56 of file tablerecog.cpp.
const int tesseract::kGoodRowNumberOfColumnsSmallSize |
Definition at line 57 of file tablerecog.cpp.
const int tesseract::kGutterMultiple = 4 |
Definition at line 36 of file tabvector.cpp.
const int tesseract::kGutterToNeighbourRatio = 3 |
Definition at line 38 of file tabvector.cpp.
const double tesseract::kHighConfidence = 0.9375 |
Definition at line 64 of file lstmtrainer.cpp.
const int tesseract::kHistogramBuckets = 16 |
Definition at line 341 of file weightmatrix.cpp.
const double tesseract::kHorizontalGapMergeFraction = 0.5 |
Definition at line 50 of file colfind.cpp.
const double tesseract::kHorizontalSpacing = 0.30 |
Definition at line 35 of file tablerecog.cpp.
const int tesseract::kHorzStrongTextlineAspect = 5 |
Definition at line 67 of file colpartition.cpp.
const int tesseract::kHorzStrongTextlineCount = 8 |
Definition at line 63 of file colpartition.cpp.
const int tesseract::kHorzStrongTextlineHeight = 10 |
Definition at line 65 of file colpartition.cpp.
const char * tesseract::kHyphenLikeUTF8 |
The following are confusable internal word punctuation symbols which we normalize to the first variant when matching in dawgs.
Definition at line 32 of file unicodes.cpp.
const int tesseract::kImagePadding = 4 |
Definition at line 39 of file imagedata.h.
const double tesseract::kImprovementFraction = 15.0 / 16.0 |
Definition at line 66 of file lstmtrainer.cpp.
const float tesseract::kInfiniteDist = 999.0f |
Definition at line 906 of file mastertrainer.cpp.
const char* tesseract::kInputFile = "noname.tif" |
Filename used for input image file, from which to derive a name to search for a possible UNLV zone file, if none is specified by SetInputName.
Definition at line 108 of file baseapi.cpp.
const int tesseract::kInt8Flag = 1 |
Definition at line 142 of file weightmatrix.cpp.
const double tesseract::kLargeTableProjectionThreshold = 0.45 |
Definition at line 107 of file tablefind.cpp.
const int tesseract::kLargeTableRowCount = 6 |
Definition at line 109 of file tablefind.cpp.
const int tesseract::kLatinChs[] |
Latin chars corresponding to the Unicode chars in kUniChs.
Definition at line 1889 of file baseapi.cpp.
const double tesseract::kLearningRateDecay = sqrt(0.5) |
Definition at line 52 of file lstmtrainer.cpp.
const int tesseract::kLeftIndentAlignmentCountTh = 1 |
Definition at line 86 of file equationdetect.cpp.
const double tesseract::kLineCountReciprocal = 4.0 |
Definition at line 49 of file tabvector.cpp.
const int tesseract::kLinedTableMinHorizontalLines = 3 |
Definition at line 45 of file tablerecog.cpp.
const int tesseract::kLinedTableMinVerticalLines = 3 |
Definition at line 44 of file tablerecog.cpp.
const int tesseract::kLineFindGridSize = 50 |
Grid size used by line finder. Not very critical.
Definition at line 45 of file linefind.cpp.
const double tesseract::kLineFragmentAspectRatio = 10.0 |
Definition at line 55 of file tabfind.cpp.
const double tesseract::kLineResidueAspectRatio = 8.0 |
Definition at line 95 of file strokewidth.cpp.
const int tesseract::kLineResiduePadRatio = 3 |
Definition at line 97 of file strokewidth.cpp.
const double tesseract::kLineResidueSizeRatio = 1.75 |
Definition at line 99 of file strokewidth.cpp.
const int tesseract::kLineTrapLongest = 4 |
Definition at line 88 of file strokewidth.cpp.
const int tesseract::kLineTrapShortest = 2 |
Definition at line 90 of file strokewidth.cpp.
const char * tesseract::kLRM = "\u200E" |
Definition at line 27 of file unicodes.cpp.
const double tesseract::kMarginFactor = 1.1 |
Definition at line 50 of file tablerecog.cpp.
const double tesseract::kMarginOverlapFraction = 0.25 |
Definition at line 47 of file colpartitiongrid.cpp.
const float tesseract::kMathDigitDensityTh1 = 0.25 |
Definition at line 81 of file equationdetect.cpp.
const float tesseract::kMathDigitDensityTh2 = 0.1 |
Definition at line 82 of file equationdetect.cpp.
const float tesseract::kMathItalicDensityTh = 0.5 |
Definition at line 83 of file equationdetect.cpp.
const int tesseract::kMaxAmbigStringSize = UNICHAR_LEN * (MAX_AMBIG_SIZE + 1) |
Definition at line 36 of file ambigs.cpp.
const double tesseract::kMaxBaselineError = 0.4375 |
Definition at line 70 of file colpartition.cpp.
const double tesseract::kMaxBlobOverlapFactor = 4.0 |
Definition at line 77 of file tablefind.cpp.
const int tesseract::kMaxBlobWidth = 500 |
Definition at line 40 of file tablefind.cpp.
const int16_t tesseract::kMaxBoxEdgeDiff = 2 |
Definition at line 31 of file recogtraining.cpp.
const int tesseract::kMaxBoxesInDataPartition = 20 |
Definition at line 66 of file tablefind.cpp.
const int tesseract::kMaxBytesPerLine |
A maximal single box could occupy kNumbersPerBlob numbers at kBytesPer64BitNumber digits (if someone sneaks in a 64 bit value) and a space plus the newline and the maximum length of a UNICHAR. Test against this on each iteration for safety.
Definition at line 1835 of file baseapi.cpp.
const int tesseract::kMaxCaptionLines = 7 |
Definition at line 41 of file colpartitiongrid.cpp.
const int tesseract::kMaxCharTopRange = 48 |
Definition at line 67 of file fixxht.cpp.
const int tesseract::kMaxCircleErosions = 8 |
Definition at line 53 of file pagesegmain.cpp.
const int tesseract::kMaxCJKSizeRatio = 5 |
Definition at line 66 of file strokewidth.cpp.
const int tesseract::kMaxColorDistance = 900 |
Definition at line 77 of file colpartition.cpp.
const int tesseract::kMaxColumnHeaderDistance = 4 |
Definition at line 85 of file tablefind.cpp.
const double tesseract::kMaxDiacriticDistanceRatio = 1.25 |
Definition at line 80 of file strokewidth.cpp.
const double tesseract::kMaxDiacriticGapToBaseCharHeight = 1.0 |
Definition at line 83 of file strokewidth.cpp.
const double tesseract::kMaxDistToPartSizeRatio = 1.5 |
Definition at line 55 of file colfind.cpp.
const int tesseract::kMaxFillinMultiple = 11 |
Definition at line 45 of file tabvector.cpp.
const double tesseract::kMaxGapInTextPartition = 4.0 |
Definition at line 69 of file tablefind.cpp.
const double tesseract::kMaxGutterWidthAbsolute = 2.00 |
Definition at line 50 of file tabfind.cpp.
const int tesseract::kMaxIncompatibleColumnCount = 2 |
Definition at line 47 of file colfind.cpp.
const int tesseract::kMaxIntSize = 22 |
Max string length of an int.
Definition at line 114 of file baseapi.cpp.
const int tesseract::kMaxLargeOverlapsWithMedium = 12 |
Definition at line 44 of file ccnontextdetect.cpp.
const int tesseract::kMaxLargeOverlapsWithSmall = 3 |
Definition at line 35 of file ccnontextdetect.cpp.
const double tesseract::kMaxLeaderGapFractionOfMax = 0.25 |
Definition at line 53 of file colpartition.cpp.
const double tesseract::kMaxLeaderGapFractionOfMin = 0.5 |
Definition at line 55 of file colpartition.cpp.
const int tesseract::kMaxLigature = 0xfb17 |
Definition at line 46 of file ligature_table.cpp.
const int tesseract::kMaxLineLength = 1024 |
Definition at line 318 of file boxchar.cpp.
const int tesseract::kMaxLineResidue = 6 |
Definition at line 51 of file linefind.cpp.
const int tesseract::kMaxMediumOverlapsWithSmall = 12 |
Definition at line 40 of file ccnontextdetect.cpp.
const int tesseract::kMaxNeighbourDistFactor = 4 |
Definition at line 39 of file colpartitiongrid.cpp.
const double tesseract::kMaxNonLineDensity = 0.25 |
Definition at line 56 of file linefind.cpp.
const int tesseract::kMaxOffsetDist = 32 |
Definition at line 32 of file intfeaturemap.cpp.
const int tesseract::kMaxPadFactor = 6 |
Definition at line 36 of file colpartitiongrid.cpp.
const double tesseract::kMaxParagraphEndingLeftSpaceMultiple = 3.0 |
Definition at line 126 of file tablefind.cpp.
const double tesseract::kMaxPartitionSpacing = 1.75 |
Definition at line 64 of file colpartitiongrid.cpp.
const int tesseract::kMaxRaggedSearch = 25 |
Definition at line 40 of file tabfind.cpp.
const int tesseract::kMaxRealDistance = 2.0 |
Definition at line 39 of file detlinefit.cpp.
const double tesseract::kMaxRectangularFraction = 0.75 |
Definition at line 43 of file imagefind.cpp.
const double tesseract::kMaxRectangularGradient = 0.1 |
Definition at line 46 of file imagefind.cpp.
const int tesseract::kMaxRMSColorNoise = 128 |
Definition at line 74 of file colpartition.cpp.
const double tesseract::kMaxRowSize = 2.5 |
Definition at line 53 of file tablerecog.cpp.
const double tesseract::kMaxSameBlockLineSpacing = 3 |
Definition at line 49 of file colpartition.cpp.
const double tesseract::kMaxSizeRatio = 1.5 |
Definition at line 51 of file colpartition.cpp.
const int tesseract::kMaxSkewFactor = 15 |
Definition at line 65 of file alignedblob.cpp.
const double tesseract::kMaxSmallNeighboursPerPix = 1.0 / 32 |
Definition at line 32 of file ccnontextdetect.cpp.
const double tesseract::kMaxSpacingDrift = 1.0 / 72 |
Definition at line 43 of file colpartition.cpp.
const double tesseract::kMaxStaveHeight = 1.0 |
Definition at line 58 of file linefind.cpp.
const double tesseract::kMaxTableCellXheight = 2.0 |
Definition at line 81 of file tablefind.cpp.
const double tesseract::kMaxTopSpacingFraction = 0.25 |
Definition at line 46 of file colpartition.cpp.
const int tesseract::kMaxUnicharsPerCluster = 2000 |
Definition at line 47 of file mastertrainer.cpp.
const int tesseract::kMaxVerticalSearch = 12 |
Definition at line 39 of file tabfind.cpp.
const int tesseract::kMaxVerticalSpacing = 500 |
Definition at line 38 of file tablefind.cpp.
const int tesseract::kMaxWinSize = 2000 |
Definition at line 51 of file network.cpp.
const double tesseract::kMaxXProjectionGapFactor = 2.0 |
Definition at line 136 of file tablefind.cpp.
const double tesseract::kMinAlignedGutter = 0.25 |
Definition at line 51 of file tabvector.cpp.
const int tesseract::kMinAlignedTabs = 4 |
Definition at line 55 of file alignedblob.cpp.
const double tesseract::kMinBaselineCoverage = 0.5 |
Definition at line 72 of file colpartition.cpp.
const int tesseract::kMinBoxesInTextPartition = 10 |
Definition at line 63 of file tablefind.cpp.
const double tesseract::kMinCaptionGapHeightRatio = 0.5 |
Definition at line 45 of file colpartitiongrid.cpp.
const double tesseract::kMinCaptionGapRatio = 2.0 |
Definition at line 43 of file colpartitiongrid.cpp.
const float tesseract::kMinCertainty = -20.0f |
Definition at line 30 of file networkio.cpp.
const int tesseract::kMinChainTextValue = 3 |
Definition at line 61 of file colpartition.cpp.
const int tesseract::kMinClusteredShapes = 1 |
Definition at line 45 of file mastertrainer.cpp.
const int tesseract::kMinColorDifference = 16 |
Definition at line 52 of file imagefind.cpp.
const int tesseract::kMinColumnWidth = 2.0 / 3 |
Definition at line 32 of file colpartitionset.cpp.
const double tesseract::kMinDiacriticSizeRatio = 1.0625 |
Definition at line 77 of file strokewidth.cpp.
const double tesseract::kMinDivergenceRate = 50.0 |
Definition at line 45 of file lstmtrainer.cpp.
const int tesseract::kMinEvaluatedTabs = 3 |
Definition at line 57 of file tabfind.cpp.
const double tesseract::kMinFilledArea = 0.35 |
Definition at line 63 of file tablerecog.cpp.
const double tesseract::kMinFractionalLinesInColumn = 0.125 |
Definition at line 46 of file tabfind.cpp.
const double tesseract::kMinGoodTextPARatio = 1.5 |
Definition at line 60 of file ccnontextdetect.cpp.
const double tesseract::kMinGutterFraction = 0.5 |
Definition at line 47 of file tabvector.cpp.
const double tesseract::kMinGutterWidthGrid = 0.5 |
Definition at line 52 of file colfind.cpp.
const int tesseract::kMinImageFindSize = 100 |
Definition at line 48 of file imagefind.cpp.
const int tesseract::kMinLeaderCount = 5 |
Definition at line 57 of file colpartition.cpp.
const int tesseract::kMinLigature = 0xfb00 |
Definition at line 45 of file ligature_table.cpp.
const int tesseract::kMinLineLengthFraction = 4 |
Denominator applied to the resolution to obtain the minimum length, in pixels, that a line must have.
Definition at line 41 of file linefind.cpp.
const int tesseract::kMinLinesInColumn = 10 |
Definition at line 42 of file tabfind.cpp.
const double tesseract::kMinMaxGapInTextPartition = 0.5 |
Definition at line 73 of file tablefind.cpp.
const double tesseract::kMinMusicPixelFraction = 0.75 |
Definition at line 60 of file linefind.cpp.
const double tesseract::kMinOverlapWithTable = 0.6 |
Definition at line 97 of file tablefind.cpp.
const double tesseract::kMinParagraphEndingTextToWhitespaceRatio = 3.0 |
Definition at line 132 of file tablefind.cpp.
const int tesseract::kMinPointsForErrorCount = 16 |
Definition at line 36 of file detlinefit.cpp.
const float tesseract::kMinProb = exp(kMinCertainty) |
Definition at line 32 of file networkio.cpp.
const double tesseract::kMinRaggedGutter = 1.5 |
Definition at line 53 of file tabvector.cpp.
const int tesseract::kMinRaggedTabs = 5 |
Definition at line 53 of file alignedblob.cpp.
const int tesseract::kMinRampSize = 1000 |
Definition at line 62 of file degradeimage.cpp.
const double tesseract::kMinRectangularFraction = 0.125 |
Definition at line 41 of file imagefind.cpp.
const int tesseract::kMinRectSize = 10 |
Minimum sensible image size to be worth running tesseract.
Definition at line 97 of file baseapi.cpp.
const int tesseract::kMinRowsInTable = 3 |
Definition at line 112 of file tablefind.cpp.
const int tesseract::kMinStallIterations = 10000 |
Definition at line 47 of file lstmtrainer.cpp.
const int tesseract::kMinStartedErrorRate = 75 |
Definition at line 60 of file lstmtrainer.cpp.
const int tesseract::kMinStrongTextValue = 6 |
Definition at line 59 of file colpartition.cpp.
const double tesseract::kMinTabGradient = 4.0 |
Definition at line 61 of file alignedblob.cpp.
const int tesseract::kMinThickLineWidth = 12 |
Definition at line 47 of file linefind.cpp.
const int tesseract::kMinVerticalSearch = 3 |
Definition at line 38 of file tabfind.cpp.
const int tesseract::kMinWinSize = 500 |
Definition at line 50 of file network.cpp.
const int tesseract::kMostlyOneDirRatio = 3 |
Definition at line 93 of file strokewidth.cpp.
const double tesseract::kNeighbourSearchFactor = 2.5 |
Definition at line 103 of file strokewidth.cpp.
const char* tesseract::kNodeContNames[] = {"Anything", "OnlyDup", "NoDup"} |
Definition at line 45 of file recodebeam.cpp.
const double tesseract::kNoiseOverlapAreaFactor = 1.0 / 512 |
Definition at line 108 of file strokewidth.cpp.
const double tesseract::kNoiseOverlapGrowthFactor = 4.0 |
Definition at line 105 of file strokewidth.cpp.
const int tesseract::kNoisePadding = 4 |
Definition at line 51 of file ccnontextdetect.cpp.
const char* tesseract::kNullChar = "<nul>" |
Definition at line 30 of file unicharcompress.cpp.
const int tesseract::kNumAdjustmentIterations = 100 |
Definition at line 54 of file lstmtrainer.cpp.
const int tesseract::kNumbersPerBlob = 5 |
The 5 numbers output for each box (the usual 4 and a page number.)
Definition at line 1815 of file baseapi.cpp.
const int tesseract::kNumEndPoints = 3 |
Definition at line 30 of file detlinefit.cpp.
const int tesseract::kNumPagesPerBatch = 100 |
Definition at line 58 of file lstmtrainer.cpp.
const char* tesseract::kOldVarsFile = "failed_vars.txt" |
Temp file used for storing current parameters before applying retry values.
Definition at line 112 of file baseapi.cpp.
const int tesseract::kOriginalNoiseMultiple = 8 |
Definition at line 47 of file ccnontextdetect.cpp.
const double tesseract::kParagraphEndingPreviousLineRatio = 1.3 |
Definition at line 122 of file tablefind.cpp.
const char * tesseract::kPDF = "\u202C" |
Definition at line 30 of file unicodes.cpp.
const double tesseract::kPhotoOffsetFraction = 0.375 |
Definition at line 54 of file ccnontextdetect.cpp.
const int tesseract::kPrime1 = 17 |
Definition at line 36 of file trainingsampleset.cpp.
const int tesseract::kPrime2 = 13 |
Definition at line 37 of file trainingsampleset.cpp.
const int tesseract::kRadicalRadix = 29 |
Definition at line 32 of file unicharcompress.cpp.
const double tesseract::kRaggedFraction = 2.5 |
Definition at line 41 of file alignedblob.cpp.
const double tesseract::kRaggedGapFraction = 1.0 |
Definition at line 45 of file alignedblob.cpp.
const int tesseract::kRaggedGutterMultiple = 5 |
Definition at line 52 of file tabfind.cpp.
const int tesseract::kRandomizingCenter = 128 |
Definition at line 35 of file trainingsample.cpp.
const double tesseract::kRatingEpsilon = 1.0 / 32 |
Definition at line 31 of file errorcounter.cpp.
const double tesseract::kRequiredColumns = 0.7 |
Definition at line 48 of file tablerecog.cpp.
const char tesseract::kReverseIfHasRTL[] = "RRP_REVERSE_IF_HAS_RTL" |
const int tesseract::kRGBRMSColors = 4 |
Definition at line 37 of file colpartition.h.
const char * tesseract::kRLE = "\u202A" |
Definition at line 29 of file unicodes.cpp.
const char * tesseract::kRLM = "\u200F" |
Definition at line 28 of file unicodes.cpp.
const double tesseract::kRMSFitScaling = 8.0 |
Definition at line 50 of file imagefind.cpp.
const float tesseract::kRotationRange = 0.02f |
Definition at line 56 of file degradeimage.cpp.
const int tesseract::kRulingVerticalMargin = 3 |
Definition at line 93 of file tablefind.cpp.
const int tesseract::kSaltnPepper = 5 |
Definition at line 60 of file degradeimage.cpp.
const double tesseract::kScaleFactor = 256.0 |
Definition at line 39 of file functions.h.
const int tesseract::kSeedBlobsCountTh = 10 |
Definition at line 85 of file equationdetect.cpp.
const int tesseract::kSideSpaceMargin = 10 |
Definition at line 102 of file tablefind.cpp.
const int tesseract::kSimilarRaggedDist = 50 |
Definition at line 43 of file tabvector.cpp.
const int tesseract::kSimilarVectorDist = 10 |
Definition at line 40 of file tabvector.cpp.
const int tesseract::ksizeofUniversalAmbigsFile = sizeof(kUniversalAmbigsFile) |
Definition at line 27 of file universalambigs.h.
const float tesseract::kSizeRatioToReject = 2.0 |
Definition at line 101 of file strokewidth.cpp.
const double tesseract::kSmallTableProjectionThreshold = 0.35 |
Definition at line 106 of file tablefind.cpp.
const int tesseract::kSmoothDecisionMargin = 4 |
Definition at line 67 of file colpartitiongrid.cpp.
const double tesseract::kSplitPartitionSize = 2.0 |
Definition at line 44 of file tablefind.cpp.
const int tesseract::kSquareLimit = 25 |
Definition at line 34 of file trainingsampleset.cpp.
const double tesseract::kStageTransitionThreshold = 10.0 |
Definition at line 62 of file lstmtrainer.cpp.
const double tesseract::kStrokeWidthCJK = 2.0 |
Definition at line 53 of file strokewidth.cpp.
const double tesseract::kStrokeWidthConstantTolerance = 2.0 |
Definition at line 141 of file tablefind.cpp.
const double tesseract::kStrokeWidthFractionalTolerance = 0.25 |
Definition at line 140 of file tablefind.cpp.
const double tesseract::kStrokeWidthFractionCJK = 0.25 |
Definition at line 52 of file strokewidth.cpp.
const double tesseract::kStrokeWidthFractionTolerance = 0.125 |
Allowed proportional change in stroke width to be the same font.
Definition at line 45 of file strokewidth.cpp.
const double tesseract::kStrokeWidthTolerance = 1.5 |
Allowed constant change in stroke width to be the same font. Really 1.5 pixels.
Definition at line 50 of file strokewidth.cpp.
const double tesseract::kSubTrainerMarginFraction = 3.0 / 128 |
Definition at line 50 of file lstmtrainer.cpp.
const double tesseract::kTableColumnThreshold = 3.0 |
Definition at line 89 of file tablefind.cpp.
const int tesseract::kTableSize = 4096 |
Definition at line 37 of file functions.h.
const int tesseract::kTabRadiusFactor = 5 |
Definition at line 36 of file tabfind.cpp.
const int tesseract::kTargetXScale = 5 |
Definition at line 70 of file lstmtrainer.cpp.
const int tesseract::kTargetYScale = 100 |
Definition at line 71 of file lstmtrainer.cpp.
const char tesseract::kTesseractReject = '~' |
Character returned when Tesseract couldn't recognize the input as anything.
Definition at line 99 of file baseapi.cpp.
const int tesseract::kTestChar = -1 |
Definition at line 32 of file trainingsampleset.cpp.
const double tesseract::kThickLengthMultiple = 0.75 |
Definition at line 54 of file linefind.cpp.
const int tesseract::kThinLineFraction = 20 |
Denominator applied to the resolution to obtain the maximum width, in pixels, allowed for thin lines.
Definition at line 39 of file linefind.cpp.
const double tesseract::kTinyEnoughTextlineOverlapFraction = 0.25 |
Definition at line 51 of file colpartitiongrid.cpp.
const float tesseract::kUnclearDensityTh = 0.25 |
Definition at line 84 of file equationdetect.cpp.
const int tesseract::kUniChs[] |
Conversion table for non-Latin characters. Maps characters out of the Latin set into the Latin set. TODO(rays) incorporate this translation into unicharset.
Definition at line 1885 of file baseapi.cpp.
const char tesseract::kUniversalAmbigsFile |
Definition at line 26 of file universalambigs.h.
const char tesseract::kUNLVReject = '~' |
Character used by UNLV error counter as a reject.
Definition at line 101 of file baseapi.cpp.
const char tesseract::kUNLVSuspect = '^' |
Character used by UNLV as a suspect marker.
Definition at line 103 of file baseapi.cpp.
const char * tesseract::kUTF8LineSeparator = "\u2028" |
Definition at line 25 of file unicodes.cpp.
const char * tesseract::kUTF8ParagraphSeparator = "\u2029" |
Definition at line 26 of file unicodes.cpp.
const double tesseract::kVerticalSpacing = -0.2 |
Definition at line 38 of file tablerecog.cpp.
const int tesseract::kVLineAlignment = 3 |
Definition at line 47 of file alignedblob.cpp.
const int tesseract::kVLineGutter = 1 |
Definition at line 49 of file alignedblob.cpp.
const int tesseract::kVLineMinLength = 500 |
Definition at line 57 of file alignedblob.cpp.
const int tesseract::kVLineSearchSize = 150 |
Definition at line 51 of file alignedblob.cpp.
const float tesseract::kWorstDictCertainty = -25.0f |
Definition at line 38 of file linerec.cpp.
const int tesseract::kXWinFrameSize = 30 |
Definition at line 53 of file network.cpp.
const int tesseract::kYWinFrameSize = 80 |
Definition at line 54 of file network.cpp.
double tesseract::LogisticTable |
Definition at line 24 of file functions.cpp.
const char* const tesseract::RTLReversePolicyNames[] |
double tesseract::TanhTable |
Definition at line 23 of file functions.cpp.
bool tesseract::textord_show_tables = false |
"Show table regions"
Definition at line 143 of file tablefind.cpp.
bool tesseract::textord_tabfind_find_tables = true |
"run table detection"
Definition at line 65 of file colfind.cpp.
bool tesseract::textord_tabfind_only_strokewidths = false |
"Only run stroke widths"
Definition at line 42 of file strokewidth.cpp.
bool tesseract::textord_tabfind_show_blocks = false |
"Show final block bounds"
Definition at line 64 of file colfind.cpp.
bool tesseract::textord_tabfind_show_color_fit = false |
"Show stroke widths"
Definition at line 32 of file colpartitiongrid.cpp.
bool tesseract::textord_tabfind_show_columns = false |
"Show column bounds"
Definition at line 63 of file colfind.cpp.
bool tesseract::textord_tabfind_show_finaltabs = false |
"Show tab vectors"
Definition at line 64 of file tabfind.cpp.
bool tesseract::textord_tabfind_show_initial_partitions = false |
"Show partition bounds"
Definition at line 58 of file colfind.cpp.
bool tesseract::textord_tabfind_show_initialtabs = false |
"Show tab candidates"
Definition at line 63 of file tabfind.cpp.
int tesseract::textord_tabfind_show_partitions = 0 |
"Show partition bounds, waiting if >1"
Definition at line 62 of file colfind.cpp.
bool tesseract::textord_tabfind_show_reject_blobs = false |
"Show blobs rejected as noise"
Definition at line 60 of file colfind.cpp.
int tesseract::textord_tabfind_show_strokewidths = 0 |
"Show stroke widths"
Definition at line 41 of file strokewidth.cpp.
bool tesseract::textord_tablefind_recognize_tables = false |
"Enables the table recognizer for table layout and filtering."
Definition at line 149 of file tablefind.cpp.
bool tesseract::textord_tablefind_show_mark = false |
"Debug table marking steps in detail"
Definition at line 145 of file tablefind.cpp.
bool tesseract::textord_tablefind_show_stats = false |
"Show page stats used in table finding"
Definition at line 147 of file tablefind.cpp.
double tesseract::textord_tabvector_vertical_box_ratio = 0.5 |
"Fraction of box matches required to declare a line vertical"
Definition at line 59 of file tabvector.cpp.
double tesseract::textord_tabvector_vertical_gap_fraction = 0.5 |
"Max fraction of mean blob width allowed for vertical gaps in vertical text"
Definition at line 56 of file tabvector.cpp.
CCUtilMutex tesseract::tprintfMutex |
Definition at line 59 of file ccutil.cpp.