All Classes Namespaces Files Functions Variables Typedefs Enumerations Enumerator Friends Macros Modules Pages
tesseract::GeometricClassifierState Struct Reference

Public Member Functions

 GeometricClassifierState (int dbg_level, GenericVector< RowScratchRegisters > *r, int r_start, int r_end)
 
void AssumeLeftJustification ()
 
void AssumeRightJustification ()
 
const GenericVector< Cluster > & AlignTabs () const
 
const GenericVector< Cluster > & OffsideTabs () const
 
bool IsFullRow (int i) const
 
int AlignsideTabIndex (int row_idx) const
 
bool FirstWordWouldHaveFit (int row_a, int row_b)
 
void PrintRows () const
 
void Fail (int min_debug_level, const char *why) const
 
ParagraphModel Model () const
 

Public Attributes

int debug_level
 
GenericVector
< RowScratchRegisters > * 
rows
 
int row_start
 
int row_end
 
int tolerance
 
bool ltr
 
GenericVector< Clusterleft_tabs
 
GenericVector< Clusterright_tabs
 
tesseract::ParagraphJustification just
 
int margin
 
int first_indent
 
int body_indent
 
int eop_threshold
 

Detailed Description

Definition at line 854 of file paragraphs.cpp.

Constructor & Destructor Documentation

tesseract::GeometricClassifierState::GeometricClassifierState ( int  dbg_level,
GenericVector< RowScratchRegisters > *  r,
int  r_start,
int  r_end 
)
inline

Definition at line 855 of file paragraphs.cpp.

858  : debug_level(dbg_level), rows(r), row_start(r_start), row_end(r_end),
859  margin(0) {
860  tolerance = InterwordSpace(*r, r_start, r_end);
861  CalculateTabStops(r, r_start, r_end, tolerance,
862  &left_tabs, &right_tabs);
863  if (debug_level >= 3) {
864  tprintf("Geometry: TabStop cluster tolerance = %d; "
865  "%d left tabs; %d right tabs\n",
866  tolerance, left_tabs.size(), right_tabs.size());
867  }
868  ltr = (*r)[r_start].ri_->ltr;
869  }
void CalculateTabStops(GenericVector< RowScratchRegisters > *rows, int row_start, int row_end, int tolerance, GenericVector< Cluster > *left_tabs, GenericVector< Cluster > *right_tabs)
Definition: paragraphs.cpp:691
GenericVector< RowScratchRegisters > * rows
Definition: paragraphs.cpp:932
#define tprintf(...)
Definition: tprintf.h:31
GenericVector< Cluster > left_tabs
Definition: paragraphs.cpp:945
int InterwordSpace(const GenericVector< RowScratchRegisters > &rows, int row_start, int row_end)
GenericVector< Cluster > right_tabs
Definition: paragraphs.cpp:946

Member Function Documentation

int tesseract::GeometricClassifierState::AlignsideTabIndex ( int  row_idx) const
inline

Definition at line 904 of file paragraphs.cpp.

904  {
905  return ClosestCluster(AlignTabs(), (*rows)[row_idx].AlignsideIndent(just));
906  }
GenericVector< RowScratchRegisters > * rows
Definition: paragraphs.cpp:932
const GenericVector< Cluster > & AlignTabs() const
Definition: paragraphs.cpp:882
int ClosestCluster(const GenericVector< Cluster > &clusters, int value)
Definition: paragraphs.cpp:665
tesseract::ParagraphJustification just
Definition: paragraphs.cpp:949
const GenericVector<Cluster>& tesseract::GeometricClassifierState::AlignTabs ( ) const
inline

Definition at line 882 of file paragraphs.cpp.

882  {
884  return left_tabs;
885  }
GenericVector< Cluster > left_tabs
Definition: paragraphs.cpp:945
tesseract::ParagraphJustification just
Definition: paragraphs.cpp:949
GenericVector< Cluster > right_tabs
Definition: paragraphs.cpp:946
void tesseract::GeometricClassifierState::AssumeLeftJustification ( )
inline

Definition at line 871 of file paragraphs.cpp.

void tesseract::GeometricClassifierState::AssumeRightJustification ( )
inline

Definition at line 876 of file paragraphs.cpp.

void tesseract::GeometricClassifierState::Fail ( int  min_debug_level,
const char *  why 
) const
inline

Definition at line 917 of file paragraphs.cpp.

917  {
918  if (debug_level < min_debug_level) return;
919  tprintf("# %s\n", why);
920  PrintRows();
921  }
#define tprintf(...)
Definition: tprintf.h:31
bool tesseract::GeometricClassifierState::FirstWordWouldHaveFit ( int  row_a,
int  row_b 
)
inline

Definition at line 910 of file paragraphs.cpp.

910  {
912  (*rows)[row_a], (*rows)[row_b], just);
913  }
bool FirstWordWouldHaveFit(const RowScratchRegisters &before, const RowScratchRegisters &after)
GenericVector< RowScratchRegisters > * rows
Definition: paragraphs.cpp:932
tesseract::ParagraphJustification just
Definition: paragraphs.cpp:949
bool tesseract::GeometricClassifierState::IsFullRow ( int  i) const
inline

Definition at line 899 of file paragraphs.cpp.

899  {
900  return ClosestCluster(left_tabs, (*rows)[i].lindent_) == 0 &&
901  ClosestCluster(right_tabs, (*rows)[i].rindent_) == 0;
902  }
GenericVector< RowScratchRegisters > * rows
Definition: paragraphs.cpp:932
GenericVector< Cluster > left_tabs
Definition: paragraphs.cpp:945
int ClosestCluster(const GenericVector< Cluster > &clusters, int value)
Definition: paragraphs.cpp:665
GenericVector< Cluster > right_tabs
Definition: paragraphs.cpp:946
ParagraphModel tesseract::GeometricClassifierState::Model ( ) const
inline
const GenericVector<Cluster>& tesseract::GeometricClassifierState::OffsideTabs ( ) const
inline

Definition at line 892 of file paragraphs.cpp.

892  {
894  return right_tabs;
895  }
GenericVector< Cluster > left_tabs
Definition: paragraphs.cpp:945
tesseract::ParagraphJustification just
Definition: paragraphs.cpp:949
GenericVector< Cluster > right_tabs
Definition: paragraphs.cpp:946
void tesseract::GeometricClassifierState::PrintRows ( ) const
inline

Definition at line 915 of file paragraphs.cpp.

915 { PrintRowRange(*rows, row_start, row_end); }
GenericVector< RowScratchRegisters > * rows
Definition: paragraphs.cpp:932

Member Data Documentation

int tesseract::GeometricClassifierState::body_indent

Definition at line 952 of file paragraphs.cpp.

int tesseract::GeometricClassifierState::debug_level

Definition at line 928 of file paragraphs.cpp.

int tesseract::GeometricClassifierState::eop_threshold

Definition at line 955 of file paragraphs.cpp.

int tesseract::GeometricClassifierState::first_indent

Definition at line 951 of file paragraphs.cpp.

tesseract::ParagraphJustification tesseract::GeometricClassifierState::just

Definition at line 949 of file paragraphs.cpp.

GenericVector<Cluster> tesseract::GeometricClassifierState::left_tabs

Definition at line 945 of file paragraphs.cpp.

bool tesseract::GeometricClassifierState::ltr

Definition at line 941 of file paragraphs.cpp.

int tesseract::GeometricClassifierState::margin

Definition at line 950 of file paragraphs.cpp.

GenericVector<Cluster> tesseract::GeometricClassifierState::right_tabs

Definition at line 946 of file paragraphs.cpp.

int tesseract::GeometricClassifierState::row_end

Definition at line 934 of file paragraphs.cpp.

int tesseract::GeometricClassifierState::row_start

Definition at line 933 of file paragraphs.cpp.

GenericVector<RowScratchRegisters>* tesseract::GeometricClassifierState::rows

Definition at line 932 of file paragraphs.cpp.

int tesseract::GeometricClassifierState::tolerance

Definition at line 937 of file paragraphs.cpp.


The documentation for this struct was generated from the following file: