22 #include "allheaders.h"
30 int scaled_yres,
int rect_left,
int rect_top,
31 int rect_width,
int rect_height)
32 : page_res_(page_res),
33 tesseract_(tesseract),
38 include_upper_dots_(false),
39 include_lower_dots_(false),
41 scaled_yres_(scaled_yres),
42 rect_left_(rect_left),
44 rect_width_(rect_width),
45 rect_height_(rect_height) {
61 : page_res_(src.page_res_),
62 tesseract_(src.tesseract_),
64 word_length_(src.word_length_),
65 blob_index_(src.blob_index_),
67 include_upper_dots_(src.include_upper_dots_),
68 include_lower_dots_(src.include_lower_dots_),
70 scaled_yres_(src.scaled_yres_),
71 rect_left_(src.rect_left_),
72 rect_top_(src.rect_top_),
73 rect_width_(src.rect_width_),
74 rect_height_(src.rect_height_) {
114 while (next_para.
cmp(*
it_) <= 0) {
210 if (
Empty(element))
return true;
219 if (next.
Empty(element))
return true;
220 while (element > level) {
266 int* right,
int* bottom)
const {
326 int* right,
int* bottom)
const {
327 return BoundingBox(level, 0, left, top, right, bottom);
332 int* right,
int* bottom)
const {
373 Pta* pta = ptaCreate(it.length());
375 for (it.mark_cycle_pt(); !it.cycled_list(); it.forward(), ++num_pts) {
408 int left, top, right, bottom;
414 Box* box = boxCreate(left, top, right - left, bottom - top);
421 int mask_x = left - mask_box.
left();
424 pixRasterop(pix,
MAX(0, -mask_x),
MAX(0, -mask_y), pixGetWidth(pix),
425 pixGetHeight(pix), PIX_SRC & PIX_DST, mask,
MAX(0, mask_x),
445 int* left,
int* top)
const {
447 if (!
BoundingBox(level, left, top, &right, &bottom))
449 if (original_img ==
NULL)
453 *left =
MAX(*left - padding, 0);
454 *top =
MAX(*top - padding, 0);
457 Box* box = boxCreate(*left, *top, right - *left, bottom - *top);
458 Pix* grey_pix = pixClipRectangle(original_img, box,
NULL);
465 int mask_x = *left - mask_box.
left();
466 int mask_y = *top - (pixGetHeight(original_img) - mask_box.
top());
467 int width = pixGetWidth(grey_pix);
468 int height = pixGetHeight(grey_pix);
469 Pix* resized_mask = pixCreate(width, height, 1);
470 pixRasterop(resized_mask,
MAX(0, -mask_x),
MAX(0, -mask_y), width, height,
471 PIX_SRC, mask,
MAX(0, mask_x),
MAX(0, mask_y));
473 pixDilateBrick(resized_mask, resized_mask, 2 * padding + 1,
475 pixInvert(resized_mask, resized_mask);
476 pixSetMasked(grey_pix, resized_mask,
MAX_UINT32);
477 pixDestroy(&resized_mask);
488 int* x1,
int* y1,
int* x2,
int* y2)
const {
495 int left = box.
left();
497 int right = box.
right();
512 float *deskew_angle)
const {
516 FCOORD up_in_image(0.0, 1.0);
520 if (up_in_image.
x() == 0.0F) {
521 if (up_in_image.
y() > 0.0F) {
526 }
else if (up_in_image.
x() > 0.0F) {
543 bool is_mongolian =
false;
544 *textline_order = is_vertical_text
552 *deskew_angle = -skew.
angle();
558 int *first_line_indent)
const {
577 if (word_res ==
NULL) {
590 tprintf(
"Corrupted word! best_choice[len=%d] = %s, box_word[len=%d]: ",
virtual void RestartParagraph()
tesseract::BoxWord * box_word
bool right_to_left() const
WERD_CHOICE * best_choice
TBOX restricted_bounding_box(bool upper_dots, bool lower_dots) const
bool BoundingBoxInternal(PageIteratorLevel level, int *left, int *top, int *right, int *bottom) const
const TBOX & BlobBox(int index) const
bool Empty(PageIteratorLevel level) const
void rotate(const FCOORD vec)
virtual bool Next(PageIteratorLevel level)
BLOCK_RES * prev_block() const
void unrotate(const FCOORD &vec)
bool BoundingBox(PageIteratorLevel level, int *left, int *top, int *right, int *bottom) const
const PageIterator & operator=(const PageIterator &src)
TBOX bounding_box() const
Pix * GetBinaryImage(PageIteratorLevel level) const
WERD_RES * restart_page_with_empties()
T ClipToRange(const T &x, const T &lower_bound, const T &upper_bound)
bool IsWithinFirstTextlineOfParagraph() const
float base_line(float xpos) const
TBOX restricted_bounding_box(bool upper_dots, bool lower_dots) const
const STRING & unichar_string() const
PolyBlockType BlockType() const
float angle() const
find angle
BLOCK_RES * block() const
bool PositionedAtSameWord(const PAGE_RES_IT *other) const
TESS_LOCAL void BeginWord(int offset)
void rotate(const FCOORD &vec)
FCOORD classify_rotation() const
bool SetWordBlamerBundle(BlamerBundle *blamer_bundle)
inT16 y() const
access_function
FCOORD re_rotation() const
Pta * BlockPolygon() const
Pix * GetImage(PageIteratorLevel level, int padding, Pix *original_img, int *left, int *top) const
TBOX bounding_union(const TBOX &box) const
TBOX bounding_box() const
TBOX restricted_bounding_box(bool upper_dots, bool lower_dots) const
WERD_RES * forward_block()
bool Baseline(PageIteratorLevel level, int *x1, int *y1, int *x2, int *y2) const
ICOORDELT_LIST * points()
int cmp(const PAGE_RES_IT &other) const
PageIterator(PAGE_RES *page_res, Tesseract *tesseract, int scale, int scaled_yres, int rect_left, int rect_top, int rect_width, int rect_height)
WERD_RES * forward_with_empties()
Pix * render_mask(TBOX *mask_box)
bool is_very_first_or_continuation
int Cmp(const PageIterator &other) const
inT16 x() const
access function
const TBOX & bounding_box() const
void Orientation(tesseract::Orientation *orientation, tesseract::WritingDirection *writing_direction, tesseract::TextlineOrder *textline_order, float *deskew_angle) const
void ParagraphInfo(tesseract::ParagraphJustification *justification, bool *is_list_item, bool *is_crown, int *first_line_indent) const
virtual bool IsAtFinalElement(PageIteratorLevel level, PageIteratorLevel element) const
virtual void RestartRow()
const ParagraphModel * model
virtual bool IsAtBeginningOf(PageIteratorLevel level) const
const char * string() const
WERD_RES * forward_paragraph()
POLY_BLOCK * poly_block() const
ROW_RES * prev_row() const
PolyBlockType isA() const
BlamerBundle * blamer_bundle
C_BLOB_LIST * cblob_list()
void rotate(const FCOORD &vec)