tessapi/4.0.0/a01145_source.html

 // Copyright 2008 Google Inc. All Rights Reserved.
 // Author: shobhitsaxena@google.com (Shobhit Saxena)
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 // http://www.apache.org/licenses/LICENSE-2.0
 // Unless required by applicable law or agreed to in writing, software
 // distributed under the License is distributed on an "AS IS" BASIS,
 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 // See the License for the specific language governing permissions and
 // limitations under the License.

 #ifndef TESSERACT_TEXTORD_DEVNAGARI_PROCESSING_H_
 #define TESSERACT_TEXTORD_DEVNAGARI_PROCESSING_H_

 #include "allheaders.h"
 #include "debugpixa.h"
 #include "ocrblock.h"
 #include "params.h"

 struct Pix;
 struct Box;
 struct Boxa;

 extern
 INT_VAR_H(devanagari_split_debuglevel, 0,
           "Debug level for split shiro-rekha process.");

 extern
 BOOL_VAR_H(devanagari_split_debugimage, 0,
            "Whether to create a debug image for split shiro-rekha process.");

 class TBOX;

 namespace tesseract {

 class PixelHistogram {
  public:
   PixelHistogram() {
     hist_ = nullptr;
     length_ = 0;
   }

   ~PixelHistogram() {
     Clear();
   }

   void Clear() {
     delete[] hist_;
     length_ = 0;
   }

   int* hist() const { return hist_; }

   int length() const {
     return length_;
   }

   // Methods to construct histograms from images. These clear any existing data.
   void ConstructVerticalCountHist(Pix* pix);
   void ConstructHorizontalCountHist(Pix* pix);

   // This method returns the global-maxima for the histogram. The frequency of
   // the global maxima is returned in count, if specified.
   int GetHistogramMaximum(int* count) const;

  private:
   int* hist_;
   int length_;
 };

 class ShiroRekhaSplitter {
  public:
   enum SplitStrategy {
     NO_SPLIT = 0,   // No splitting is performed for the phase.
     MINIMAL_SPLIT,  // Blobs are split minimally.
     MAXIMAL_SPLIT   // Blobs are split maximally.
   };

   ShiroRekhaSplitter();
   virtual ~ShiroRekhaSplitter();

   // Top-level method to perform splitting based on current settings.
   // Returns true if a split was actually performed.
   // If split_for_pageseg is true, the pageseg_split_strategy_ is used for
   // splitting. If false, the ocr_split_strategy_ is used.
   bool Split(bool split_for_pageseg, DebugPixa* pixa_debug);

   // Clears the memory held by this object.
   void Clear();

   // Refreshes the words in the segmentation block list by using blobs in the
   // input blob list.
   // The segmentation block list must be set.
   void RefreshSegmentationWithNewBlobs(C_BLOB_LIST* new_blobs);

   // Returns true if the split strategies for pageseg and ocr are different.
   bool HasDifferentSplitStrategies() const {
     return pageseg_split_strategy_ != ocr_split_strategy_;
   }

   // This only keeps a copy of the block list pointer. At split call, the list
   // object should still be alive. This block list is used as a golden
   // segmentation when performing splitting.
   void set_segmentation_block_list(BLOCK_LIST* block_list) {
     segmentation_block_list_ = block_list;
   }

   static const int kUnspecifiedXheight = -1;

   void set_global_xheight(int xheight) {
     global_xheight_ = xheight;
   }

   void set_perform_close(bool perform) {
     perform_close_ = perform;
   }

   // Returns the image obtained from shiro-rekha splitting. The returned object
   // is owned by this class. Callers may want to clone the returned pix to keep
   // it alive beyond the life of ShiroRekhaSplitter object.
   Pix* splitted_image() {
     return splitted_image_;
   }

   // On setting the input image, a clone of it is owned by this class.
   void set_orig_pix(Pix* pix);

   // Returns the input image provided to the object. This object is owned by
   // this class. Callers may want to clone the returned pix to work with it.
   Pix* orig_pix() {
     return orig_pix_;
   }

   SplitStrategy ocr_split_strategy() const {
     return ocr_split_strategy_;
   }

   void set_ocr_split_strategy(SplitStrategy strategy) {
     ocr_split_strategy_ = strategy;
   }

   SplitStrategy pageseg_split_strategy() const {
     return pageseg_split_strategy_;
   }

   void set_pageseg_split_strategy(SplitStrategy strategy) {
     pageseg_split_strategy_ = strategy;
   }

   BLOCK_LIST* segmentation_block_list() {
     return segmentation_block_list_;
   }

   // This method returns the computed mode-height of blobs in the pix.
   // It also prunes very small blobs from calculation. Could be used to provide
   // a global xheight estimate for images which have the same point-size text.
   static int GetModeHeight(Pix* pix);

  private:
   // Method to perform a close operation on the input image. The xheight
   // estimate decides the size of sel used.
   static void PerformClose(Pix* pix, int xheight_estimate);

   // This method resolves the cc bbox to a particular row and returns the row's
   // xheight. This uses block_list_ if available, else just returns the
   // global_xheight_ estimate currently set in the object.
   int GetXheightForCC(Box* cc_bbox);

   // Returns a list of regions (boxes) which should be cleared in the original
   // image so as to perform shiro-rekha splitting. Pix is assumed to carry one
   // (or less) word only. Xheight measure could be the global estimate, the row
   // estimate, or unspecified. If unspecified, over splitting may occur, since a
   // conservative estimate of stroke width along with an associated multiplier
   // is used in its place. It is advisable to have a specified xheight when
   // splitting for classification/training.
   void SplitWordShiroRekha(SplitStrategy split_strategy,
                            Pix* pix,
                            int xheight,
                            int word_left,
                            int word_top,
                            Boxa* regions_to_clear);

   // Returns a new box object for the corresponding TBOX, based on the original
   // image's coordinate system.
   Box* GetBoxForTBOX(const TBOX& tbox) const;

   // This method returns y-extents of the shiro-rekha computed from the input
   // word image.
   static void GetShiroRekhaYExtents(Pix* word_pix,
                                     int* shirorekha_top,
                                     int* shirorekha_bottom,
                                     int* shirorekha_ylevel);

   Pix* orig_pix_;         // Just a clone of the input image passed.
   Pix* splitted_image_;   // Image produced after the last splitting round. The
                           // object is owned by this class.
   SplitStrategy pageseg_split_strategy_;
   SplitStrategy ocr_split_strategy_;
   Pix* debug_image_;
   // This block list is used as a golden segmentation when performing splitting.
   BLOCK_LIST* segmentation_block_list_;
   int global_xheight_;
   bool perform_close_;  // Whether a morphological close operation should be
                         // performed before CCs are run through splitting.
 };

 }  // namespace tesseract.

 #endif  // TESSERACT_TEXTORD_DEVNAGARI_PROCESSING_H_
tesseract::PixelHistogram::ConstructVerticalCountHist
void ConstructVerticalCountHist(Pix *pix)
Definition: devanagari_processing.cpp:469

tesseract::ShiroRekhaSplitter::kUnspecifiedXheight
static const int kUnspecifiedXheight
Definition: devanagari_processing.h:109

INT_VAR_H
#define INT_VAR_H(name, val, comment)
Definition: params.h:264

devanagari_split_debuglevel
int devanagari_split_debuglevel
Definition: devanagari_processing.cpp:34

tesseract::ShiroRekhaSplitter::NO_SPLIT
Definition: devanagari_processing.h:75

tesseract::ShiroRekhaSplitter::splitted_image
Pix * splitted_image()
Definition: devanagari_processing.h:122

tesseract::ShiroRekhaSplitter::segmentation_block_list
BLOCK_LIST * segmentation_block_list()
Definition: devanagari_processing.h:151

BOOL_VAR_H
#define BOOL_VAR_H(name, val, comment)
Definition: params.h:267

count
int count(LIST var_list)
Definition: oldlist.cpp:98

tesseract::ShiroRekhaSplitter::RefreshSegmentationWithNewBlobs
void RefreshSegmentationWithNewBlobs(C_BLOB_LIST *new_blobs)
Definition: devanagari_processing.cpp:356

TBOX
Definition: rect.h:34

tesseract::ShiroRekhaSplitter::ocr_split_strategy
SplitStrategy ocr_split_strategy() const
Definition: devanagari_processing.h:135

tesseract::ShiroRekhaSplitter::MINIMAL_SPLIT
Definition: devanagari_processing.h:76

tesseract::ShiroRekhaSplitter::~ShiroRekhaSplitter
virtual ~ShiroRekhaSplitter()
Definition: devanagari_processing.cpp:52

tesseract::DebugPixa
Definition: debugpixa.h:10

tesseract::PixelHistogram::length
int length() const
Definition: devanagari_processing.h:55

tesseract::PixelHistogram::~PixelHistogram
~PixelHistogram()
Definition: devanagari_processing.h:44

tesseract::ShiroRekhaSplitter::set_global_xheight
void set_global_xheight(int xheight)
Definition: devanagari_processing.h:111

tesseract::PixelHistogram::Clear
void Clear()
Definition: devanagari_processing.h:48

tesseract::ShiroRekhaSplitter::HasDifferentSplitStrategies
bool HasDifferentSplitStrategies() const
Definition: devanagari_processing.h:98

tesseract::PixelHistogram
Definition: devanagari_processing.h:37

tesseract::ShiroRekhaSplitter::GetModeHeight
static int GetModeHeight(Pix *pix)
Definition: devanagari_processing.cpp:410

tesseract::ShiroRekhaSplitter::set_perform_close
void set_perform_close(bool perform)
Definition: devanagari_processing.h:115

tesseract::ShiroRekhaSplitter::MAXIMAL_SPLIT
Definition: devanagari_processing.h:77

tesseract::PixelHistogram::GetHistogramMaximum
int GetHistogramMaximum(int *count) const
Definition: devanagari_processing.cpp:455

tesseract::ShiroRekhaSplitter::ShiroRekhaSplitter
ShiroRekhaSplitter()
Definition: devanagari_processing.cpp:41

tesseract::ShiroRekhaSplitter::set_orig_pix
void set_orig_pix(Pix *pix)
Definition: devanagari_processing.cpp:68

ocrblock.h

debugpixa.h

tesseract::ShiroRekhaSplitter::orig_pix
Pix * orig_pix()
Definition: devanagari_processing.h:131

tesseract
Definition: baseapi.cpp:94

tesseract::ShiroRekhaSplitter::pageseg_split_strategy
SplitStrategy pageseg_split_strategy() const
Definition: devanagari_processing.h:143

tesseract::ShiroRekhaSplitter::set_pageseg_split_strategy
void set_pageseg_split_strategy(SplitStrategy strategy)
Definition: devanagari_processing.h:147

params.h

tesseract::PixelHistogram::PixelHistogram
PixelHistogram()
Definition: devanagari_processing.h:39

tesseract::ShiroRekhaSplitter::Split
bool Split(bool split_for_pageseg, DebugPixa *pixa_debug)
Definition: devanagari_processing.cpp:80

tesseract::ShiroRekhaSplitter::SplitStrategy
SplitStrategy
Definition: devanagari_processing.h:74

tesseract::ShiroRekhaSplitter
Definition: devanagari_processing.h:72

tesseract::PixelHistogram::ConstructHorizontalCountHist
void ConstructHorizontalCountHist(Pix *pix)
Definition: devanagari_processing.cpp:487

tesseract::ShiroRekhaSplitter::set_ocr_split_strategy
void set_ocr_split_strategy(SplitStrategy strategy)
Definition: devanagari_processing.h:139

devanagari_split_debugimage
bool devanagari_split_debugimage
Definition: devanagari_processing.cpp:37

tesseract::PixelHistogram::hist
int * hist() const
Definition: devanagari_processing.h:53

tesseract::ShiroRekhaSplitter::Clear
void Clear()
Definition: devanagari_processing.cpp:56

tesseract::ShiroRekhaSplitter::set_segmentation_block_list
void set_segmentation_block_list(BLOCK_LIST *block_list)
Definition: devanagari_processing.h:105