#include <ligature_table.h>
Definition at line 38 of file ligature_table.h.
◆ LigatureTable()
tesseract::LigatureTable::LigatureTable |
( |
| ) |
|
|
protected |
◆ AddLigatures()
std::string tesseract::LigatureTable::AddLigatures |
( |
const std::string & |
str, |
|
|
const PangoFontInfo * |
font |
|
) |
| const |
Definition at line 156 of file ligature_table.cpp.
159 int len = str.size();
165 if (i + liglen <= len) {
166 std::string lig_cand = str.substr(i, liglen);
169 tlog(3,
"Considering %s -> %s\n", lig_cand.c_str(),
173 if (!font->CanRenderString(it->second.data(), it->second.length()))
178 result += it->second;
179 tlog(2,
"Substituted %s -> %s\n", lig_cand.c_str(),
190 result += str.substr(i, len - i);
LigHash norm_to_lig_table_
◆ Get()
◆ Init()
void tesseract::LigatureTable::Init |
( |
| ) |
|
|
protected |
Definition at line 63 of file ligature_table.cpp.
68 std::string lig8 = EncodeAsUTF8(lig);
69 icu::UnicodeString unicode_lig8(static_cast<UChar32>(lig));
70 icu::UnicodeString normed8_result;
71 icu::ErrorCode status;
72 icu::Normalizer::normalize(unicode_lig8, UNORM_NFKC, 0, normed8_result,
75 normed8_result.toUTF8String(normed8);
80 int lig_length = lig8.length();
81 int norm_length = normed8.size();
82 if (normed8 != lig8 && lig_length > 1 && norm_length > 1) {
LigHash norm_to_lig_table_
static TESS_API const char * kCustomLigatures[][2]
LigHash lig_to_norm_table_
◆ lig_to_norm_table()
const LigHash& tesseract::LigatureTable::lig_to_norm_table |
( |
| ) |
const |
|
inline |
◆ norm_to_lig_table()
const LigHash& tesseract::LigatureTable::norm_to_lig_table |
( |
| ) |
const |
|
inline |
◆ RemoveCustomLigatures()
std::string tesseract::LigatureTable::RemoveCustomLigatures |
( |
const std::string & |
str | ) |
const |
Definition at line 130 of file ligature_table.cpp.
132 UNICHAR::const_iterator it_begin =
UNICHAR::begin(str.c_str(), str.length());
133 UNICHAR::const_iterator it_end =
UNICHAR::end(str.c_str(), str.length());
137 for (UNICHAR::const_iterator it = it_begin; it != it_end; ++it) {
static TESS_API const char * kCustomLigatures[][2]
int get_utf8(char *buf) const
static const_iterator begin(const char *utf8_str, const int byte_length)
static const_iterator end(const char *utf8_str, const int byte_length)
◆ RemoveLigatures()
std::string tesseract::LigatureTable::RemoveLigatures |
( |
const std::string & |
str | ) |
const |
Definition at line 111 of file ligature_table.cpp.
113 UNICHAR::const_iterator it_begin =
UNICHAR::begin(str.c_str(), str.length());
114 UNICHAR::const_iterator it_end =
UNICHAR::end(str.c_str(), str.length());
117 for (UNICHAR::const_iterator it = it_begin; it != it_end; ++it) {
122 result += lig_it->second;
int get_utf8(char *buf) const
static const_iterator begin(const char *utf8_str, const int byte_length)
static const_iterator end(const char *utf8_str, const int byte_length)
LigHash lig_to_norm_table_
◆ instance_
std::unique_ptr< LigatureTable > tesseract::LigatureTable::instance_ |
|
staticprotected |
◆ lig_to_norm_table_
LigHash tesseract::LigatureTable::lig_to_norm_table_ |
|
protected |
◆ max_lig_length_
int tesseract::LigatureTable::max_lig_length_ |
|
protected |
◆ max_norm_length_
int tesseract::LigatureTable::max_norm_length_ |
|
protected |
◆ min_lig_length_
int tesseract::LigatureTable::min_lig_length_ |
|
protected |
◆ min_norm_length_
int tesseract::LigatureTable::min_norm_length_ |
|
protected |
◆ norm_to_lig_table_
LigHash tesseract::LigatureTable::norm_to_lig_table_ |
|
protected |
The documentation for this class was generated from the following files: