tesseract
5.0.0-alpha-619-ge9db
|
Go to the documentation of this file.
19 #ifndef TESSERACT_CCUTIL_UNICHAR_H_
20 #define TESSERACT_CCUTIL_UNICHAR_H_
32 #define UNICHAR_LEN 30
39 static const int INVALID_UNICHAR_ID = -1;
41 static const char INVALID_UNICHAR[] = "__INVALID_UNICHAR__";
143 return lhs.it_ == rhs.it_;
146 return !(lhs == rhs);
159 static const_iterator begin(const char* utf8_str, int byte_length);
160 static const_iterator end(const char* utf8_str, int byte_length);
178 #endif // TESSERACT_CCUTIL_UNICHAR_H_
const char * utf8() const
static const_iterator begin(const char *utf8_str, int byte_length)
static std::vector< char32 > UTF8ToUTF32(const char *utf8_str)
static const_iterator end(const char *utf8_str, int byte_length)
friend bool operator==(const CI &lhs, const CI &rhs)
const_iterator & operator++()
const char * utf8_data() const
static int utf8_step(const char *utf8_str)
static std::string UTF32ToUTF8(const std::vector< char32 > &str32)
int get_utf8(char *buf) const
friend bool operator!=(const CI &lhs, const CI &rhs)