21 #ifndef TESSERACT_CCUTIL_NORMSTRNGS_H_
22 #define TESSERACT_CCUTIL_NORMSTRNGS_H_
82 #endif // TESSERACT_CCUTIL_NORMSTRNGS_H_
void UTF8ToUTF32(const char *utf8_str, GenericVector< char32 > *str32)
bool IsUTF8Whitespace(const char *text)
char32 OCRNormalize(char32 ch)
int SpanUTF8Whitespace(const char *text)
int SpanUTF8NotWhitespace(const char *text)
void NormalizeChar32(char32 ch, GenericVector< char32 > *str)
STRING NormalizeUTF8String(const char *str8)
void UTF32ToUTF8(const GenericVector< char32 > &str32, STRING *utf8_str)
bool IsInterchangeValid(const char32 ch)
char32 FullwidthToHalfwidth(const char32 ch)
bool IsValidCodepoint(const char32 ch)
bool IsOCREquivalent(char32 ch1, char32 ch2)
bool IsWhitespace(const char32 ch)
bool IsInterchangeValid7BitAscii(const char32 ch)