Go to the source code of this file.
|
| STRING_PARAM_FLAG (output_unicharset, "unicharset", "Output file path") |
|
| INT_PARAM_FLAG (norm_mode, 1, "Normalization mode: 1=Combine graphemes, " "2=Split graphemes, 3=Pure unicode") |
|
int | main (int argc, char **argv) |
|
◆ INT_PARAM_FLAG()
INT_PARAM_FLAG |
( |
norm_mode |
, |
|
|
1 |
, |
|
|
"Normalization mode: 1=Combine graphemes, " "2=Split graphemes, 3=Pure unicode" |
|
|
) |
| |
◆ main()
int main |
( |
int |
argc, |
|
|
char ** |
argv |
|
) |
| |
Definition at line 97 of file unicharset_extractor.cpp.
98 tesseract::CheckSharedLibraryVersion();
104 "Usage: %s [--output_unicharset filename] [--norm_mode mode]"
105 " box_or_text_file [...]\n",
107 tprintf(
"Where mode means:\n");
108 tprintf(
" 1=combine graphemes (use for Latin and other simple scripts)\n");
109 tprintf(
" 2=split graphemes (use for Indic/Khmer/Myanmar)\n");
110 tprintf(
" 3=pure unicode (use for Arabic/Hebrew/Thai/Tibetan)\n");
111 tprintf(
"Reads box or plain text files to extract the unicharset.\n");
114 return tesseract::Main(argc, argv);
void ParseCommandLineFlags(const char *usage, int *argc, char ***argv, const bool remove_flags)
DLLSYM void tprintf(const char *format,...)
◆ STRING_PARAM_FLAG()
STRING_PARAM_FLAG |
( |
output_unicharset |
, |
|
|
"unicharset" |
, |
|
|
"Output file path" |
|
|
) |
| |