tesseract
4.0.0-1-g2a2b
|
#include "cluster.h"
#include "commandlineflags.h"
#include "featdefs.h"
#include "intproto.h"
#include "oldlist.h"
Go to the source code of this file.
Classes | |
struct | LABELEDLISTNODE |
struct | MERGE_CLASS_NODE |
Namespaces | |
tesseract | |
Typedefs | |
typedef struct LABELEDLISTNODE * | LABELEDLIST |
using | MERGE_CLASS = MERGE_CLASS_NODE * |
Functions | |
void | ParseArguments (int *argc, char ***argv) |
ShapeTable * | tesseract::LoadShapeTable (const STRING &file_prefix) |
void | tesseract::WriteShapeTable (const STRING &file_prefix, const ShapeTable &shape_table) |
MasterTrainer * | tesseract::LoadTrainingData (int argc, const char *const *argv, bool replication, ShapeTable **shape_table, STRING *file_prefix) |
const char * | GetNextFilename (int argc, const char *const *argv) |
LABELEDLIST | FindList (LIST List, char *Label) |
LABELEDLIST | NewLabeledList (const char *Label) |
void | ReadTrainingSamples (const FEATURE_DEFS_STRUCT &feature_defs, const char *feature_name, int max_samples, UNICHARSET *unicharset, FILE *file, LIST *training_samples) |
void | WriteTrainingSamples (const FEATURE_DEFS_STRUCT &FeatureDefs, char *Directory, LIST CharList, const char *program_feature_type) |
void | FreeTrainingSamples (LIST CharList) |
void | FreeLabeledList (LABELEDLIST LabeledList) |
void | FreeLabeledClassList (LIST ClassListList) |
CLUSTERER * | SetUpForClustering (const FEATURE_DEFS_STRUCT &FeatureDefs, LABELEDLIST CharSample, const char *program_feature_type) |
LIST | RemoveInsignificantProtos (LIST ProtoList, bool KeepSigProtos, bool KeepInsigProtos, int N) |
void | CleanUpUnusedData (LIST ProtoList) |
void | MergeInsignificantProtos (LIST ProtoList, const char *label, CLUSTERER *Clusterer, CLUSTERCONFIG *Config) |
MERGE_CLASS | FindClass (LIST List, const char *Label) |
MERGE_CLASS | NewLabeledClass (const char *Label) |
CLASS_STRUCT * | SetUpForFloat2Int (const UNICHARSET &unicharset, LIST LabeledClassList) |
void | Normalize (float *Values) |
void | FreeNormProtoList (LIST CharList) |
void | AddToNormProtosList (LIST *NormProtoList, LIST ProtoList, char *CharName) |
int | NumberOfProtos (LIST ProtoList, bool CountSigProtos, bool CountInsigProtos) |
void | allocNormProtos () |
Variables | |
FEATURE_DEFS_STRUCT | feature_defs |
CLUSTERCONFIG | Config |
typedef struct LABELEDLISTNODE * LABELEDLIST |
using MERGE_CLASS = MERGE_CLASS_NODE* |
Definition at line 92 of file commontraining.h.
Definition at line 836 of file commontraining.cpp.
void allocNormProtos | ( | ) |
void CleanUpUnusedData | ( | LIST | ProtoList | ) |
Definition at line 608 of file commontraining.cpp.
MERGE_CLASS FindClass | ( | LIST | List, |
const char * | Label | ||
) |
Definition at line 691 of file commontraining.cpp.
LABELEDLIST FindList | ( | LIST | List, |
char * | Label | ||
) |
This routine searches through a list of labeled lists to find a list with the specified label. If a matching labeled list cannot be found, nullptr is returned.
List | list to search |
Label | label to search for |
Definition at line 348 of file commontraining.cpp.
void FreeLabeledClassList | ( | LIST | ClassList | ) |
This routine deallocates all of the space allocated to the specified list of training samples.
ClassList | list of all fonts in document |
Definition at line 724 of file commontraining.cpp.
void FreeLabeledList | ( | LABELEDLIST | LabeledList | ) |
This routine deallocates all of the memory consumed by a labeled list. It does not free any memory which may be consumed by the items in the list.
LabeledList | labeled list to be freed |
Definition at line 489 of file commontraining.cpp.
void FreeNormProtoList | ( | LIST | CharList | ) |
Definition at line 820 of file commontraining.cpp.
void FreeTrainingSamples | ( | LIST | CharList | ) |
This routine deallocates all of the space allocated to the specified list of training samples.
CharList | list of all fonts in document |
Definition at line 462 of file commontraining.cpp.
const char* GetNextFilename | ( | int | argc, |
const char *const * | argv | ||
) |
This routine returns the next command line argument. If there are no remaining command line arguments, it returns nullptr. This routine should only be called after all option arguments have been parsed and removed with ParseArguments.
Globals:
Definition at line 331 of file commontraining.cpp.
void MergeInsignificantProtos | ( | LIST | ProtoList, |
const char * | label, | ||
CLUSTERER * | Clusterer, | ||
CLUSTERCONFIG * | Config | ||
) |
Definition at line 541 of file commontraining.cpp.
MERGE_CLASS NewLabeledClass | ( | const char * | Label | ) |
Definition at line 705 of file commontraining.cpp.
LABELEDLIST NewLabeledList | ( | const char * | Label | ) |
This routine allocates a new, empty labeled list and gives it the specified label.
Label | label for new list |
Definition at line 369 of file commontraining.cpp.
void Normalize | ( | float * | Values | ) |
Definition at line 803 of file commontraining.cpp.
int NumberOfProtos | ( | LIST | ProtoList, |
bool | CountSigProtos, | ||
bool | CountInsigProtos | ||
) |
Definition at line 854 of file commontraining.cpp.
void ParseArguments | ( | int * | argc, |
char *** | argv | ||
) |
This routine parses the command line arguments that were passed to the program and uses them to set relevant training-related global parameters.
Globals:
argc | number of command line arguments to parse |
argv | command line arguments |
Definition at line 130 of file commontraining.cpp.
void ReadTrainingSamples | ( | const FEATURE_DEFS_STRUCT & | feature_definitions, |
const char * | feature_name, | ||
int | max_samples, | ||
UNICHARSET * | unicharset, | ||
FILE * | file, | ||
LIST * | training_samples | ||
) |
This routine reads training samples from a file and places them into a data structure which organizes the samples by FontName and CharName. The routine itself returns void; the resulting data structure is passed back to the caller through training_samples.
file | open text file to read samples from |
feature_definitions | |
feature_name | |
max_samples | |
unicharset | |
training_samples |
Definition at line 399 of file commontraining.cpp.
Definition at line 626 of file commontraining.cpp.
CLUSTERER* SetUpForClustering | ( | const FEATURE_DEFS_STRUCT & | FeatureDefs, |
LABELEDLIST | char_sample, | ||
const char * | program_feature_type | ||
) |
This routine reads samples from a LABELEDLIST and enters those samples into a clusterer data structure. This data structure is then returned to the caller.
char_sample | LABELEDLIST that holds all the feature information for a given character. |
FeatureDefs | |
program_feature_type | |
Definition at line 507 of file commontraining.cpp.
CLASS_STRUCT* SetUpForFloat2Int | ( | const UNICHARSET & | unicharset, |
LIST | LabeledClassList | ||
) |
Definition at line 740 of file commontraining.cpp.
void WriteTrainingSamples | ( | const FEATURE_DEFS_STRUCT & | FeatureDefs, |
char * | Directory, | ||
LIST | CharList, | ||
const char * | program_feature_type | ||
) |
CLUSTERCONFIG Config |
Definition at line 95 of file commontraining.cpp.
FEATURE_DEFS_STRUCT feature_defs |
Definition at line 96 of file commontraining.cpp.