22 #ifndef TESSERACT_TRAINING_MASTERTRAINER_H__
23 #define TESSERACT_TRAINING_MASTERTRAINER_H__
46 class ShapeClassifier;
71 bool replicate_samples,
int debug_level);
86 feature_map_.
Init(fs);
98 void AddSample(
bool verification,
const char* unichar_str,
169 int shape_id,
int* num_samples);
179 const char* inttemp_file,
180 const char* pffmtable_file);
189 return master_shapes_;
194 void DebugCanonical(
const char* unichar_str1,
const char* unichar_str2);
195 #ifndef GRAPHICS_DISABLED
207 const char* unichar_str2,
int canonical_font);
208 #endif // GRAPHICS_DISABLED
213 bool replicate_samples,
229 bool replicate_samples,
242 void ReplaceFragmentedSamples();
249 void ClusterShapes(
int min_shapes,
int max_shape_unichars,
276 bool enable_shape_anaylsis_;
278 bool enable_replication_;
284 int prev_unichar_id_;
bool LoadFontInfo(const char *filename)
bool AddSpacingInfo(const char *filename)
TrainingSampleSet * GetSamples()
MasterTrainer(NormalizationMode norm_mode, bool shape_analysis, bool replicate_samples, int debug_level)
CLUSTERER * SetupForClustering(const ShapeTable &shape_table, const FEATURE_DEFS_STRUCT &feature_defs, int shape_id, int *num_samples)
void SetupFlatShapeTable(ShapeTable *shape_table)
ShapeDist(int s1, int s2, float dist)
int GetBestMatchingFontInfoId(const char *filename)
const UNICHARSET & unicharset() const
void LoadUnicharset(const char *filename)
void TestClassifierOnSamples(int report_level, bool replicate_samples, ShapeClassifier *test_classifier, STRING *report_string)
void AddSample(bool verification, const char *unichar_str, TrainingSample *sample)
void WriteInttempAndPFFMTable(const UNICHARSET &unicharset, const UNICHARSET &shape_set, const ShapeTable &shape_table, CLASS_STRUCT *float_classes, const char *inttemp_file, const char *pffmtable_file)
bool Serialize(FILE *fp) const
const UNICHARSET & unicharset() const
void LoadPageImages(const char *filename)
bool DeSerialize(bool swap, FILE *fp)
void ReplicateAndRandomizeSamplesIfRequired()
bool LoadXHeights(const char *filename)
const ShapeTable & master_shapes() const
void ReadTrainingSamples(FILE *fp, const FEATURE_DEFS_STRUCT &feature_defs, bool verification)
void Init(const IntFeatureSpace &feature_space)
double TestClassifier(int report_level, bool replicate_samples, TrainingSampleSet *samples, ShapeClassifier *test_classifier, STRING *report_string)
bool operator<(const ShapeDist &other) const
int GetFontInfoId(const char *font_name)
void DisplaySamples(const char *unichar_str1, int cloud_font, const char *unichar_str2, int canonical_font)
void DebugCanonical(const char *unichar_str1, const char *unichar_str2)
void SetFeatureSpace(const IntFeatureSpace &fs)
FEATURE_DEFS_STRUCT feature_defs
float ShapeDistance(const ShapeTable &shapes, int s1, int s2)