#include <trainingsample.h>
Definition at line 53 of file trainingsample.h.
| tesseract::TrainingSample::TrainingSample |
( |
| ) |
|
|
inline |
Definition at line 55 of file trainingsample.h.
56 : class_id_(INVALID_UNICHAR_ID), font_id_(0), page_num_(0),
57 num_features_(0), num_micro_features_(0),
58 features_(
NULL), micro_features_(
NULL), weight_(1.0),
59 max_dist_(0.0), sample_index_(0),
60 features_are_indexed_(
false), features_are_mapped_(
false),
| tesseract::TrainingSample::~TrainingSample |
( |
| ) |
|
| const TBOX& tesseract::TrainingSample::bounding_box |
( |
| ) |
const |
|
inline |
| UNICHAR_ID tesseract::TrainingSample::class_id |
( |
| ) |
const |
|
inline |
| float tesseract::TrainingSample::cn_feature |
( |
int |
index | ) |
const |
|
inline |
Definition at line 154 of file trainingsample.cpp.
156 sample->class_id_ = class_id_;
157 sample->font_id_ = font_id_;
158 sample->weight_ = weight_;
159 sample->sample_index_ = sample_index_;
160 sample->num_features_ = num_features_;
161 if (num_features_ > 0) {
163 memcpy(sample->features_, features_, num_features_ *
sizeof(features_[0]));
165 sample->num_micro_features_ = num_micro_features_;
166 if (num_micro_features_ > 0) {
167 sample->micro_features_ =
new MicroFeature[num_micro_features_];
168 memcpy(sample->micro_features_, micro_features_,
169 num_micro_features_ *
sizeof(micro_features_[0]));
171 memcpy(sample->cn_feature_, cn_feature_,
sizeof(*cn_feature_) * kNumCNParams);
172 memcpy(sample->geo_feature_, geo_feature_,
sizeof(*geo_feature_) *
GeoCount);
float MicroFeature[MFCount]
Definition at line 115 of file trainingsample.cpp.
121 memcpy(sample->features_, features,
num_features *
sizeof(features[0]));
125 sample->features_are_indexed_ =
false;
126 sample->features_are_mapped_ =
false;
| bool tesseract::TrainingSample::DeSerialize |
( |
bool |
swap, |
|
|
FILE * |
fp |
|
) |
| |
Definition at line 85 of file trainingsample.cpp.
86 if (fread(&class_id_,
sizeof(class_id_), 1, fp) != 1)
return false;
87 if (fread(&font_id_,
sizeof(font_id_), 1, fp) != 1)
return false;
88 if (fread(&page_num_,
sizeof(page_num_), 1, fp) != 1)
return false;
89 if (!bounding_box_.
DeSerialize(swap, fp))
return false;
90 if (fread(&num_features_,
sizeof(num_features_), 1, fp) != 1)
return false;
91 if (fread(&num_micro_features_,
sizeof(num_micro_features_), 1, fp) != 1)
94 ReverseN(&class_id_,
sizeof(class_id_));
95 ReverseN(&num_features_,
sizeof(num_features_));
96 ReverseN(&num_micro_features_,
sizeof(num_micro_features_));
100 if (fread(features_,
sizeof(*features_), num_features_, fp) != num_features_)
102 delete [] micro_features_;
103 micro_features_ =
new MicroFeature[num_micro_features_];
104 if (fread(micro_features_,
sizeof(*micro_features_), num_micro_features_,
105 fp) != num_micro_features_)
107 if (fread(cn_feature_,
sizeof(*cn_feature_), kNumCNParams, fp) !=
108 kNumCNParams)
return false;
void ReverseN(void *ptr, int num_bytes)
bool DeSerialize(bool swap, FILE *fp)
float MicroFeature[MFCount]
| TrainingSample * tesseract::TrainingSample::DeSerializeCreate |
( |
bool |
swap, |
|
|
FILE * |
fp |
|
) |
| |
|
static |
Definition at line 76 of file trainingsample.cpp.
78 if (sample->DeSerialize(swap, fp))
return sample;
Definition at line 288 of file trainingsample.cpp.
290 #ifndef GRAPHICS_DISABLED
291 for (
int f = 0;
f < num_features_; ++
f) {
294 #endif // GRAPHICS_DISABLED
void RenderIntFeature(ScrollView *window, const INT_FEATURE_STRUCT *Feature, ScrollView::Color color)
| void tesseract::TrainingSample::ExtractCharDesc |
( |
int |
feature_type, |
|
|
int |
micro_type, |
|
|
int |
cn_type, |
|
|
int |
geo_type, |
|
|
CHAR_DESC_STRUCT * |
char_desc |
|
) |
| |
Definition at line 177 of file trainingsample.cpp.
183 if (features_ !=
NULL)
delete [] features_;
185 if (char_features ==
NULL) {
186 tprintf(
"Error: no features to train on of type %s\n",
193 for (
int f = 0;
f < num_features_; ++
f) {
204 if (micro_features_ !=
NULL)
delete [] micro_features_;
205 char_features = char_desc->
FeatureSets[micro_type];
206 if (char_features ==
NULL) {
207 tprintf(
"Error: no features to train on of type %s\n",
209 num_micro_features_ = 0;
210 micro_features_ =
NULL;
213 micro_features_ =
new MicroFeature[num_micro_features_];
214 for (
int f = 0;
f < num_micro_features_; ++
f) {
215 for (
int d = 0; d <
MFCount; ++d) {
222 if (char_features ==
NULL) {
223 tprintf(
"Error: no CN feature to train on.\n");
234 if (char_features ==
NULL) {
235 tprintf(
"Error: no Geo feature to train on.\n");
242 features_are_indexed_ =
false;
243 features_are_mapped_ =
false;
const char * kMicroFeatureType
const char * kIntFeatureType
FEATURE_SET FeatureSets[NUM_FEATURE_TYPES]
DLLSYM void tprintf(const char *format,...)
float MicroFeature[MFCount]
| bool tesseract::TrainingSample::features_are_mapped |
( |
| ) |
const |
|
inline |
| int tesseract::TrainingSample::font_id |
( |
| ) |
const |
|
inline |
| int tesseract::TrainingSample::geo_feature |
( |
int |
index | ) |
const |
|
inline |
| Pix * tesseract::TrainingSample::GetSamplePix |
( |
int |
padding, |
|
|
Pix * |
page_pix |
|
) |
| const |
Definition at line 301 of file trainingsample.cpp.
302 if (page_pix ==
NULL)
304 int page_width = pixGetWidth(page_pix);
305 int page_height = pixGetHeight(page_pix);
307 padded_box.
pad(padding, padding);
309 TBOX page_box(0, 0, page_width, page_height);
310 padded_box &= page_box;
311 Box* box = boxCreate(page_box.left(), page_height - page_box.top(),
312 page_box.width(), page_box.height());
313 Pix* sample_pix = pixClipRectangle(page_pix, box,
NULL);
const TBOX & bounding_box() const
void pad(int xpad, int ypad)
| const GenericVector<int>& tesseract::TrainingSample::indexed_features |
( |
| ) |
const |
|
inline |
| void tesseract::TrainingSample::IndexFeatures |
( |
const IntFeatureSpace & |
feature_space | ) |
|
Definition at line 248 of file trainingsample.cpp.
250 feature_space.IndexAndSortFeatures(features_, num_features_,
252 features_are_indexed_ =
true;
253 features_are_mapped_ =
false;
const GenericVector< int > & indexed_features() const
| bool tesseract::TrainingSample::is_error |
( |
| ) |
const |
|
inline |
| void tesseract::TrainingSample::MapFeatures |
( |
const IntFeatureMap & |
feature_map | ) |
|
Definition at line 258 of file trainingsample.cpp.
260 feature_map.feature_space().IndexAndSortFeatures(features_, num_features_,
262 feature_map.MapIndexedFeatures(indexed_features, &mapped_features_);
263 features_are_indexed_ =
false;
264 features_are_mapped_ =
true;
const GenericVector< int > & indexed_features() const
| const GenericVector<int>& tesseract::TrainingSample::mapped_features |
( |
| ) |
const |
|
inline |
| double tesseract::TrainingSample::max_dist |
( |
| ) |
const |
|
inline |
| const MicroFeature* tesseract::TrainingSample::micro_features |
( |
| ) |
const |
|
inline |
| int tesseract::TrainingSample::num_features |
( |
| ) |
const |
|
inline |
| int tesseract::TrainingSample::num_micro_features |
( |
| ) |
const |
|
inline |
| int tesseract::TrainingSample::page_num |
( |
| ) |
const |
|
inline |
| TrainingSample * tesseract::TrainingSample::RandomizedCopy |
( |
int |
index | ) |
const |
Definition at line 133 of file trainingsample.cpp.
135 if (index >= 0 && index < kSampleRandomSize) {
137 int yshift = kYShiftValues[index / kSampleScaleSize];
138 double scaling = kScaleValues[index % kSampleScaleSize];
139 for (
int i = 0; i < num_features_; ++i) {
142 sample->features_[i].X =
ClipToRange(static_cast<int>(result + 0.5), 0,
146 sample->features_[i].Y =
ClipToRange(static_cast<int>(result + 0.5), 0,
TrainingSample * Copy() const
const int kRandomizingCenter
T ClipToRange(const T &x, const T &lower_bound, const T &upper_bound)
| Pix * tesseract::TrainingSample::RenderToPix |
( |
const UNICHARSET * |
unicharset | ) |
const |
Definition at line 268 of file trainingsample.cpp.
270 for (
int f = 0;
f < num_features_; ++
f) {
271 int start_x = features_[
f].
X;
273 double dx = cos((features_[
f].Theta / 256.0) * 2.0 *
PI -
PI);
274 double dy = -sin((features_[
f].Theta / 256.0) * 2.0 *
PI -
PI);
275 for (
int i = 0; i <= 5; ++i) {
276 int x =
static_cast<int>(start_x + dx * i);
277 int y =
static_cast<int>(start_y + dy * i);
278 if (x >= 0 && x < 256 && y >= 0 && y < 256)
279 pixSetPixel(pix, x, y, 1);
282 if (unicharset !=
NULL)
const char *const id_to_unichar(UNICHAR_ID id) const
const int kIntFeatureExtent
| int tesseract::TrainingSample::sample_index |
( |
| ) |
const |
|
inline |
| bool tesseract::TrainingSample::Serialize |
( |
FILE * |
fp | ) |
const |
Definition at line 54 of file trainingsample.cpp.
55 if (fwrite(&class_id_,
sizeof(class_id_), 1, fp) != 1)
return false;
56 if (fwrite(&font_id_,
sizeof(font_id_), 1, fp) != 1)
return false;
57 if (fwrite(&page_num_,
sizeof(page_num_), 1, fp) != 1)
return false;
58 if (!bounding_box_.
Serialize(fp))
return false;
59 if (fwrite(&num_features_,
sizeof(num_features_), 1, fp) != 1)
return false;
60 if (fwrite(&num_micro_features_,
sizeof(num_micro_features_), 1, fp) != 1)
62 if (fwrite(features_,
sizeof(*features_), num_features_, fp) != num_features_)
64 if (fwrite(micro_features_,
sizeof(*micro_features_), num_micro_features_,
65 fp) != num_micro_features_)
67 if (fwrite(cn_feature_,
sizeof(*cn_feature_), kNumCNParams, fp) !=
68 kNumCNParams)
return false;
bool Serialize(FILE *fp) const
| void tesseract::TrainingSample::set_bounding_box |
( |
const TBOX & |
box | ) |
|
|
inline |
| void tesseract::TrainingSample::set_class_id |
( |
int |
id | ) |
|
|
inline |
| void tesseract::TrainingSample::set_font_id |
( |
int |
id | ) |
|
|
inline |
| void tesseract::TrainingSample::set_is_error |
( |
bool |
value | ) |
|
|
inline |
| void tesseract::TrainingSample::set_max_dist |
( |
double |
value | ) |
|
|
inline |
| void tesseract::TrainingSample::set_page_num |
( |
int |
page | ) |
|
|
inline |
| void tesseract::TrainingSample::set_sample_index |
( |
int |
value | ) |
|
|
inline |
| void tesseract::TrainingSample::set_weight |
( |
double |
value | ) |
|
|
inline |
| double tesseract::TrainingSample::weight |
( |
| ) |
const |
|
inline |
The documentation for this class was generated from the following files: