20 #ifndef TESSERACT_IMAGE_IMAGEDATA_H_ 21 #define TESSERACT_IMAGE_IMAGEDATA_H_ 62 int* max_x,
int* max_y);
68 int x()
const {
return x_; }
69 int y()
const {
return y_; }
70 int dir()
const {
return dir_; }
113 const char* imagedata,
int imagedatasize,
114 const char* truth_text,
const char*
box_text);
126 return imagefilename_;
129 imagefilename_ = name;
147 return transcription_;
156 return box_texts_[index];
168 Pix*
PreScale(
int target_height,
int max_height,
float* scale_factor,
169 int* scaled_width,
int* scaled_height,
227 return document_name_;
260 pages_[index] = NULL;
272 void set_total_pages(
int total) {
274 total_pages_ = total;
290 PointerVector<ImageData> pages_;
306 mutable SVMutex general_mutex_;
322 num_pages_per_doc_ = 0;
339 return GetPageSequential(serial);
341 return GetPageRoundRobin(serial);
355 const ImageData* GetPageRoundRobin(
int serial);
359 const ImageData* GetPageSequential(
int serial);
363 int CountNeighbourDocs(
int index,
int dir);
371 int num_pages_per_doc_;
379 #endif // TESSERACT_IMAGE_IMAGEDATA_H_ const ImageData * GetPageBySerial(int serial)
static void ComputeSize(const GenericVector< WordFeature > &features, int *max_x, int *max_y)
bool LoadDocument(const char *filename, const char *lang, int start_page, inT64 max_memory, FileReader reader)
bool SaveDocument(const char *filename, FileWriter writer)
bool SaveToBuffer(GenericVector< char > *buffer)
static void Draw(const GenericVector< WordFeature > &features, ScrollView *window)
friend void * ReCachePagesFunc(void *data)
void SetDocument(const char *filename, const char *lang, inT64 max_memory, FileReader reader)
const GenericVector< TBOX > & boxes() const
bool DeSerialize(bool swap, FILE *fp)
ImageData * TakePage(int index)
void set_page_number(int num)
const GenericVector< char > & image_data() const
void set_language(const STRING &lang)
const int kFeaturePadding
bool Serialize(TFile *fp) const
const PointerVector< DocumentData > & documents() const
const ImageData * GetPage(int index)
bool LoadDocuments(const GenericVector< STRING > &filenames, const char *lang, CachingStrategy cache_strategy, FileReader reader)
DocumentCache(inT64 max_memory)
static ImageData * Build(const char *name, int page_number, const char *lang, const char *imagedata, int imagedatasize, const char *truth_text, const char *box_text)
bool AddToCache(DocumentData *data)
void LoadPageInBackground(int index)
void set_imagefilename(const STRING &name)
const STRING & document_name() const
bool IsPageAvailable(int index, ImageData **page)
const GenericVector< STRING > & box_texts() const
const STRING & transcription() const
bool Serialize(FILE *fp) const
DocumentData(const STRING &name)
static int SortByXBucket(const void *, const void *)
const STRING & box_text(int index) const
bool DeSerialize(bool swap, TFile *fp)
Pix * PreScale(int target_height, int max_height, float *scale_factor, int *scaled_width, int *scaled_height, GenericVector< TBOX > *boxes) const
void AddBoxes(const GenericVector< TBOX > &boxes, const GenericVector< STRING > &texts, const GenericVector< int > &box_pages)
inT64 memory_used() const
void AddPageToDocument(ImageData *page)
static void FromWordFeatures(const GenericVector< WordFeature > &word_features, GenericVector< FloatWordFeature > *float_features)
bool(* FileReader)(const STRING &filename, GenericVector< char > *data)
static bool SkipDeSerialize(bool swap, tesseract::TFile *fp)
const STRING & imagefilename() const
const STRING & language() const
DocumentData * FindDocument(const STRING &document_name) const
bool(* FileWriter)(const GenericVector< char > &data, const STRING &filename)