tesseract  3.05.02
underlin.h File Reference
#include "fpchop.h"

Go to the source code of this file.

Functions

void restore_underlined_blobs (TO_BLOCK *block)
 
TO_ROW * most_overlapping_row (TO_ROW_LIST *rows, BLOBNBOX *blob)
 
void find_underlined_blobs (BLOBNBOX *u_line, QSPLINE *baseline, float xheight, float baseline_offset, ICOORDELT_LIST *chop_cells)
 
void vertical_cunderline_projection (C_OUTLINE *outline, QSPLINE *baseline, float xheight, float baseline_offset, STATS *lower_proj, STATS *middle_proj, STATS *upper_proj)
 

Variables

double textord_underline_offset = 0.1
 
bool textord_restore_underlines = FALSE
 

Function Documentation

◆ find_underlined_blobs()

void find_underlined_blobs ( BLOBNBOX *  u_line,
QSPLINE *  baseline,
float  xheight,
float  baseline_offset,
ICOORDELT_LIST *  chop_cells 
)

Definition at line 173 of file underlin.cpp.

179  {
180  inT16 x, y; //sides of blob
181  ICOORD blob_chop; //sides of blob
182  TBOX blob_box = u_line->bounding_box ();
183  //cell iterator
184  ICOORDELT_IT cell_it = chop_cells;
185  STATS upper_proj (blob_box.left (), blob_box.right () + 1);
186  STATS middle_proj (blob_box.left (), blob_box.right () + 1);
187  STATS lower_proj (blob_box.left (), blob_box.right () + 1);
188  C_OUTLINE_IT out_it; //outlines of blob
189 
190  ASSERT_HOST (u_line->cblob () != NULL);
191 
192  out_it.set_to_list (u_line->cblob ()->out_list ());
193  for (out_it.mark_cycle_pt (); !out_it.cycled_list (); out_it.forward ()) {
194  vertical_cunderline_projection (out_it.data (),
195  baseline, xheight, baseline_offset,
196  &lower_proj, &middle_proj, &upper_proj);
197  }
198 
199  for (x = blob_box.left (); x < blob_box.right (); x++) {
200  if (middle_proj.pile_count (x) > 0) {
201  for (y = x + 1;
202  y < blob_box.right () && middle_proj.pile_count (y) > 0; y++);
203  blob_chop = ICOORD (x, y);
204  cell_it.add_after_then_move (new ICOORDELT (blob_chop));
205  x = y;
206  }
207  }
208 }
const TBOX & bounding_box() const
Definition: blobbox.h:215
short inT16
Definition: host.h:33
integer coordinate
Definition: points.h:30
C_BLOB * cblob() const
Definition: blobbox.h:253
C_OUTLINE_LIST * out_list()
Definition: stepblob.h:64
void vertical_cunderline_projection(C_OUTLINE *outline, QSPLINE *baseline, float xheight, float baseline_offset, STATS *lower_proj, STATS *middle_proj, STATS *upper_proj)
Definition: underlin.cpp:218
inT16 left() const
Definition: rect.h:68
TBOX
Definition: rect.h:30
inT16 right() const
Definition: rect.h:75
STATS
Definition: statistc.h:33
#define ASSERT_HOST(x)
Definition: errcode.h:84

◆ most_overlapping_row()

TO_ROW* most_overlapping_row ( TO_ROW_LIST *  rows,
BLOBNBOX *  blob 
)

Definition at line 116 of file underlin.cpp.

119  {
120  inT16 x = (blob->bounding_box ().left ()
121  + blob->bounding_box ().right ()) / 2;
122  TO_ROW_IT row_it = rows; //row iterator
123  TO_ROW *row; //current row
124  TO_ROW *best_row; //output row
125  float overlap; //of blob & row
126  float bestover; //best overlap
127 
128  best_row = NULL;
129  bestover = (float) -MAX_INT32;
130  if (row_it.empty ())
131  return NULL;
132  row = row_it.data ();
133  row_it.mark_cycle_pt ();
134  while (row->baseline.y (x) + row->descdrop > blob->bounding_box ().top ()
135  && !row_it.cycled_list ()) {
136  best_row = row;
137  bestover =
138  blob->bounding_box ().top () - row->baseline.y (x) + row->descdrop;
139  row_it.forward ();
140  row = row_it.data ();
141  }
142  while (row->baseline.y (x) + row->xheight + row->ascrise
143  >= blob->bounding_box ().bottom () && !row_it.cycled_list ()) {
144  overlap = row->baseline.y (x) + row->xheight + row->ascrise;
145  if (blob->bounding_box ().top () < overlap)
146  overlap = blob->bounding_box ().top ();
147  if (blob->bounding_box ().bottom () >
148  row->baseline.y (x) + row->descdrop)
149  overlap -= blob->bounding_box ().bottom ();
150  else
151  overlap -= row->baseline.y (x) + row->descdrop;
152  if (overlap > bestover) {
153  bestover = overlap;
154  best_row = row;
155  }
156  row_it.forward ();
157  row = row_it.data ();
158  }
159  if (bestover < 0
160  && row->baseline.y (x) + row->xheight + row->ascrise
161  - blob->bounding_box ().bottom () > bestover)
162  best_row = row;
163  return best_row;
164 }
const TBOX & bounding_box() const
Definition: blobbox.h:215
short inT16
Definition: host.h:33
double y(double x) const
Definition: quspline.cpp:217
inT16 bottom() const
Definition: rect.h:61
float ascrise
Definition: blobbox.h:655
inT16 left() const
Definition: rect.h:68
QSPLINE baseline
Definition: blobbox.h:666
float xheight
Definition: blobbox.h:653
#define MAX_INT32
Definition: host.h:53
inT16 top() const
Definition: rect.h:54
inT16 right() const
Definition: rect.h:75
float descdrop
Definition: blobbox.h:656

◆ restore_underlined_blobs()

void restore_underlined_blobs ( TO_BLOCK *  block)

Definition at line 38 of file underlin.cpp.

40  {
41  inT16 chop_coord; //chop boundary
42  TBOX blob_box; //of underline
43  BLOBNBOX *u_line; //underline bit
44  TO_ROW *row; //best row for blob
45  ICOORDELT_LIST chop_cells; //blobs to cut out
46  //real underlines
47  BLOBNBOX_LIST residual_underlines;
48  C_OUTLINE_LIST left_coutlines;
49  C_OUTLINE_LIST right_coutlines;
50  ICOORDELT_IT cell_it = &chop_cells;
51  //under lines
52  BLOBNBOX_IT under_it = &block->underlines;
53  BLOBNBOX_IT ru_it = &residual_underlines;
54 
55  if (block->get_rows()->empty())
56  return; // Don't crash if there are no rows.
57  for (under_it.mark_cycle_pt (); !under_it.cycled_list ();
58  under_it.forward ()) {
59  u_line = under_it.extract ();
60  blob_box = u_line->bounding_box ();
61  row = most_overlapping_row (block->get_rows (), u_line);
62  if (row == NULL)
63  return; // Don't crash if there is no row.
64  find_underlined_blobs (u_line, &row->baseline, row->xheight,
65  row->xheight * textord_underline_offset,
66  &chop_cells);
67  cell_it.set_to_list (&chop_cells);
68  for (cell_it.mark_cycle_pt (); !cell_it.cycled_list ();
69  cell_it.forward ()) {
70  chop_coord = cell_it.data ()->x ();
71  if (cell_it.data ()->y () - chop_coord > textord_fp_chop_error + 1) {
72  split_to_blob (u_line, chop_coord,
73  textord_fp_chop_error + 0.5,
74  &left_coutlines,
75  &right_coutlines);
76  if (!left_coutlines.empty()) {
77  ru_it.add_after_then_move(new BLOBNBOX(new C_BLOB(&left_coutlines)));
78  }
79  chop_coord = cell_it.data ()->y ();
80  split_to_blob(NULL, chop_coord, textord_fp_chop_error + 0.5,
81  &left_coutlines, &right_coutlines);
82  if (!left_coutlines.empty()) {
83  row->insert_blob(new BLOBNBOX(new C_BLOB(&left_coutlines)));
84  }
85  u_line = NULL; //no more blobs to add
86  }
87  delete cell_it.extract();
88  }
89  if (!right_coutlines.empty ()) {
90  split_to_blob(NULL, blob_box.right(), textord_fp_chop_error + 0.5,
91  &left_coutlines, &right_coutlines);
92  if (!left_coutlines.empty())
93  ru_it.add_after_then_move(new BLOBNBOX(new C_BLOB(&left_coutlines)));
94  }
95  if (u_line != NULL) {
96  if (u_line->cblob() != NULL)
97  delete u_line->cblob();
98  delete u_line;
99  }
100  }
101  if (!ru_it.empty()) {
102  ru_it.move_to_first();
103  for (ru_it.mark_cycle_pt(); !ru_it.cycled_list(); ru_it.forward()) {
104  under_it.add_after_then_move(ru_it.extract());
105  }
106  }
107 }
const TBOX & bounding_box() const
Definition: blobbox.h:215
short inT16
Definition: host.h:33
EXTERN int textord_fp_chop_error
Definition: fpchop.cpp:39
C_BLOB * cblob() const
Definition: blobbox.h:253
BLOBNBOX_LIST underlines
Definition: blobbox.h:769
void insert_blob(BLOBNBOX *blob)
Definition: blobbox.cpp:764
EXTERN double textord_underline_offset
Definition: underlin.cpp:28
TO_ROW_LIST * get_rows()
Definition: blobbox.h:700
TO_ROW * most_overlapping_row(TO_ROW_LIST *rows, BLOBNBOX *blob)
Definition: underlin.cpp:116
QSPLINE baseline
Definition: blobbox.h:666
float xheight
Definition: blobbox.h:653
void split_to_blob(BLOBNBOX *blob, inT16 chop_coord, float pitch_error, C_OUTLINE_LIST *left_coutlines, C_OUTLINE_LIST *right_coutlines)
Definition: fpchop.cpp:243
TBOX
Definition: rect.h:30
inT16 right() const
Definition: rect.h:75
void find_underlined_blobs(BLOBNBOX *u_line, QSPLINE *baseline, float xheight, float baseline_offset, ICOORDELT_LIST *chop_cells)
Definition: underlin.cpp:173

◆ vertical_cunderline_projection()

void vertical_cunderline_projection ( C_OUTLINE *  outline,
QSPLINE *  baseline,
float  xheight,
float  baseline_offset,
STATS *  lower_proj,
STATS *  middle_proj,
STATS *  upper_proj 
)

Definition at line 218 of file underlin.cpp.

226  {
227  ICOORD pos; //current point
228  ICOORD step; //edge step
229  inT16 lower_y, upper_y; //region limits
230  inT32 length; //of outline
231  inT16 stepindex; //current step
232  C_OUTLINE_IT out_it = outline->child ();
233 
234  pos = outline->start_pos ();
235  length = outline->pathlength ();
236  for (stepindex = 0; stepindex < length; stepindex++) {
237  step = outline->step (stepindex);
238  if (step.x () > 0) {
239  lower_y =
240  (inT16) floor (baseline->y (pos.x ()) + baseline_offset + 0.5);
241  upper_y =
242  (inT16) floor (baseline->y (pos.x ()) + baseline_offset +
243  xheight + 0.5);
244  if (pos.y () >= lower_y) {
245  lower_proj->add (pos.x (), -lower_y);
246  if (pos.y () >= upper_y) {
247  middle_proj->add (pos.x (), lower_y - upper_y);
248  upper_proj->add (pos.x (), upper_y - pos.y ());
249  }
250  else
251  middle_proj->add (pos.x (), lower_y - pos.y ());
252  }
253  else
254  lower_proj->add (pos.x (), -pos.y ());
255  }
256  else if (step.x () < 0) {
257  lower_y =
258  (inT16) floor (baseline->y (pos.x () - 1) + baseline_offset +
259  0.5);
260  upper_y =
261  (inT16) floor (baseline->y (pos.x () - 1) + baseline_offset +
262  xheight + 0.5);
263  if (pos.y () >= lower_y) {
264  lower_proj->add (pos.x () - 1, lower_y);
265  if (pos.y () >= upper_y) {
266  middle_proj->add (pos.x () - 1, upper_y - lower_y);
267  upper_proj->add (pos.x () - 1, pos.y () - upper_y);
268  }
269  else
270  middle_proj->add (pos.x () - 1, pos.y () - lower_y);
271  }
272  else
273  lower_proj->add (pos.x () - 1, pos.y ());
274  }
275  pos += step;
276  }
277 
278  for (out_it.mark_cycle_pt (); !out_it.cycled_list (); out_it.forward ()) {
279  vertical_cunderline_projection (out_it.data (),
280  baseline, xheight, baseline_offset,
281  lower_proj, middle_proj, upper_proj);
282  }
283 }
short inT16
Definition: host.h:33
integer coordinate
Definition: points.h:30
void add(inT32 value, inT32 count)
Definition: statistc.cpp:101
inT32 pathlength() const
Definition: coutln.h:133
ICOORD step(int index) const
Definition: coutln.h:142
void vertical_cunderline_projection(C_OUTLINE *outline, QSPLINE *baseline, float xheight, float baseline_offset, STATS *lower_proj, STATS *middle_proj, STATS *upper_proj)
Definition: underlin.cpp:218
inT16 x() const
access function
Definition: points.h:52
C_OUTLINE_LIST * child()
Definition: coutln.h:106
int inT32
Definition: host.h:35
const ICOORD & start_pos() const
Definition: coutln.h:146
inT16 y() const
access function
Definition: points.h:56

Variable Documentation

◆ textord_restore_underlines

bool textord_restore_underlines = FALSE

"Chop underlines & put back"

Definition at line 30 of file underlin.cpp.

◆ textord_underline_offset

double textord_underline_offset = 0.1

"Fraction of x to ignore"

Definition at line 28 of file underlin.cpp.