Definition at line 282 of file paragraphs.cpp.
◆ UnicodeSpanSkipper()
tesseract::UnicodeSpanSkipper::UnicodeSpanSkipper(const UNICHARSET *unicharset, const WERD_CHOICE *word) [inline]
◆ SkipAlpha()
int tesseract::UnicodeSpanSkipper::SkipAlpha(int pos)
Definition at line 323 of file paragraphs.cpp.
324   while (pos < wordlen_ && u_->get_isalpha(word_->unichar_id(pos))) pos++;
UNICHAR_ID unichar_id(int index) const
◆ SkipDigits()
int tesseract::UnicodeSpanSkipper::SkipDigits(int pos)
Definition at line 307 of file paragraphs.cpp.
UNICHAR_ID unichar_id(int index) const
int UnicodeFor(const UNICHARSET *u, const WERD_CHOICE *werd, int pos)
bool get_isdigit(UNICHAR_ID unichar_id) const
◆ SkipPunc()
int tesseract::UnicodeSpanSkipper::SkipPunc(int pos)
Definition at line 302 of file paragraphs.cpp.
303   while (pos < wordlen_ && u_->get_ispunctuation(word_->unichar_id(pos))) pos++;
UNICHAR_ID unichar_id(int index) const
◆ SkipRomans()
int tesseract::UnicodeSpanSkipper::SkipRomans(int pos)
Definition at line 313 of file paragraphs.cpp.
314   const char *kRomans = "ivxlmdIVXLMD";
315   while (pos < wordlen_) {
317     if (ch >= 0xF0 || strchr(kRomans, ch) == 0) break;
int UnicodeFor(const UNICHARSET *u, const WERD_CHOICE *werd, int pos)
The documentation for this class was generated from the following file: