Definition at line 296 of file paragraphs.cpp.
◆ UnicodeSpanSkipper()
tesseract::UnicodeSpanSkipper::UnicodeSpanSkipper(const UNICHARSET *unicharset, const WERD_CHOICE *word)
inline
◆ SkipAlpha()
int tesseract::UnicodeSpanSkipper::SkipAlpha(int pos)
Definition at line 337 of file paragraphs.cpp.
338 while (pos < wordlen_ && u_->get_isalpha(word_->unichar_id(pos))) pos++;
UNICHAR_ID unichar_id(int index) const
◆ SkipDigits()
int tesseract::UnicodeSpanSkipper::SkipDigits(int pos)
Definition at line 321 of file paragraphs.cpp.
323 IsDigitLike(UnicodeFor(u_, word_, pos)))) pos++;
int UnicodeFor(const UNICHARSET *u, const WERD_CHOICE *werd, int pos)
bool get_isdigit(UNICHAR_ID unichar_id) const
◆ SkipPunc()
int tesseract::UnicodeSpanSkipper::SkipPunc(int pos)
◆ SkipRomans()
int tesseract::UnicodeSpanSkipper::SkipRomans(int pos)
Definition at line 327 of file paragraphs.cpp.
328 const char *kRomans = "ivxlmdIVXLMD";
329 while (pos < wordlen_) {
331 if (ch >= 0xF0 || strchr(kRomans, ch) == nullptr) break;
The documentation for this class was generated from the following file: