#ifndef TESSERACT_CCUTIL_NORMSTRNGS_H_
#define TESSERACT_CCUTIL_NORMSTRNGS_H_
#endif // TESSERACT_CCUTIL_NORMSTRNGS_H_
void UTF32ToUTF8(const GenericVector< char32 > &str32, STRING *utf8_str)
void UTF8ToUTF32(const char *utf8_str, GenericVector< char32 > *str32)
void NormalizeChar32(char32 ch, bool decompose, GenericVector< char32 > *str)
bool IsUTF8Whitespace(const char *text)
int SpanUTF8NotWhitespace(const char *text)
STRING NormalizeUTF8String(bool decompose, const char *str8)
char32 OCRNormalize(char32 ch)
bool IsWhitespace(const char32 ch)
bool IsInterchangeValid7BitAscii(const char32 ch)
bool IsInterchangeValid(const char32 ch)
int SpanUTF8Whitespace(const char *text)
char32 FullwidthToHalfwidth(const char32 ch)
bool IsValidCodepoint(const char32 ch)
bool IsOCREquivalent(char32 ch1, char32 ch2)