20 #ifndef TESSERACT_CCUTIL_UNICHAR_H_ 21 #define TESSERACT_CCUTIL_UNICHAR_H_ 30 #define UNICHAR_LEN 30 36 static const int INVALID_UNICHAR_ID = -1;
38 static const char INVALID_UNICHAR[] =
"__INVALID_UNICHAR__";
86 static int utf8_step(
const char* utf8_str);
134 return lhs.it_ == rhs.it_;
137 return !(lhs == rhs);
165 #endif // TESSERACT_CCUTIL_UNICHAR_H_ static const_iterator begin(const char *utf8_str, const int byte_length)
int get_utf8(char *buf) const
static const_iterator end(const char *utf8_str, const int byte_length)
friend bool operator!=(const CI &lhs, const CI &rhs)
const char * utf8_data() const
const_iterator & operator++()
const char * utf8() const
friend bool operator==(const CI &lhs, const CI &rhs)
static int utf8_step(const char *utf8_str)
static bool UTF8ToUnicode(const char *utf8_str, GenericVector< int > *unicodes)