From 199d7ee000fcb1ce24d3f4a919dc825e6c0d2f45 Mon Sep 17 00:00:00 2001
From: Neil
Date: Mon, 22 Jul 2013 19:36:55 +1000
Subject: Added the character representation feature.

---
 src/UniConversion.h | 4 ++++
 1 file changed, 4 insertions(+)

(limited to 'src/UniConversion.h')

diff --git a/src/UniConversion.h b/src/UniConversion.h
index 1c54506dd..753490bab 100644
--- a/src/UniConversion.h
+++ b/src/UniConversion.h
@@ -34,6 +34,10 @@ inline bool UTF8IsAscii(int ch) {
 enum { UTF8MaskWidth=0x7, UTF8MaskInvalid=0x8 };
 int UTF8Classify(const unsigned char *us, int len);
 
+// Similar to UTF8Classify but returns a length of 1 for invalid bytes
+// instead of setting the invalid flag
+int UTF8DrawBytes(const unsigned char *us, int len);
+
 // Line separator is U+2028 \xe2\x80\xa8
 // Paragraph separator is U+2029 \xe2\x80\xa9
 const int UTF8SeparatorLength = 3;
-- 
cgit v1.2.3