int a_Utf8_test(
const char* src,
unsigned int srclen);
static const char utf8_replacement_char[]
Unicode replacement character U+FFFD.
bool_t a_Utf8_ideographic(const char *s, const char *end, int *len)
Does s point to a UTF-8-encoded ideographic character?
int a_Utf8_char_count(const char *str, int len)
uint_t a_Utf8_decode(const char *, const char *end, int *len)
Decode a single UTF-8-encoded character starting at p (the first argument, unnamed in the signature).
static const char utf8_zero_width_space[]
Unicode zero width space U+200B.
int a_Utf8_test(const char *src, unsigned int srclen)
Examine the first srclen bytes of src.
uint_t a_Utf8_end_of_char(const char *str, uint_t i)
Return index of the last byte of the UTF-8-encoded character that str + i points to or into.
int a_Utf8_encode(unsigned int ucs, char *buf)
Write UTF-8 encoding of ucs into buf and return number of bytes written.
bool_t a_Utf8_combining_char(int unicode)