以前的笔记, 转存一下:
功能应该是计算utf8串长度
size_t utf8_charsize(unsigned char c) {
/* Determine size in bytes of character */
if ((c >>= 1) == 0x7E) return 6;
if ((c >>= 1) == 0x3E) return 5;
if ((c >>= 1) == 0x1E) return 4;
if ((c >>= 1) == 0x0E) return 3;
if ((c >>= 1) == 0x06) return 2;
/* Default to one character */
return 1;
}
size_t utf8_strlen(const char* str) {
/* The current length of the string */
int length = 0;
/* Number of characters before start of next character */
int skip = 0;
while (*str != 0) {
/* If skipping, then skip */
if (skip > 0) skip--;
/* Otherwise, determine next skip value, and increment length */
else {
/* Get next character */
unsigned char c = (unsigned char) *str;
/* Determine skip value (size in bytes of rest of character) */
skip = guac_utf8_charsize(c) - 1;
length++;
}
str++;
}
return length;
}