bstr: add function for UTF-8 parsing (taken from libav)

Parts taken from libavutil's GET_UTF8 and slightly modified.
author: wm4 <wm4@mplayer2.org> 2012-01-13 07:38:40 +0100
committer: wm4 <wm4@mplayer2.org> 2012-01-14 14:35:39 +0100
commit: 7700e6effca6358820cb969ddf896a2be4b77ede (patch)
tree: 23fd1dabddaadb9bad35e0b6a03a0226b48bcc94 /bstr.h
parent: 827faa38436f55fbb15b7dce4abcc5c6608a428b (diff)
download: mpv-7700e6effca6358820cb969ddf896a2be4b77ede.tar.bz2
mpv-7700e6effca6358820cb969ddf896a2be4b77ede.tar.xz
1 files changed, 13 insertions, 0 deletions
diff --git a/bstr.h b/bstr.h
index 1344f0d443..8b1644cac0 100644
--- a/bstr.h
+++ b/bstr.h
@@ -69,6 +69,19 @@ double bstrtod(struct bstr str, struct bstr *rest);
 void bstr_lower(struct bstr str);
 int bstr_sscanf(struct bstr str, const char *format, ...);
 
+// Decode the UTF-8 code point at the start of the string,, and return the
+// character.
+// After calling this function, *out_next will point to the next character.
+// out_next can be NULL.
+// On error, -1 is returned, and *out_next is not modified.
+int bstr_decode_utf8(struct bstr str, struct bstr *out_next);
+
+// Return the length of the UTF-8 sequence that starts with the given byte.
+// Given a string char *s, the next UTF-8 code point is to be expected at
+//      s + bstr_parse_utf8_code_length(s[0])
+// On error, -1 is returned. On success, it returns a value in the range [1, 4].
+int bstr_parse_utf8_code_length(unsigned char b);
+
 static inline struct bstr bstr_cut(struct bstr str, int n)
 {
     if (n > str.len)
author	wm4 <wm4@mplayer2.org>	2012-01-13 07:38:40 +0100
committer	wm4 <wm4@mplayer2.org>	2012-01-14 14:35:39 +0100
commit	7700e6effca6358820cb969ddf896a2be4b77ede (patch)
tree	23fd1dabddaadb9bad35e0b6a03a0226b48bcc94 /bstr.h
parent	827faa38436f55fbb15b7dce4abcc5c6608a428b (diff)
download	mpv-7700e6effca6358820cb969ddf896a2be4b77ede.tar.bz2 mpv-7700e6effca6358820cb969ddf896a2be4b77ede.tar.xz