Merge branch 'wlroots'

author: Drew DeVault <sir@cmpwn.com> 2018-04-12 20:19:54 -0400
committer: Drew DeVault <sir@cmpwn.com> 2018-04-12 20:19:54 -0400
commit: cd1b32453a9296c18b28bff71607aeb22987b5cd (patch)
tree: c653c6d525b471914c01a9d7ae543f521b6138ed /include/unicode.h
parent: 8e06985cc1b479724446fba752e0fecfb998e87b (diff)
parent: 5785170421dc38437acde8bb61068cd16fda716c (diff)
1 files changed, 33 insertions, 0 deletions
diff --git a/include/unicode.h b/include/unicode.h
new file mode 100644
index 00000000..e2ee9588
--- /dev/null
+++ b/include/unicode.h
@@ -0,0 +1,33 @@
+#ifndef _SWAY_UNICODE_H
+#define _SWAY_UNICODE_H
+#include <stddef.h>
+#include <stdint.h>
+
+// Technically UTF-8 supports up to 6 byte codepoints, but Unicode itself
+// doesn't really bother with more than 4.
+#define UTF8_MAX_SIZE 4
+
+#define UTF8_INVALID 0x80
+
+/**
+ * Grabs the next UTF-8 character and advances the string pointer
+ */
+uint32_t utf8_decode(const char **str);
+
+/**
+ * Encodes a character as UTF-8 and returns the length of that character.
+ */
+size_t utf8_encode(char *str, uint32_t ch);
+
+/**
+ * Returns the size of the next UTF-8 character
+ */
+int utf8_size(const char *str);
+
+/**
+ * Returns the size of a UTF-8 character
+ */
+size_t utf8_chsize(uint32_t ch);
+
+#endif
+
author	Drew DeVault <sir@cmpwn.com>	2018-04-12 20:19:54 -0400
committer	Drew DeVault <sir@cmpwn.com>	2018-04-12 20:19:54 -0400
commit	cd1b32453a9296c18b28bff71607aeb22987b5cd (patch)
tree	c653c6d525b471914c01a9d7ae543f521b6138ed /include/unicode.h
parent	8e06985cc1b479724446fba752e0fecfb998e87b (diff)
parent	5785170421dc38437acde8bb61068cd16fda716c (diff)