diff options
| author | Drew DeVault <sir@cmpwn.com> | 2018-04-12 20:19:54 -0400 |
|---|---|---|
| committer | Drew DeVault <sir@cmpwn.com> | 2018-04-12 20:19:54 -0400 |
| commit | cd1b32453a9296c18b28bff71607aeb22987b5cd (patch) | |
| tree | c653c6d525b471914c01a9d7ae543f521b6138ed /include/unicode.h | |
| parent | 8e06985cc1b479724446fba752e0fecfb998e87b (diff) | |
| parent | 5785170421dc38437acde8bb61068cd16fda716c (diff) | |
Merge branch 'wlroots'
Diffstat (limited to 'include/unicode.h')
| -rw-r--r-- | include/unicode.h | 33 |
1 files changed, 33 insertions, 0 deletions
diff --git a/include/unicode.h b/include/unicode.h
new file mode 100644
index 00000000..e2ee9588
--- /dev/null
+++ b/include/unicode.h
@@ -0,0 +1,33 @@
+#ifndef _SWAY_UNICODE_H
+#define _SWAY_UNICODE_H
+#include <stddef.h>
+#include <stdint.h>
+
+// The original UTF-8 design allowed sequences of up to 6 bytes, but every
+// Unicode code point (at most U+10FFFF) fits in 4 bytes or fewer.
+#define UTF8_MAX_SIZE 4
+
+#define UTF8_INVALID 0x80 // NOTE(review): presumably marks invalid input; confirm
+
+/**
+ * Decodes the UTF-8 character at *str and advances *str past it.
+ */
+uint32_t utf8_decode(const char **str);
+
+/**
+ * Encodes ch as UTF-8 into str and returns the length of the encoded character.
+ */
+size_t utf8_encode(char *str, uint32_t ch);
+
+/**
+ * Returns the size, in bytes, of the UTF-8 character that str points at.
+ */
+int utf8_size(const char *str);
+
+/**
+ * Returns the size, in bytes, of the UTF-8 encoding of the character ch.
+ */
+size_t utf8_chsize(uint32_t ch);
+
+#endif
+
