chiark
/
gitweb
/
~mdw
/
disorder
/ blobdiff
commit
grep
author
committer
pickaxe
?
search:
re
summary
|
shortlog
|
log
|
commit
|
commitdiff
|
tree
raw
|
inline
| side by side
utf32_word_split() and utf8_word_split() split a string into words
[disorder]
/
lib
/
unicode.h
diff --git
a/lib/unicode.h
b/lib/unicode.h
index a996844ae5ebcd22a3851764f19b9cde72a4026c..7f3220773537d0447c2fbc810a1e517b61e1dcbf 100644
(file)
--- a/
lib/unicode.h
+++ b/
lib/unicode.h
@@
-74,6
+74,9
@@
uint32_t utf32_iterator_code(utf32_iterator it);
int utf32_iterator_grapheme_boundary(utf32_iterator it);
int utf32_iterator_word_boundary(utf32_iterator it);
int utf32_iterator_grapheme_boundary(utf32_iterator it);
int utf32_iterator_word_boundary(utf32_iterator it);
+uint32_t **utf32_word_split(const uint32_t *s, size_t ns, size_t *nwp);
+char **utf8_word_split(const char *s, size_t ns, size_t *nwp);
+
/** @brief Convert 0-terminated UTF-32 to UTF-8
* @param s 0-terminated UTF-32 string
* @return 0-terminated UTF-8 string or 0 on error
/** @brief Convert 0-terminated UTF-32 to UTF-8
* @param s 0-terminated UTF-32 string
* @return 0-terminated UTF-8 string or 0 on error