summary | refs | log | tree | commit | diff
path: root/unicode.h
diff options
context:
space:
mode:
author: Jared Van Bortel <jared@nomic.ai> 2024-03-26 17:46:21 -0400
committer: GitHub <noreply@github.com> 2024-03-26 17:46:21 -0400
commit: 32c8486e1f0297393cb22ac0a0d26a6b17ad4d54 (patch)
tree: aae4f945bf3355c009cb9643376439fcba5558d0 /unicode.h
parent: 557410b8f06380560155ac7fcb8316d71ddc9837 (diff)
wpm : portable unicode tolower (#6305)
Also use C locale for ispunct/isspace, and split unicode-data.cpp from unicode.cpp.
Diffstat (limited to 'unicode.h')
-rw-r--r-- unicode.h 2
1 files changed, 2 insertions, 0 deletions
diff --git a/unicode.h b/unicode.h
index 6d14a5a3..6a0be393 100644
--- a/unicode.h
+++ b/unicode.h
@@ -24,3 +24,5 @@ int unicode_cpt_type(const std::string & utf8);
std::string unicode_byte_to_utf8(uint8_t byte);
uint8_t unicode_utf8_to_byte(const std::string & utf8);
+// simple tolower that only implements one-to-one mapping, not one-to-many
+char32_t unicode_tolower(char32_t cp);