diff options
author | Jared Van Bortel <jared@nomic.ai> | 2024-03-26 17:46:21 -0400 |
---|---|---|
committer | GitHub <noreply@github.com> | 2024-03-26 17:46:21 -0400 |
commit | 32c8486e1f0297393cb22ac0a0d26a6b17ad4d54 (patch) | |
tree | aae4f945bf3355c009cb9643376439fcba5558d0 /unicode.h | |
parent | 557410b8f06380560155ac7fcb8316d71ddc9837 (diff) |
wpm : portable unicode tolower (#6305)
Also use C locale for ispunct/isspace, and split unicode-data.cpp from unicode.cpp.
Diffstat (limited to 'unicode.h')
-rw-r--r-- | unicode.h | 2 |
1 files changed, 2 insertions, 0 deletions
```diff
@@ -24,3 +24,5 @@ int unicode_cpt_type(const std::string & utf8);
 std::string unicode_byte_to_utf8(uint8_t byte);
 uint8_t unicode_utf8_to_byte(const std::string & utf8);
+// simple tolower that only implements one-to-one mapping, not one-to-many
+char32_t unicode_tolower(char32_t cp);
```