#include "html.h"
#include "document_container.h"

/// Breaks `text` into word and whitespace pieces and reports each piece
/// through a callback, in the order the pieces occur.
///
/// The input is first converted with utf8_to_wchar and then scanned one
/// wide character at a time:
///   - ' ', '\t', '\n', '\r' and '\f' are each reported individually via
///     `on_space`;
///   - code points in 0x4E00..0x9FCC (the CJK range) are each reported
///     individually via `on_word`;
///   - every other character is accumulated, and the accumulated run is
///     reported via `on_word` as soon as one of the characters above (or the
///     end of the input) is reached.
///
/// Every piece is handed to the callbacks as the result of wchar_to_utf8.
///
/// NOTE(review): the std::function parameters appear without template
/// arguments in this view of the file; confirm the exact signature against
/// the declaration in document_container.h.
///
/// @param text     Text to split.
/// @param on_word  Invoked for every word piece.
/// @param on_space Invoked for every single whitespace character.
void litehtml::document_container::split_text(const char* text, const std::function& on_word, const std::function& on_space)
{
    // C-style cast kept as written: utf8_to_wchar's definition is not visible
    // here, so the exact conversion it performs is left untouched.
    const std::wstring wide_text = (const wchar_t*)utf8_to_wchar(text);

    // Characters of the word currently being collected.
    std::wstring pending;

    // Reports the collected word (if there is one) and starts a fresh one.
    auto flush_word = [&]()
    {
        if (pending.empty())
        {
            return;
        }
        on_word(wchar_to_utf8(pending.c_str()));
        pending.clear();
    };

    for (const wchar_t wide_char : wide_text)
    {
        const ucode_t code = static_cast<ucode_t>(wide_char);

        const bool is_whitespace =
            code == ' ' || code == '\t' || code == '\n' || code == '\r' || code == '\f';
        if (is_whitespace)
        {
            // A whitespace character ends the current word and is itself
            // reported as a one-character piece.
            flush_word();
            pending += code;
            on_space(wchar_to_utf8(pending.c_str()));
            pending.clear();
            continue;
        }

        // CJK character range
        const bool is_cjk = code >= 0x4E00 && code <= 0x9FCC;
        if (is_cjk)
        {
            // Each CJK character is a word on its own, so it also terminates
            // whatever word was being collected before it.
            flush_word();
            pending += code;
            on_word(wchar_to_utf8(pending.c_str()));
            pending.clear();
            continue;
        }

        pending += code;
    }

    // Report the trailing word, if the input did not end on a separator.
    flush_word();
}