#ifndef unicode_hh_INCLUDED
#define unicode_hh_INCLUDED

// Provides iswalnum in the global namespace, as used by is_word below.
#include <wctype.h>

namespace Kakoune
{

// A single Unicode code point.
using Codepoint = char32_t;

// Returns true if c is the line feed character.
inline bool is_eol(Codepoint c)
{
    return c == '\n';
}

// Returns true if c is a space or a horizontal tab.
inline bool is_horizontal_blank(Codepoint c)
{
    return c == ' ' or c == '\t';
}

// Selects which definition of "word character" is_word and categorize use:
//  - Word: underscore or whatever iswalnum accepts
//  - WORD: anything that is neither a horizontal blank nor an end of line
enum WordType { Word, WORD };

// Returns true if c is a word character under the Word definition:
// an underscore or a character iswalnum classifies as alphanumeric.
// Note: iswalnum's classification depends on the current C locale.
template<WordType word_type = Word>
inline bool is_word(Codepoint c)
{
    return c == '_' or iswalnum(c);
}

// WORD definition: every character that is neither a horizontal blank
// nor an end of line counts as a word character.
template<>
inline bool is_word<WORD>(Codepoint c)
{
    return not is_horizontal_blank(c) and not is_eol(c);
}

// Returns true if c is neither a (Word) word character, a horizontal
// blank, nor an end of line.
inline bool is_punctuation(Codepoint c)
{
    return not (is_word(c) or is_horizontal_blank(c) or is_eol(c));
}

// Classes a code point can be assigned to by categorize.
enum class CharCategories
{
    Blank,
    EndOfLine,
    Word,
    Punctuation,
};

// Classifies c into one of the CharCategories.
//
// The checks run in order: Word-definition word character, end of line,
// horizontal blank. Anything left over is punctuation under the Word
// definition; when word_type is WORD those leftover characters are
// reported as Word instead.
template<WordType word_type = Word>
inline CharCategories categorize(Codepoint c)
{
    if (is_word(c))
        return CharCategories::Word;
    if (is_eol(c))
        return CharCategories::EndOfLine;
    if (is_horizontal_blank(c))
        return CharCategories::Blank;
    return word_type == WORD ? CharCategories::Word
                             : CharCategories::Punctuation;
}

}

#endif // unicode_hh_INCLUDED