2012-05-29 07:19:50 +02:00
|
|
|
#include "string.hh"
|
2013-04-09 20:05:40 +02:00
|
|
|
|
2013-03-29 19:31:06 +01:00
|
|
|
#include "exception.hh"
|
2014-12-23 14:34:21 +01:00
|
|
|
#include "containers.hh"
|
2014-04-28 20:49:00 +02:00
|
|
|
#include "utf8_iterator.hh"
|
2012-05-29 07:19:50 +02:00
|
|
|
|
|
|
|
namespace Kakoune
|
|
|
|
{
|
|
|
|
|
2014-10-01 01:20:12 +02:00
|
|
|
bool operator<(StringView lhs, StringView rhs)
|
|
|
|
{
|
|
|
|
int cmp = strncmp(lhs.data(), rhs.data(), (int)std::min(lhs.length(), rhs.length()));
|
|
|
|
if (cmp == 0)
|
|
|
|
return lhs.length() < rhs.length();
|
|
|
|
return cmp < 0;
|
|
|
|
}
|
|
|
|
|
2014-08-03 11:02:17 +02:00
|
|
|
std::vector<String> split(StringView str, char separator, char escape)
|
2012-05-29 07:19:50 +02:00
|
|
|
{
|
|
|
|
std::vector<String> res;
|
2014-08-03 11:02:17 +02:00
|
|
|
auto it = str.begin();
|
|
|
|
while (it != str.end())
|
2012-05-29 07:19:50 +02:00
|
|
|
{
|
2013-07-24 22:37:17 +02:00
|
|
|
res.emplace_back();
|
|
|
|
String& element = res.back();
|
2014-08-03 11:02:17 +02:00
|
|
|
while (it != str.end())
|
2013-07-24 22:37:17 +02:00
|
|
|
{
|
2014-08-03 11:02:17 +02:00
|
|
|
auto c = *it;
|
|
|
|
if (c == escape and it + 1 != str.end() and *(it+1) == separator)
|
2013-07-24 22:37:17 +02:00
|
|
|
{
|
|
|
|
element += separator;
|
2014-08-03 11:02:17 +02:00
|
|
|
it += 2;
|
2013-07-24 22:37:17 +02:00
|
|
|
}
|
|
|
|
else if (c == separator)
|
|
|
|
{
|
2014-08-03 11:02:17 +02:00
|
|
|
++it;
|
2013-07-24 22:37:17 +02:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
element += c;
|
2014-08-03 11:02:17 +02:00
|
|
|
++it;
|
2013-07-24 22:37:17 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return res;
|
|
|
|
}
|
|
|
|
|
2014-10-19 17:27:36 +02:00
|
|
|
std::vector<StringView> split(StringView str, char separator)
|
|
|
|
{
|
|
|
|
std::vector<StringView> res;
|
|
|
|
auto beg = str.begin();
|
|
|
|
for (auto it = beg; it != str.end(); ++it)
|
|
|
|
{
|
|
|
|
if (*it == separator)
|
|
|
|
{
|
|
|
|
res.emplace_back(beg, it);
|
|
|
|
beg = it + 1;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
res.emplace_back(beg, str.end());
|
|
|
|
return res;
|
|
|
|
}
|
|
|
|
|
2014-11-04 14:31:15 +01:00
|
|
|
String escape(StringView str, StringView characters, char escape)
|
2013-07-24 22:37:17 +02:00
|
|
|
{
|
|
|
|
String res;
|
|
|
|
for (auto& c : str)
|
|
|
|
{
|
2014-11-04 14:31:15 +01:00
|
|
|
if (contains(characters, c))
|
2013-07-24 22:37:17 +02:00
|
|
|
res += escape;
|
|
|
|
res += c;
|
2012-05-29 07:19:50 +02:00
|
|
|
}
|
|
|
|
return res;
|
|
|
|
}
|
|
|
|
|
2014-11-04 14:31:15 +01:00
|
|
|
String unescape(StringView str, StringView characters, char escape)
|
2014-08-03 11:02:17 +02:00
|
|
|
{
|
|
|
|
String res;
|
|
|
|
for (auto& c : str)
|
|
|
|
{
|
2014-11-04 14:31:15 +01:00
|
|
|
if (contains(characters, c) and not res.empty() and res.back() == escape)
|
|
|
|
res.back() = c;
|
|
|
|
else
|
|
|
|
res += c;
|
2014-08-03 11:02:17 +02:00
|
|
|
}
|
|
|
|
return res;
|
|
|
|
}
|
|
|
|
|
|
|
|
int str_to_int(StringView str)
|
2013-05-17 14:09:42 +02:00
|
|
|
{
|
2013-06-18 22:11:44 +02:00
|
|
|
int res = 0;
|
2014-08-03 11:02:17 +02:00
|
|
|
if (sscanf(str.zstr(), "%i", &res) != 1)
|
2013-05-17 14:09:42 +02:00
|
|
|
throw runtime_error(str + "is not a number");
|
2013-06-18 22:11:44 +02:00
|
|
|
return res;
|
|
|
|
}
|
|
|
|
|
|
|
|
String to_string(int val)
|
|
|
|
{
|
|
|
|
char buf[16];
|
|
|
|
sprintf(buf, "%i", val);
|
|
|
|
return buf;
|
2013-05-17 14:09:42 +02:00
|
|
|
}
|
|
|
|
|
2014-04-18 14:45:33 +02:00
|
|
|
bool subsequence_match(StringView str, StringView subseq)
|
2013-09-23 21:16:57 +02:00
|
|
|
{
|
|
|
|
auto it = str.begin();
|
|
|
|
for (auto& c : subseq)
|
|
|
|
{
|
|
|
|
if (it == str.end())
|
|
|
|
return false;
|
|
|
|
while (*it != c)
|
|
|
|
{
|
|
|
|
if (++it == str.end())
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
++it;
|
|
|
|
}
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
2014-04-28 20:49:00 +02:00
|
|
|
String expand_tabs(StringView line, CharCount tabstop, CharCount col)
|
|
|
|
{
|
|
|
|
String res;
|
2014-06-24 20:10:57 +02:00
|
|
|
using Utf8It = utf8::iterator<const char*>;
|
2014-04-28 20:49:00 +02:00
|
|
|
for (Utf8It it = line.begin(); it.base() < line.end(); ++it)
|
|
|
|
{
|
|
|
|
if (*it == '\t')
|
|
|
|
{
|
|
|
|
CharCount end_col = (col / tabstop + 1) * tabstop;
|
|
|
|
res += String{' ', end_col - col};
|
|
|
|
}
|
|
|
|
else
|
|
|
|
res += *it;
|
|
|
|
}
|
|
|
|
return res;
|
|
|
|
}
|
|
|
|
|
2014-11-19 20:42:15 +01:00
|
|
|
std::vector<StringView> wrap_lines(StringView text, CharCount max_width)
|
|
|
|
{
|
|
|
|
using Utf8It = utf8::iterator<const char*>;
|
|
|
|
Utf8It word_begin{text.begin()};
|
|
|
|
Utf8It word_end{word_begin};
|
|
|
|
Utf8It end{text.end()};
|
|
|
|
CharCount col = 0;
|
|
|
|
std::vector<StringView> lines;
|
2014-11-20 19:45:10 +01:00
|
|
|
Utf8It line_begin = text.begin();
|
|
|
|
Utf8It line_end = line_begin;
|
2014-11-19 20:42:15 +01:00
|
|
|
while (word_begin != end)
|
|
|
|
{
|
2014-11-20 14:55:07 +01:00
|
|
|
const CharCategories cat = categorize(*word_begin);
|
2014-11-19 20:42:15 +01:00
|
|
|
do
|
|
|
|
{
|
|
|
|
++word_end;
|
|
|
|
} while (word_end != end and categorize(*word_end) == cat);
|
|
|
|
|
|
|
|
col += word_end - word_begin;
|
2014-11-20 19:45:10 +01:00
|
|
|
if ((word_begin != line_begin and col > max_width) or
|
|
|
|
cat == CharCategories::EndOfLine)
|
2014-11-19 20:42:15 +01:00
|
|
|
{
|
2014-11-20 19:45:10 +01:00
|
|
|
lines.emplace_back(line_begin.base(), line_end.base());
|
2014-11-20 14:55:07 +01:00
|
|
|
line_begin = (cat == CharCategories::EndOfLine or
|
2014-11-20 19:45:10 +01:00
|
|
|
cat == CharCategories::Blank) ? word_end : word_begin;
|
|
|
|
col = word_end - line_begin;
|
2014-11-19 20:42:15 +01:00
|
|
|
}
|
2014-11-20 14:55:07 +01:00
|
|
|
if (cat == CharCategories::Word or cat == CharCategories::Punctuation)
|
2014-11-20 19:45:10 +01:00
|
|
|
line_end = word_end;
|
2014-11-20 14:55:07 +01:00
|
|
|
|
2014-11-19 20:42:15 +01:00
|
|
|
word_begin = word_end;
|
|
|
|
}
|
2014-11-20 19:45:10 +01:00
|
|
|
if (line_begin != word_begin)
|
|
|
|
lines.emplace_back(line_begin.base(), word_begin.base());
|
2014-11-19 20:42:15 +01:00
|
|
|
return lines;
|
|
|
|
}
|
|
|
|
|
2012-05-29 07:19:50 +02:00
|
|
|
}
|