libcubescript/src/cs_parser.cc

233 lines
6.7 KiB
C++
Raw Normal View History

2017-06-20 21:21:39 +02:00
#include <cubescript/cubescript.hh>
2021-03-23 02:00:11 +01:00
#include "cs_std.hh"
namespace cscript {
2021-03-23 02:00:11 +01:00
/* string/word parsers are also useful to have public */
/* Scans a double-quoted string literal located at the start of `str`.
 *
 * If `str` is empty or does not start with a double quote, nothing is
 * consumed: `nlines` is set to 0 and `str.data()` is returned.
 *
 * Otherwise scanning starts right after the opening quote and stops at the
 * first unescaped double quote, CR or LF, or at the end of the input:
 *   - `^` followed by a regular character skips that character
 *   - `^` or `\` followed by a line break (LF, CR or CRLF) continues the
 *     string on the next line and bumps the line count
 *   - `\` followed by anything else stops the scan at that character
 *
 * `nlines` receives 1 plus the number of escaped line breaks crossed; it is
 * written before any error is raised.
 *
 * Returns a pointer just past the closing quote. Throws cs_error
 * ("unfinished string") when the scan stops anywhere but on a double quote.
 */
LIBCUBESCRIPT_EXPORT char const *cs_parse_string(
    cs_state &cs, std::string_view str, size_t &nlines
) {
    size_t nl = 0;
    nlines = nl;
    if (str.empty() || (str.front() != '\"')) {
        return str.data();
    }
    /* go through data()/size() instead of begin()/end(): the iterator type
     * of std::string_view is implementation-defined and is not guaranteed
     * to be convertible to a raw pointer
     */
    char const *beg = str.data();
    char const *end = beg + str.size();
    /* remember the opening quote for the error message, then step past it */
    char const *orig = beg++;
    ++nl;
    while (beg != end) {
        switch (*beg) {
            case '\r':
            case '\n':
            case '\"':
                goto done;
            case '^':
            case '\\': {
                /* a backslash is only valid right before a line break */
                bool needn = (*beg == '\\');
                if (++beg == end) {
                    goto done;
                }
                if ((*beg == '\r') || (*beg == '\n')) {
                    char c = *beg++;
                    ++nl;
                    /* treat CRLF as a single line break */
                    if ((beg != end) && (c == '\r') && (*beg == '\n')) {
                        ++beg;
                    }
                } else if (needn) {
                    goto done;
                } else {
                    /* skip the character escaped by '^' */
                    ++beg;
                }
                continue;
            }
            default:
                break;
        }
        ++beg;
    }
done:
    nlines = nl;
    if ((beg == end) || (*beg != '\"')) {
        throw cs_error(
            cs, "unfinished string '%s'",
            std::string_view{orig, std::size_t(beg - orig)}
        );
    }
    return ++beg;
}
2016-09-21 21:02:13 +02:00
2021-03-23 02:00:11 +01:00
/* Scans a bare word located at the start of `str`.
 *
 * Returns a pointer to the first character that ends the word: a double
 * quote, a semicolon, whitespace (space, tab, CR, LF), the start of a `//`
 * comment, an unmatched `]` or `)`, or the end of the input. A lone `/` is
 * part of the word.
 *
 * A `[` or `(` opens a group that is scanned by a recursive call and has to
 * be followed immediately by the matching closer; otherwise cs_error is
 * thrown ("missing "]"" / "missing ")""). The nested scan stops on the same
 * terminators as the outer one, so a group containing e.g. whitespace is
 * reported as missing its closer.
 */
LIBCUBESCRIPT_EXPORT char const *cs_parse_word(
    cs_state &cs, std::string_view str
) {
    /* every character that may need special handling inside a word */
    std::string_view const chrs{"\"/;()[] \t\r\n"};
    /* go through data()/size() instead of begin()/end(): the iterator type
     * of std::string_view is implementation-defined and is not guaranteed
     * to be convertible to a raw pointer
     */
    char const *it = str.data();
    char const *end = it + str.size();
    for (; it != end; ++it) {
        it = std::find_first_of(it, end, chrs.begin(), chrs.end());
        if (it == end) {
            return it;
        }
        switch (*it) {
            case '"':
            case ';':
            case ' ':
            case '\t':
            case '\r':
            case '\n':
                return it;
            case '/':
                /* only a double slash (comment start) terminates the word */
                if (((end - it) > 1) && (it[1] == '/')) {
                    return it;
                }
                break;
            case '[':
                ++it;
                it = cs_parse_word(cs, std::string_view{
                    it, std::size_t(end - it)
                });
                if ((it == end) || (*it != ']')) {
                    throw cs_error(cs, "missing \"]\"");
                }
                /* the loop increment steps past the closing bracket */
                break;
            case '(':
                ++it;
                it = cs_parse_word(cs, std::string_view{
                    it, std::size_t(end - it)
                });
                if ((it == end) || (*it != ')')) {
                    throw cs_error(cs, "missing \")\"");
                }
                /* the loop increment steps past the closing paren */
                break;
            case ']':
            case ')':
                /* unmatched closer: let the caller decide what it means */
                return it;
        }
    }
    return it;
}
/* list parser public implementation */
2016-09-21 21:02:13 +02:00
2021-03-20 19:34:26 +01:00
/* Parses the next list item from the remaining input.
 *
 * Leading whitespace and `//` comments are skipped first. Returns false
 * when the input is exhausted or the next character is a stray `)` or `]`;
 * otherwise stores the item and returns true:
 *   - a `"..."` string: the quoted item includes the quotes, the item is
 *     the raw (still escaped) text in between; cs_parse_string may throw
 *   - a `(...)` or `[...]` block: the quoted item includes the delimiters,
 *     the item is the text in between; quoted strings and `//` comments
 *     inside are skipped, and only brackets of the same kind as the opener
 *     are counted for nesting
 *   - anything else: a bare word as delimited by cs_parse_word, with item
 *     and quoted item being identical
 *
 * An unterminated block yields the rest of the input as the item. After a
 * complete item, trailing whitespace/comments and one optional `;` are
 * consumed.
 */
LIBCUBESCRIPT_EXPORT bool cs_list_parser::parse() {
    skip_until_item();
    if (p_input_beg == p_input_end) {
        return false;
    }
    switch (*p_input_beg) {
        case '"': {
            char const *qi = p_input_beg;
            p_input_beg = cs_parse_string(*p_state, get_input());
            p_quoted_item = std::string_view{
                qi, std::size_t(p_input_beg - qi)
            };
            /* strip the surrounding quotes */
            p_item = p_quoted_item.substr(1, p_quoted_item.size() - 2);
            break;
        }
        case '(':
        case '[': {
            char btype = *p_input_beg;
            int brak = 1;
            char const *ibeg = p_input_beg++;
            for (;;) {
                std::string_view chrs{"\"/;()[]"};
                p_input_beg = std::find_first_of(
                    p_input_beg, p_input_end, chrs.begin(), chrs.end()
                );
                if (p_input_beg == p_input_end) {
                    /* unterminated block: expose everything up to the end
                     * of the input instead of leaving stale item contents
                     * from a previous call in place
                     */
                    p_item = std::string_view{
                        ibeg + 1, std::size_t(p_input_end - (ibeg + 1))
                    };
                    p_quoted_item = std::string_view{
                        ibeg, std::size_t(p_input_end - ibeg)
                    };
                    return true;
                }
                char c = *p_input_beg++;
                switch (c) {
                    case '"':
                        /* the quote is needed in str parsing */
                        --p_input_beg;
                        p_input_beg = cs_parse_string(*p_state, get_input());
                        break;
                    case '/':
                        /* a double slash starts a comment: skip the line */
                        if (
                            (p_input_beg != p_input_end) &&
                            (*p_input_beg == '/')
                        ) {
                            p_input_beg = std::find(
                                p_input_beg, p_input_end, '\n'
                            );
                        }
                        break;
                    case '(':
                    case '[':
                        /* only openers of our own kind nest */
                        brak += (c == btype);
                        break;
                    case ')':
                        if ((btype == '(') && (--brak <= 0)) {
                            goto endblock;
                        }
                        break;
                    case ']':
                        if ((btype == '[') && (--brak <= 0)) {
                            goto endblock;
                        }
                        break;
                }
            }
endblock:
            /* p_input_beg is now one past the closing delimiter */
            p_item = std::string_view{
                ibeg + 1, std::size_t((p_input_beg - 1) - (ibeg + 1))
            };
            p_quoted_item = std::string_view{
                ibeg, std::size_t(p_input_beg - ibeg)
            };
            break;
        }
        case ')':
        case ']':
            return false;
        default: {
            char const *e = cs_parse_word(*p_state, get_input());
            p_quoted_item = p_item = std::string_view{
                p_input_beg, std::size_t(e - p_input_beg)
            };
            p_input_beg = e;
            break;
        }
    }
    skip_until_item();
    if ((p_input_beg != p_input_end) && (*p_input_beg == ';')) {
        ++p_input_beg;
    }
    return true;
}
2021-03-20 19:34:26 +01:00
/* Counts the items left in the input by calling parse() until it reports
 * that no further item is available. The input is consumed in the process.
 */
LIBCUBESCRIPT_EXPORT std::size_t cs_list_parser::count() {
    size_t nitems = 0;
    for (; parse(); ++nitems) {
        /* each successful parse() accounts for one item */
    }
    return nitems;
}
2021-03-20 19:34:26 +01:00
/* Returns the most recently parsed item as a string reference. When the
 * item came from a double-quoted string, it is passed through
 * cs_unescape_string first; any other item is returned verbatim.
 */
LIBCUBESCRIPT_EXPORT cs_strref cs_list_parser::get_item() const {
    bool const was_quoted = (
        !p_quoted_item.empty() && (p_quoted_item.front() == '"')
    );
    if (!was_quoted) {
        return cs_strref{*p_state, p_item};
    }
    cs_charbuf unescaped{*p_state};
    cs_unescape_string(std::back_inserter(unescaped), p_item);
    return cs_strref{*p_state, unescaped.str()};
}
2021-03-20 19:34:26 +01:00
/* Advances the input past any run of whitespace (space, tab, CR, LF) and
 * `//` comments, leaving it at the first character of the next item or at
 * the end of the input. A comment extends up to, but not including, the
 * next LF; that LF is then consumed as whitespace on the next round.
 */
LIBCUBESCRIPT_EXPORT void cs_list_parser::skip_until_item() {
    auto is_blank = [](char ch) {
        return (ch == ' ') || (ch == '\t') || (ch == '\r') || (ch == '\n');
    };
    for (;;) {
        while ((p_input_beg != p_input_end) && is_blank(*p_input_beg)) {
            ++p_input_beg;
        }
        /* a comment needs at least two characters, both of them slashes */
        bool const at_comment = (
            ((p_input_end - p_input_beg) >= 2) &&
            (p_input_beg[0] == '/') && (p_input_beg[1] == '/')
        );
        if (!at_comment) {
            return;
        }
        p_input_beg = std::find(p_input_beg, p_input_end, '\n');
    }
}
2016-09-21 21:02:13 +02:00
} /* namespace cscript */