2017-06-20 21:21:39 +02:00
|
|
|
#include <cubescript/cubescript.hh>
|
2016-08-15 03:19:59 +02:00
|
|
|
|
2021-03-23 22:17:25 +01:00
|
|
|
#include <cmath>
|
|
|
|
#include <cctype>
|
2021-04-08 23:33:00 +02:00
|
|
|
#include <limits>
|
2021-03-31 01:10:58 +02:00
|
|
|
#include <iterator>
|
2021-03-23 22:17:25 +01:00
|
|
|
|
2021-04-08 23:33:00 +02:00
|
|
|
#include "cs_parser.hh"
|
2016-08-15 03:19:59 +02:00
|
|
|
|
2021-03-23 23:32:25 +01:00
|
|
|
namespace cubescript {
|
2016-08-15 03:19:59 +02:00
|
|
|
|
2021-03-23 02:00:11 +01:00
|
|
|
/* string/word parsers are also useful to have public */
|
|
|
|
|
2021-03-23 23:29:32 +01:00
|
|
|
/* Scans a double-quoted string literal located at the start of `str`.
 *
 * If `str` is empty or does not begin with a double quote, nothing is
 * consumed: `str.data()` is returned and `nlines` is set to 0.
 *
 * Otherwise the literal is scanned up to its closing quote. A `^` escapes
 * the following character; both `^` and `\` may precede a line break
 * (CR, LF or CRLF) to continue the literal on the next line, and a `\`
 * followed by anything else ends the scan. `nlines` receives 1 plus the
 * number of such escaped line breaks.
 *
 * Returns a pointer just past the closing quote. Throws `error` with the
 * message "unfinished string '...'" when the closing quote is missing.
 */
LIBCUBESCRIPT_EXPORT char const *parse_string(
    state &cs, std::string_view str, size_t &nlines
) {
    nlines = 0;
    if (str.empty() || (str.front() != '\"')) {
        return str.data();
    }
    /* data() + size() is a valid one-past-the-end pointer; indexing the
     * view with size() is outside the contract of operator[]
     */
    char const *const orig = str.data();
    char const *const end = orig + str.size();
    char const *beg = orig + 1;
    size_t nl = 1;
    bool scanning = true;
    while (scanning && (beg != end)) {
        switch (*beg) {
            case '\r':
            case '\n':
            case '\"':
                /* a bare line break or the closing quote ends the scan */
                scanning = false;
                break;
            case '^':
            case '\\': {
                /* a backslash is only valid directly before a line break */
                bool const needs_newline = (*beg == '\\');
                if (++beg == end) {
                    scanning = false;
                    break;
                }
                if ((*beg == '\r') || (*beg == '\n')) {
                    char const c = *beg++;
                    ++nl;
                    /* treat CRLF as a single line break */
                    if ((beg != end) && (c == '\r') && (*beg == '\n')) {
                        ++beg;
                    }
                } else if (needs_newline) {
                    scanning = false;
                } else {
                    /* skip the escaped character */
                    ++beg;
                }
                break;
            }
            default:
                ++beg;
                break;
        }
    }
    nlines = nl;
    if ((beg == end) || (*beg != '\"')) {
        throw error{
            cs, "unfinished string '%s'",
            std::string_view{orig, std::size_t(beg - orig)}
        };
    }
    return beg + 1;
}
|
2016-09-21 21:02:13 +02:00
|
|
|
|
2021-03-23 23:29:32 +01:00
|
|
|
/* Finds the end of the word that starts at the beginning of `str`.
 *
 * A word ends at a double quote, semicolon, space, tab, CR, LF, an
 * unmatched `]` or `)`, or the start of a `//` comment. Bracketed and
 * parenthesized groups are skipped recursively and belong to the word.
 *
 * Returns a pointer to the terminating character, or to the end of `str`
 * when the word runs until there. Throws `error` ("missing \"]\"" or
 * "missing \")\"") when a group is not closed.
 */
LIBCUBESCRIPT_EXPORT char const *parse_word(
    state &cs, std::string_view str
) {
    static constexpr std::string_view delims{"\"/;()[] \t\r\n"};
    /* use data() rather than operator[]: the view may be empty (the
     * recursive calls below pass an empty view for a trailing '[' or '(')
     */
    char const *it = str.data();
    char const *const end = it + str.size();
    for (; it != end; ++it) {
        it = std::find_first_of(it, end, delims.begin(), delims.end());
        if (it == end) {
            return it;
        }
        switch (*it) {
            case '"':
            case ';':
            case ' ':
            case '\t':
            case '\r':
            case '\n':
            case ']':
            case ')':
                return it;
            case '/':
                /* only a double slash (comment) terminates the word */
                if (((end - it) > 1) && (it[1] == '/')) {
                    return it;
                }
                break;
            case '[':
                ++it;
                it = parse_word(cs, std::string_view{
                    it, std::size_t(end - it)
                });
                if ((it == end) || (*it != ']')) {
                    throw error{cs, "missing \"]\""};
                }
                break;
            case '(':
                ++it;
                it = parse_word(cs, std::string_view{
                    it, std::size_t(end - it)
                });
                if ((it == end) || (*it != ')')) {
                    throw error{cs, "missing \")\""};
                }
                break;
        }
    }
    return it;
}
|
|
|
|
|
2021-03-23 22:17:25 +01:00
|
|
|
/* Returns the first position in [beg, end) that is not whitespace as
 * classified by std::isspace, or `end` if the whole range is whitespace.
 */
static inline char const *p_skip_white(char const *beg, char const *end) {
    /* <cctype> functions are only defined for values representable as
     * unsigned char (or EOF), so convert before classifying
     */
    while ((beg != end) && std::isspace(static_cast<unsigned char>(*beg))) {
        ++beg;
    }
    return beg;
}
|
|
|
|
|
|
|
|
/* Stores the range [nbeg, nend) into `*end`; a null `end` means the
 * caller is not interested in the remainder and nothing is written.
 */
static inline void p_set_end(
    char const *nbeg, char const *nend, std::string_view *end
) {
    if (end) {
        *end = std::string_view{nbeg, std::size_t(nend - nbeg)};
    }
}
|
|
|
|
/* this function assumes the input is definitely a hex digit */
|
2021-03-23 23:29:32 +01:00
|
|
|
static inline integer_type p_hexd_to_int(char c) {
|
2021-03-23 22:17:25 +01:00
|
|
|
if (c >= 97) { /* a-f */
|
|
|
|
return (c - 'a') + 10;
|
|
|
|
} else if (c >= 65) { /* A-F */
|
|
|
|
return (c - 'A') + 10;
|
|
|
|
}
|
|
|
|
/* 0-9 */
|
|
|
|
return c - '0';
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Consumes an optional leading sign at `input`.
 * Advances `input` past a '+' or '-' and returns true only for '-'.
 * The caller must ensure `input` points at a readable character.
 */
static inline bool p_check_neg(char const *&input) {
    switch (*input) {
        case '-':
            ++input;
            return true;
        case '+':
            ++input;
            return false;
        default:
            return false;
    }
}
|
|
|
|
|
2021-03-23 23:29:32 +01:00
|
|
|
/* Parses an integer from the start of `input`.
 *
 * Leading whitespace and an optional sign are skipped. The digits may be
 * decimal, hexadecimal with a `0x`/`0X` prefix, or binary with a
 * `0b`/`0B` prefix. Parsing stops at the first character that is not a
 * digit of the selected base.
 *
 * If `endstr` is non-null it receives the unparsed remainder of the
 * input; when no digits were consumed it receives the whole input.
 * Returns the parsed value (0 when nothing was parsed).
 */
integer_type parse_int(std::string_view input, std::string_view *endstr) {
    /* data() is valid even for an empty view, unlike input[0] */
    char const *const orig = input.data();
    char const *const end = orig + input.size();
    char const *beg = p_skip_white(orig, end);
    if (beg == end) {
        p_set_end(orig, end, endstr);
        return integer_type(0);
    }
    bool const neg = p_check_neg(beg);
    /* detect and skip a base prefix */
    int base = 10;
    if (((end - beg) >= 2) && (beg[0] == '0')) {
        switch (beg[1]) {
            case 'x':
            case 'X':
                base = 16;
                break;
            case 'b':
            case 'B':
                base = 2;
                break;
            default:
                break;
        }
        if (base != 10) {
            beg += 2;
        }
    }
    integer_type ret = 0;
    char const *past = beg;
    switch (base) {
        case 16:
            /* <cctype> needs an unsigned char value */
            while (
                (past != end) &&
                std::isxdigit(static_cast<unsigned char>(*past))
            ) {
                ret = ret * 16 + p_hexd_to_int(*past++);
            }
            break;
        case 2:
            while ((past != end) && ((*past == '0') || (*past == '1'))) {
                ret = ret * 2 + (*past++ - '0');
            }
            break;
        default:
            while (
                (past != end) &&
                std::isdigit(static_cast<unsigned char>(*past))
            ) {
                ret = ret * 10 + (*past++ - '0');
            }
            break;
    }
    /* no digits consumed: report the entire input as unparsed */
    p_set_end((past == beg) ? orig : past, end, endstr);
    if (neg) {
        return -ret;
    }
    return ret;
}
|
|
|
|
|
|
|
|
template<bool Hex, char e1 = Hex ? 'p' : 'e', char e2 = Hex ? 'P' : 'E'>
|
2021-03-23 23:29:32 +01:00
|
|
|
static inline bool p_read_exp(char const *&beg, char const *end, integer_type &fn) {
|
2021-03-23 22:17:25 +01:00
|
|
|
if (beg == end) {
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
if ((*beg != e1) && (*beg != e2)) {
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
if (++beg == end) {
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
bool neg = p_check_neg(beg);
|
|
|
|
if ((beg == end) || !std::isdigit(*beg)) {
|
|
|
|
return false;
|
|
|
|
}
|
2021-03-23 23:29:32 +01:00
|
|
|
integer_type exp = 0;
|
2021-03-23 22:17:25 +01:00
|
|
|
while ((beg != end) && std::isdigit(*beg)) {
|
|
|
|
exp = exp * 10 + (*beg++ - '0');
|
|
|
|
}
|
|
|
|
if (neg) {
|
|
|
|
exp = -exp;
|
|
|
|
}
|
|
|
|
fn += exp;
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
template<bool Hex>
|
|
|
|
static inline bool parse_gen_float(
|
2021-03-23 23:29:32 +01:00
|
|
|
char const *&beg, char const *end, std::string_view *endstr, float_type &ret
|
2021-03-23 22:17:25 +01:00
|
|
|
) {
|
2021-03-23 23:29:32 +01:00
|
|
|
auto read_digits = [&beg, end](double r, integer_type &n) {
|
2021-03-23 22:17:25 +01:00
|
|
|
while (
|
|
|
|
(beg != end) &&
|
|
|
|
(Hex ? std::isxdigit(*beg) : std::isdigit(*beg))
|
|
|
|
) {
|
|
|
|
if (Hex) {
|
|
|
|
r = r * 16.0 + double(p_hexd_to_int(*beg));
|
|
|
|
} else {
|
|
|
|
r = r * 10.0 + double(*beg - '0');
|
|
|
|
}
|
|
|
|
++n;
|
|
|
|
++beg;
|
|
|
|
}
|
|
|
|
return r;
|
|
|
|
};
|
2021-03-23 23:29:32 +01:00
|
|
|
integer_type wn = 0, fn = 0;
|
2021-03-23 22:17:25 +01:00
|
|
|
double r = read_digits(0.0, wn);
|
|
|
|
if ((beg != end) && (*beg == '.')) {
|
|
|
|
++beg;
|
|
|
|
r = read_digits(r, fn);
|
|
|
|
}
|
|
|
|
if (!wn && !fn) {
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
fn = -fn;
|
|
|
|
p_set_end(beg, end, endstr); /* we have a valid number until here */
|
|
|
|
if (p_read_exp<Hex>(beg, end, fn)) {
|
|
|
|
p_set_end(beg, end, endstr);
|
|
|
|
}
|
|
|
|
if (Hex) {
|
2021-03-23 23:29:32 +01:00
|
|
|
ret = float_type(ldexp(r, fn * 4));
|
2021-03-23 22:17:25 +01:00
|
|
|
} else {
|
2021-03-23 23:29:32 +01:00
|
|
|
ret = float_type(r * pow(10, fn));
|
2021-03-23 22:17:25 +01:00
|
|
|
}
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
2021-03-23 23:29:32 +01:00
|
|
|
/* Parses a floating point number from the start of `input`.
 *
 * Leading whitespace and an optional sign are skipped; a `0x`/`0X`
 * prefix selects hexadecimal notation, otherwise decimal is used.
 *
 * If `endstr` is non-null it receives the unparsed remainder of the
 * input, or the whole input when no number could be parsed. Returns the
 * parsed value, or 0 when nothing was parsed.
 */
float_type parse_float(std::string_view input, std::string_view *endstr) {
    /* data() is valid even for an empty view, unlike input[0] */
    char const *const orig = input.data();
    char const *const end = orig + input.size();
    char const *beg = p_skip_white(orig, end);
    if (beg == end) {
        p_set_end(orig, end, endstr);
        return float_type(0);
    }
    bool const neg = p_check_neg(beg);
    float_type ret = float_type(0);
    bool const hex = (
        ((end - beg) >= 2) && (beg[0] == '0') &&
        ((beg[1] == 'x') || (beg[1] == 'X'))
    );
    bool parsed;
    if (hex) {
        beg += 2;
        parsed = parse_gen_float<true>(beg, end, endstr, ret);
    } else {
        parsed = parse_gen_float<false>(beg, end, endstr, ret);
    }
    if (!parsed) {
        /* nothing usable: hand the entire input back to the caller */
        p_set_end(orig, end, endstr);
        return ret;
    }
    if (neg) {
        return -ret;
    }
    return ret;
}
|
|
|
|
|
|
|
|
/* Checks that `s` cannot be mistaken for a numeric literal.
 *
 * A name is rejected when it starts with a digit, with a sign followed
 * by a digit, with a sign followed by `.` and a digit, or with `.`
 * followed by a digit. Anything else is accepted, including a lone
 * `+`, `-` or `.`. An empty view has no leading character that could
 * clash with a numeric literal and therefore passes this check.
 */
bool is_valid_name(std::string_view s) {
    /* bounds-checked digit test; <cctype> needs an unsigned char value */
    auto digit_at = [s](std::size_t i) {
        return (
            (i < s.size()) &&
            (std::isdigit(static_cast<unsigned char>(s[i])) != 0)
        );
    };
    if (s.empty()) {
        return true;
    }
    /* names cannot start with numbers (clashes with numeric literals) */
    if (digit_at(0)) {
        return false;
    }
    switch (s[0]) {
        /* more numeric literal clashes */
        case '+':
        case '-':
            if (digit_at(1)) {
                return false;
            }
            return !((s.size() > 1) && (s[1] == '.') && digit_at(2));
        case '.':
            return !digit_at(1);
        /* other than that a name can be mostly anything */
        default:
            return true;
    }
}
|
|
|
|
|
2021-04-08 23:33:00 +02:00
|
|
|
/* Consumes the quoted string at the current source position.
 * Advances `source` past the literal, bumps `current_line` by the number
 * of line breaks inside it and returns the contents between the quotes
 * (escapes are left as written). The current character is expected to
 * be the opening quote.
 */
std::string_view parser_state::get_str() {
    char const *const first = source;
    size_t lines;
    source = parse_string(
        *ts.pstate, std::string_view{first, std::size_t(send - first)}, lines
    );
    /* parse_string counts the starting line as well */
    current_line += lines - 1;
    std::string_view const quoted{first, std::size_t(source - first)};
    /* strip the opening and closing quote */
    return quoted.substr(1, quoted.size() - 2);
}
|
|
|
|
|
|
|
|
/* Consumes the quoted string at the current position (see get_str) and
 * returns its contents passed through unescape_string in a new buffer.
 */
charbuf parser_state::get_str_dup() {
    charbuf out{ts};
    auto const raw = get_str();
    unescape_string(std::back_inserter(out), raw);
    return out;
}
|
|
|
|
|
|
|
|
std::string_view parser_state::read_macro_name() {
|
|
|
|
char const *op = source;
|
|
|
|
char c = current();
|
|
|
|
if (!isalpha(c) && (c != '_')) {
|
|
|
|
return std::string_view{};
|
|
|
|
}
|
|
|
|
for (; isalnum(c) || (c == '_'); c = current()) {
|
|
|
|
next_char();
|
|
|
|
}
|
|
|
|
return std::string_view{op, std::size_t(source - op)};
|
|
|
|
}
|
|
|
|
|
|
|
|
char parser_state::skip_until(std::string_view chars) {
|
|
|
|
char c = current();
|
|
|
|
while (c && (chars.find(c) == std::string_view::npos)) {
|
|
|
|
next_char();
|
|
|
|
c = current();
|
|
|
|
}
|
|
|
|
return c;
|
|
|
|
}
|
|
|
|
|
|
|
|
char parser_state::skip_until(char cf) {
|
|
|
|
char c = current();
|
|
|
|
while (c && (c != cf)) {
|
|
|
|
next_char();
|
|
|
|
c = current();
|
|
|
|
}
|
|
|
|
return c;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* True for horizontal whitespace: space, tab or carriage return. */
static bool is_hspace(char c) {
    switch (c) {
        case ' ':
        case '\t':
        case '\r':
            return true;
        default:
            return false;
    }
}
|
|
|
|
|
|
|
|
void parser_state::skip_comments() {
|
|
|
|
for (;;) {
|
|
|
|
for (char c = current(); is_hspace(c); c = current()) {
|
|
|
|
next_char();
|
|
|
|
}
|
|
|
|
if (current() == '\\') {
|
|
|
|
char c = current(1);
|
|
|
|
if ((c != '\r') && (c != '\n')) {
|
|
|
|
throw error{*ts.pstate, "invalid line break"};
|
|
|
|
}
|
|
|
|
/* skip backslash */
|
|
|
|
next_char();
|
|
|
|
/* skip CR or LF */
|
|
|
|
next_char();
|
|
|
|
/* when CR, try also skipping LF; covers \r, \n, \r\n */
|
|
|
|
if ((c == '\r') && (current(1) == '\n')) {
|
|
|
|
next_char();
|
|
|
|
}
|
|
|
|
/* skip whitespace on new line */
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
if ((current() != '/') || (current(1) != '/')) {
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
while (current() != '\n') {
|
|
|
|
next_char();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Consumes the word at the current position (as delimited by
 * parse_word) and returns it; the result is empty when the current
 * character already terminates a word.
 */
std::string_view parser_state::get_word() {
    char const *const first = source;
    std::string_view const rest{first, std::size_t(send - first)};
    source = parse_word(*ts.pstate, rest);
    return std::string_view{first, std::size_t(source - first)};
}
|
|
|
|
|
|
|
|
static inline int ret_code(int type, int def = 0) {
|
|
|
|
if (type >= VAL_ANY) {
|
|
|
|
return def;
|
|
|
|
}
|
|
|
|
return type << BC_INST_RET;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Consumes the quoted string at the current position and emits it,
 * unescaped, as an inline string value: one BC_INST_VAL | BC_RET_STRING
 * word carrying the length in its upper bits, followed by the string
 * bytes zero-padded to whole 32-bit words (always at least one
 * terminating zero byte).
 */
static inline void compileunescapestr(parser_state &gs) {
    auto const str = gs.get_str();
    auto &code = gs.gs.code;
    code.push_back(BC_INST_VAL | BC_RET_STRING);
    code.reserve(code.size() + str.size() / sizeof(uint32_t) + 1);
    /* scratch buffer sized after the spare capacity of the code vector */
    size_t const bufs = (code.capacity() - code.size()) * sizeof(uint32_t);
    auto alloc = std_allocator<char>{gs.ts.istate};
    auto *buf = alloc.allocate(bufs + 1);
    char *wbuf = unescape_string(&buf[0], str);
    auto const len = wbuf - buf;
    /* zero the tail of the last word, including the terminator */
    memset(wbuf, 0, sizeof(uint32_t) - len % sizeof(uint32_t));
    code.back() |= len << 8;
    uint32_t *ubuf = reinterpret_cast<uint32_t *>(buf);
    code.append(ubuf, ubuf + (len / sizeof(uint32_t) + 1));
    alloc.deallocate(buf, bufs + 1);
}
|
|
|
|
|
|
|
|
static bool compilearg(
|
|
|
|
parser_state &gs, int wordtype, charbuf *word = nullptr
|
|
|
|
);
|
|
|
|
|
|
|
|
static void compilelookup(parser_state &gs, int ltype) {
|
|
|
|
charbuf lookup{gs.ts};
|
|
|
|
gs.next_char();
|
|
|
|
switch (gs.current()) {
|
|
|
|
case '(':
|
|
|
|
case '[':
|
|
|
|
if (!compilearg(gs, VAL_STRING)) {
|
|
|
|
goto invalid;
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
case '$':
|
|
|
|
compilelookup(gs, VAL_STRING);
|
|
|
|
break;
|
|
|
|
case '\"':
|
|
|
|
lookup = gs.get_str_dup();
|
|
|
|
lookup.push_back('\0');
|
|
|
|
goto lookupid;
|
|
|
|
default: {
|
|
|
|
lookup.append(gs.get_word());
|
|
|
|
if (lookup.empty()) goto invalid;
|
|
|
|
lookup.push_back('\0');
|
|
|
|
lookupid:
|
|
|
|
ident &id = gs.ts.istate->new_ident(
|
|
|
|
*gs.ts.pstate, lookup.str_term(), IDENT_FLAG_UNKNOWN
|
|
|
|
);
|
|
|
|
switch (id.get_type()) {
|
|
|
|
case ident_type::IVAR:
|
2021-04-09 00:41:55 +02:00
|
|
|
gs.gs.code.push_back(
|
2021-04-08 23:33:00 +02:00
|
|
|
BC_INST_IVAR | ret_code(ltype, BC_RET_INT) |
|
|
|
|
(id.get_index() << 8)
|
|
|
|
);
|
|
|
|
switch (ltype) {
|
|
|
|
case VAL_POP:
|
2021-04-09 00:41:55 +02:00
|
|
|
gs.gs.code.pop_back();
|
2021-04-08 23:33:00 +02:00
|
|
|
break;
|
|
|
|
case VAL_CODE:
|
2021-04-09 00:41:55 +02:00
|
|
|
gs.gs.code.push_back(BC_INST_COMPILE);
|
2021-04-08 23:33:00 +02:00
|
|
|
break;
|
|
|
|
case VAL_IDENT:
|
2021-04-09 00:41:55 +02:00
|
|
|
gs.gs.code.push_back(BC_INST_IDENT_U);
|
2021-04-08 23:33:00 +02:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
return;
|
|
|
|
case ident_type::FVAR:
|
2021-04-09 00:41:55 +02:00
|
|
|
gs.gs.code.push_back(
|
2021-04-08 23:33:00 +02:00
|
|
|
BC_INST_FVAR | ret_code(ltype, BC_RET_FLOAT) |
|
|
|
|
(id.get_index() << 8)
|
|
|
|
);
|
|
|
|
switch (ltype) {
|
|
|
|
case VAL_POP:
|
2021-04-09 00:41:55 +02:00
|
|
|
gs.gs.code.pop_back();
|
2021-04-08 23:33:00 +02:00
|
|
|
break;
|
|
|
|
case VAL_CODE:
|
2021-04-09 00:41:55 +02:00
|
|
|
gs.gs.code.push_back(BC_INST_COMPILE);
|
2021-04-08 23:33:00 +02:00
|
|
|
break;
|
|
|
|
case VAL_IDENT:
|
2021-04-09 00:41:55 +02:00
|
|
|
gs.gs.code.push_back(BC_INST_IDENT_U);
|
2021-04-08 23:33:00 +02:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
return;
|
|
|
|
case ident_type::SVAR:
|
|
|
|
switch (ltype) {
|
|
|
|
case VAL_POP:
|
|
|
|
return;
|
|
|
|
default:
|
2021-04-09 00:41:55 +02:00
|
|
|
gs.gs.code.push_back(
|
2021-04-08 23:33:00 +02:00
|
|
|
BC_INST_SVAR | ret_code(ltype, BC_RET_STRING) |
|
|
|
|
(id.get_index() << 8)
|
|
|
|
);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
goto done;
|
|
|
|
case ident_type::ALIAS:
|
|
|
|
switch (ltype) {
|
|
|
|
case VAL_POP:
|
|
|
|
return;
|
|
|
|
case VAL_COND:
|
2021-04-09 00:41:55 +02:00
|
|
|
gs.gs.code.push_back(
|
2021-04-08 23:33:00 +02:00
|
|
|
BC_INST_LOOKUP | (id.get_index() << 8)
|
|
|
|
);
|
|
|
|
break;
|
|
|
|
default:
|
2021-04-09 00:41:55 +02:00
|
|
|
gs.gs.code.push_back(
|
2021-04-08 23:33:00 +02:00
|
|
|
BC_INST_LOOKUP |
|
|
|
|
ret_code(ltype, BC_RET_STRING) |
|
|
|
|
(id.get_index() << 8)
|
|
|
|
);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
goto done;
|
|
|
|
case ident_type::COMMAND: {
|
|
|
|
std::uint32_t comtype = BC_INST_COM, numargs = 0;
|
|
|
|
auto fmt = static_cast<command_impl &>(id).get_args();
|
|
|
|
for (char c: fmt) {
|
|
|
|
switch (c) {
|
|
|
|
case 's':
|
2021-04-09 00:41:55 +02:00
|
|
|
gs.gs.gen_val_string(std::string_view{});
|
2021-04-08 23:33:00 +02:00
|
|
|
numargs++;
|
|
|
|
break;
|
|
|
|
case 'i':
|
2021-04-09 00:41:55 +02:00
|
|
|
gs.gs.gen_val_integer();
|
2021-04-08 23:33:00 +02:00
|
|
|
numargs++;
|
|
|
|
break;
|
|
|
|
case 'b':
|
2021-04-09 00:41:55 +02:00
|
|
|
gs.gs.gen_val_integer(std::numeric_limits<integer_type>::min());
|
2021-04-08 23:33:00 +02:00
|
|
|
numargs++;
|
|
|
|
break;
|
|
|
|
case 'f':
|
2021-04-09 00:41:55 +02:00
|
|
|
gs.gs.gen_val_float();
|
2021-04-08 23:33:00 +02:00
|
|
|
numargs++;
|
|
|
|
break;
|
|
|
|
case 'F':
|
2021-04-09 00:41:55 +02:00
|
|
|
gs.gs.code.push_back(BC_INST_DUP | BC_RET_FLOAT);
|
2021-04-08 23:33:00 +02:00
|
|
|
numargs++;
|
|
|
|
break;
|
|
|
|
case 'E':
|
|
|
|
case 't':
|
2021-04-09 00:41:55 +02:00
|
|
|
gs.gs.gen_val_null();
|
2021-04-08 23:33:00 +02:00
|
|
|
numargs++;
|
|
|
|
break;
|
|
|
|
case 'e':
|
2021-04-09 00:41:55 +02:00
|
|
|
gs.gs.gen_block();
|
2021-04-08 23:33:00 +02:00
|
|
|
numargs++;
|
|
|
|
break;
|
|
|
|
case 'r':
|
2021-04-09 00:41:55 +02:00
|
|
|
gs.gs.gen_val_ident();
|
2021-04-08 23:33:00 +02:00
|
|
|
numargs++;
|
|
|
|
break;
|
|
|
|
case '$':
|
2021-04-09 00:41:55 +02:00
|
|
|
gs.gs.gen_val_ident(id);
|
2021-04-08 23:33:00 +02:00
|
|
|
numargs++;
|
|
|
|
break;
|
|
|
|
case 'N':
|
2021-04-09 00:41:55 +02:00
|
|
|
gs.gs.gen_val_integer(-1);
|
2021-04-08 23:33:00 +02:00
|
|
|
numargs++;
|
|
|
|
break;
|
|
|
|
case 'C':
|
|
|
|
comtype = BC_INST_COM_C;
|
|
|
|
goto compilecomv;
|
|
|
|
case 'V':
|
|
|
|
comtype = BC_INST_COM_V;
|
|
|
|
goto compilecomv;
|
|
|
|
case '1':
|
|
|
|
case '2':
|
|
|
|
case '3':
|
|
|
|
case '4':
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
2021-04-09 00:41:55 +02:00
|
|
|
gs.gs.code.push_back(
|
2021-04-08 23:33:00 +02:00
|
|
|
comtype | ret_code(ltype) | (id.get_index() << 8)
|
|
|
|
);
|
2021-04-09 00:41:55 +02:00
|
|
|
gs.gs.code.push_back(
|
2021-04-08 23:33:00 +02:00
|
|
|
BC_INST_RESULT_ARG | ret_code(ltype)
|
|
|
|
);
|
|
|
|
goto done;
|
|
|
|
compilecomv:
|
2021-04-09 00:41:55 +02:00
|
|
|
gs.gs.code.push_back(
|
2021-04-08 23:33:00 +02:00
|
|
|
comtype | ret_code(ltype) | (id.get_index() << 8)
|
|
|
|
);
|
2021-04-09 00:41:55 +02:00
|
|
|
gs.gs.code.push_back(numargs);
|
|
|
|
gs.gs.code.push_back(
|
2021-04-08 23:33:00 +02:00
|
|
|
BC_INST_RESULT_ARG | ret_code(ltype)
|
|
|
|
);
|
|
|
|
goto done;
|
|
|
|
}
|
|
|
|
default:
|
|
|
|
goto invalid;
|
|
|
|
}
|
2021-04-09 00:41:55 +02:00
|
|
|
gs.gs.gen_val_string(lookup.str_term());
|
2021-04-08 23:33:00 +02:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
switch (ltype) {
|
|
|
|
case VAL_COND:
|
2021-04-09 00:41:55 +02:00
|
|
|
gs.gs.code.push_back(BC_INST_LOOKUP_U);
|
2021-04-08 23:33:00 +02:00
|
|
|
break;
|
|
|
|
default:
|
2021-04-09 00:41:55 +02:00
|
|
|
gs.gs.code.push_back(BC_INST_LOOKUP_U | ret_code(ltype));
|
2021-04-08 23:33:00 +02:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
done:
|
|
|
|
switch (ltype) {
|
|
|
|
case VAL_POP:
|
2021-04-09 00:41:55 +02:00
|
|
|
gs.gs.code.push_back(BC_INST_POP);
|
2021-04-08 23:33:00 +02:00
|
|
|
break;
|
|
|
|
case VAL_CODE:
|
2021-04-09 00:41:55 +02:00
|
|
|
gs.gs.code.push_back(BC_INST_COMPILE);
|
2021-04-08 23:33:00 +02:00
|
|
|
break;
|
|
|
|
case VAL_COND:
|
2021-04-09 00:41:55 +02:00
|
|
|
gs.gs.code.push_back(BC_INST_COND);
|
2021-04-08 23:33:00 +02:00
|
|
|
break;
|
|
|
|
case VAL_IDENT:
|
2021-04-09 00:41:55 +02:00
|
|
|
gs.gs.code.push_back(BC_INST_IDENT_U);
|
2021-04-08 23:33:00 +02:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
return;
|
|
|
|
invalid:
|
|
|
|
switch (ltype) {
|
|
|
|
case VAL_POP:
|
|
|
|
break;
|
|
|
|
case VAL_NULL:
|
|
|
|
case VAL_ANY:
|
|
|
|
case VAL_WORD:
|
|
|
|
case VAL_COND:
|
2021-04-09 00:41:55 +02:00
|
|
|
gs.gs.gen_val_null();
|
2021-04-08 23:33:00 +02:00
|
|
|
break;
|
|
|
|
default:
|
2021-04-09 00:41:55 +02:00
|
|
|
gs.gs.gen_val(ltype);
|
2021-04-08 23:33:00 +02:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Emits the block text in [str, send) as an inline string value.
 *
 * While copying, carriage returns are dropped and `//` comments are
 * removed up to (not including) the next LF; quoted strings are copied
 * verbatim, so comment markers inside them are preserved. The output is
 * one BC_INST_VAL | BC_RET_STRING word carrying the length in its upper
 * bits, followed by the bytes zero-padded to whole 32-bit words.
 * Always returns true.
 */
static bool compileblockstr(parser_state &gs, char const *str, char const *send) {
    auto &code = gs.gs.code;
    std::size_t const startc = code.size();
    code.push_back(BC_INST_VAL | BC_RET_STRING);
    code.reserve(code.size() + (send - str) / sizeof(uint32_t) + 1);
    auto alloc = std_allocator<char>{gs.ts.istate};
    /* the input length rounded up to whole words, plus the terminator */
    auto const asz = ((send - str) / sizeof(uint32_t) + 1) * sizeof(uint32_t);
    char *buf = alloc.allocate(asz);
    std::size_t len = 0;
    /* appends [from, to) to the scratch buffer */
    auto copy_span = [&buf, &len](char const *from, char const *to) {
        memcpy(&buf[len], from, std::size_t(to - from));
        len += (to - from);
    };
    std::string_view const stops{"\r/\"@]"};
    while (str < send) {
        /* copy the run of ordinary characters in one go */
        char const *const run = str;
        str = std::find_first_of(str, send, stops.begin(), stops.end());
        copy_span(run, str);
        if (str == send) {
            break;
        }
        switch (*str) {
            case '\r':
                ++str;
                break;
            case '\"': {
                char const *const quote = str;
                str = parse_string(
                    *gs.ts.pstate, std::string_view{str, send}
                );
                copy_span(quote, str);
                break;
            }
            case '/':
                if (((str + 1) != send) && (str[1] == '/')) {
                    str = std::find(str, send, '\n');
                } else {
                    buf[len++] = *str++;
                }
                break;
            case '@':
            case ']':
                buf[len++] = *str++;
                break;
        }
    }
    memset(&buf[len], '\0', sizeof(uint32_t) - len % sizeof(uint32_t));
    uint32_t *ubuf = reinterpret_cast<uint32_t *>(buf);
    code.append(ubuf, ubuf + (len / sizeof(uint32_t) + 1));
    code[startc] |= len << 8;
    alloc.deallocate(buf, asz);
    return true;
}
|
|
|
|
|
|
|
|
/* Compiles the expression following the `@` markers of a block
 * substitution.
 *
 *   `(`        compile the parenthesized expression
 *   `[`        compile the block as a string, then look it up by name
 *   `"`        quoted identifier name
 *   otherwise  macro name (see parser_state::read_macro_name)
 *
 * Returns false when nothing could be compiled, true otherwise.
 */
static bool compileblocksub(parser_state &gs) {
    auto &code = gs.gs.code;
    charbuf lookup{gs.ts};
    switch (gs.current()) {
        case '(':
            return compilearg(gs, VAL_ANY);
        case '[':
            if (!compilearg(gs, VAL_STRING)) {
                return false;
            }
            code.push_back(BC_INST_LOOKUP_U);
            return true;
        case '\"':
            lookup = gs.get_str_dup();
            break;
        default:
            lookup.append(gs.read_macro_name());
            if (lookup.empty()) {
                return false;
            }
            break;
    }
    lookup.push_back('\0');
    ident &id = gs.ts.istate->new_ident(
        *gs.ts.pstate, lookup.str_term(), IDENT_FLAG_UNKNOWN
    );
    switch (id.get_type()) {
        case ident_type::IVAR:
            code.push_back(BC_INST_IVAR | (id.get_index() << 8));
            return true;
        case ident_type::FVAR:
            code.push_back(BC_INST_FVAR | (id.get_index() << 8));
            return true;
        case ident_type::SVAR:
            code.push_back(BC_INST_SVAR | (id.get_index() << 8));
            return true;
        case ident_type::ALIAS:
            code.push_back(BC_INST_LOOKUP | (id.get_index() << 8));
            return true;
        default:
            break;
    }
    /* any other identifier type: look the name up at run time */
    gs.gs.gen_val_string(lookup.str_term());
    code.push_back(BC_INST_LOOKUP_U);
    return true;
}
|
|
|
|
|
|
|
|
/* Compiles a `[...]` block; the opening bracket is already consumed.
 *
 * The block is scanned up to its matching `]`, tracking nested brackets
 * and skipping quoted strings and `//` comments. A run of `@` whose
 * length equals the current nesting depth starts a substitution: the
 * text before it and the substituted expression are emitted as separate
 * pieces to be concatenated. Shorter runs are left in the text, longer
 * runs throw `error` ("too many @s"); a missing `]` throws `error` too.
 *
 * `wordtype` selects how the resulting value is represented.
 */
static void compileblockmain(parser_state &gs, int wordtype) {
    auto &code = gs.gs.code;
    char const *start = gs.source;
    size_t curline = gs.current_line;
    int concs = 0;
    int brak = 1;
    while (brak) {
        switch (gs.skip_until("@\"/[]")) {
            case '\0':
                throw error{*gs.ts.pstate, "missing \"]\""};
            case '\"':
                gs.get_str();
                break;
            case '/':
                gs.next_char();
                if (gs.current() == '/') {
                    gs.skip_until('\n');
                }
                break;
            case '[':
                gs.next_char();
                ++brak;
                break;
            case ']':
                gs.next_char();
                --brak;
                break;
            case '@': {
                char const *const esc = gs.source;
                int level = 0;
                for (; gs.current() == '@'; gs.next_char()) {
                    ++level;
                }
                if (brak > level) {
                    /* belongs to an outer block; keep as plain text */
                    continue;
                }
                if (brak < level) {
                    throw error{*gs.ts.pstate, "too many @s"};
                }
                if (compileblockstr(gs, start, esc)) {
                    concs++;
                }
                if (compileblocksub(gs)) {
                    concs++;
                }
                if (concs) {
                    start = gs.source;
                    curline = gs.current_line;
                }
                break;
            }
            default:
                gs.next_char();
                break;
        }
    }
    /* text between the last emitted piece and the closing bracket */
    bool const has_tail = (gs.source - 1) > start;
    if (has_tail) {
        if (!concs) {
            /* plain block without substitutions */
            switch (wordtype) {
                case VAL_POP:
                    return;
                case VAL_CODE:
                case VAL_COND: {
                    auto ret = gs.gs.gen_block(std::string_view{
                        start, gs.send
                    }, curline, BC_RET_NULL, ']');
                    gs.source = ret.second.data();
                    gs.send = ret.second.data() + ret.second.size();
                    gs.current_line = ret.first;
                    return;
                }
                case VAL_IDENT:
                    gs.gs.gen_val_ident(std::string_view{
                        start, std::size_t((gs.source - 1) - start)
                    });
                    return;
            }
        }
        compileblockstr(gs, start, gs.source - 1);
        if (concs > 1) {
            concs++;
        }
    }
    if (concs) {
        code.push_back(BC_INST_CONC_W | ret_code(wordtype) | (concs << 8));
    }
    /* whether any value has been emitted for this block so far */
    bool const produced = concs || has_tail;
    switch (wordtype) {
        case VAL_POP:
            if (produced) {
                code.push_back(BC_INST_POP);
            }
            break;
        case VAL_COND:
            if (produced) {
                code.push_back(BC_INST_COND);
            } else {
                gs.gs.gen_val_null();
            }
            break;
        case VAL_CODE:
            if (produced) {
                code.push_back(BC_INST_COMPILE);
            } else {
                gs.gs.gen_block();
            }
            break;
        case VAL_IDENT:
            if (produced) {
                code.push_back(BC_INST_IDENT_U);
            } else {
                gs.gs.gen_val_ident();
            }
            break;
        case VAL_STRING:
        case VAL_NULL:
        case VAL_ANY:
        case VAL_WORD:
            if (!produced) {
                gs.gs.gen_val_string();
            }
            break;
        default:
            if (!concs) {
                if (has_tail) {
                    code.push_back(BC_INST_FORCE | (wordtype << BC_INST_RET));
                } else {
                    gs.gs.gen_val(wordtype);
                }
            }
            break;
    }
}
|
|
|
|
|
|
|
|
/* Compiles a single argument at the current position, after skipping
 * whitespace and comments.
 *
 * The first character selects the form: a quoted string, a `$` lookup,
 * a parenthesized expression, a `[` block, or a bare word. `wordtype`
 * selects how the value is emitted. For VAL_WORD nothing is emitted;
 * the text is stored into `*word` instead when `word` is non-null.
 *
 * Returns false only when a bare word was expected but none is present;
 * all other forms return true.
 */
static bool compilearg(
    parser_state &gs, int wordtype, charbuf *word
) {
    auto &code = gs.gs.code;
    gs.skip_comments();
    switch (gs.current()) {
        case '\"':
            switch (wordtype) {
                case VAL_POP:
                    /* consume and discard */
                    gs.get_str();
                    break;
                case VAL_COND: {
                    size_t const line = gs.current_line;
                    auto s = gs.get_str_dup();
                    if (s.empty()) {
                        gs.gs.gen_val_null();
                    } else {
                        s.push_back('\0');
                        gs.gs.gen_block(s.str_term(), line);
                    }
                    break;
                }
                case VAL_CODE: {
                    auto s = gs.get_str_dup();
                    s.push_back('\0');
                    gs.gs.gen_block(s.str_term(), gs.current_line);
                    break;
                }
                case VAL_WORD:
                    if (word) {
                        *word = gs.get_str_dup();
                    }
                    break;
                case VAL_ANY:
                case VAL_STRING:
                    compileunescapestr(gs);
                    break;
                default: {
                    int const line = int(gs.current_line);
                    auto s = gs.get_str_dup();
                    s.push_back('\0');
                    gs.gs.gen_val(wordtype, s.str_term(), line);
                    break;
                }
            }
            return true;
        case '$':
            compilelookup(gs, wordtype);
            return true;
        case '(': {
            gs.next_char();
            std::size_t const start = code.size();
            gs.parse_block(VAL_ANY, ')');
            if (code.size() <= start) {
                /* empty expression: emit a default value */
                gs.gs.gen_val(wordtype);
                return true;
            }
            code.push_back(BC_INST_RESULT_ARG | ret_code(wordtype));
            switch (wordtype) {
                case VAL_POP:
                    code.push_back(BC_INST_POP);
                    break;
                case VAL_COND:
                    code.push_back(BC_INST_COND);
                    break;
                case VAL_CODE:
                    code.push_back(BC_INST_COMPILE);
                    break;
                case VAL_IDENT:
                    code.push_back(BC_INST_IDENT_U);
                    break;
            }
            return true;
        }
        case '[':
            gs.next_char();
            compileblockmain(gs, wordtype);
            return true;
        default:
            break;
    }
    /* bare word */
    switch (wordtype) {
        case VAL_POP:
            return !gs.get_word().empty();
        case VAL_COND:
        case VAL_CODE: {
            size_t const line = gs.current_line;
            auto const s = gs.get_word();
            if (s.empty()) {
                return false;
            }
            gs.gs.gen_block(s, line);
            return true;
        }
        case VAL_WORD: {
            auto const w = gs.get_word();
            if (word) {
                word->clear();
                word->append(w);
            }
            return !w.empty();
        }
        default: {
            int const line = int(gs.current_line);
            auto const s = gs.get_word();
            if (s.empty()) {
                return false;
            }
            gs.gs.gen_val(wordtype, s, line);
            return true;
        }
    }
}
|
|
|
|
|
|
|
|
/* Compile a call to the command `id`.
 *
 * The command's argument format string (`id->get_args()`) is walked one
 * character at a time; each character either compiles one argument from
 * the source or, when no argument is available, generates a default value.
 *
 * gs      - parser state the bytecode is appended to
 * id      - command whose format string and index are used
 * self    - ident pushed for the '$' format character
 * more    - in/out; whether further arguments may follow in the source
 * rettype - requested return type, encoded through ret_code()
 * limit   - when nonzero, no more than this many arguments are compiled
 *           from the source
 */
static void compile_cmd(
    parser_state &gs, command_impl *id, ident &self, bool &more, int rettype,
    std::uint32_t limit = 0
) {
    std::uint32_t comtype = BC_INST_COM;
    std::uint32_t numargs = 0;  /* all argument slots, including defaults */
    std::uint32_t numcargs = 0; /* slots that count against `limit` */
    std::uint32_t fakeargs = 0; /* slots filled with a generated default */
    bool rep = false;

    /* whether another argument may be pulled from the source right now */
    auto can_take = [&]() {
        return more && (!limit || (numcargs < limit));
    };

    /* one ordinary argument of type `vtype`; `gen_default` emits the
     * fallback value used when nothing could be compiled
     */
    auto plain_arg = [&](int vtype, auto &&gen_default) {
        if (can_take()) {
            more = compilearg(gs, vtype);
        }
        if (!can_take()) {
            if (rep) {
                /* inside a repetition: emit nothing, count nothing */
                return;
            }
            gen_default();
            ++fakeargs;
        }
        ++numargs;
        ++numcargs;
    };

    /* consume every remaining argument as VAL_ANY ('C' and 'V') */
    auto rest_args = [&]() {
        if (!can_take()) {
            return;
        }
        for (;;) {
            more = compilearg(gs, VAL_ANY);
            if (!can_take()) {
                return;
            }
            ++numargs;
            ++numcargs;
        }
    };

    /* the call instruction itself */
    auto emit_call = [&]() {
        gs.gs.code.push_back(
            comtype | ret_code(rettype) | (id->get_index() << 8)
        );
    };

    auto fmt = id->get_args();
    for (auto it = fmt.begin(); it != fmt.end(); ++it) {
        switch (*it) {
            case 's': /* string */
                if (can_take()) {
                    more = compilearg(gs, VAL_STRING);
                }
                if (!can_take()) {
                    if (rep) {
                        break;
                    }
                    gs.gs.gen_val_string();
                    ++fakeargs;
                } else if ((it + 1) == fmt.end()) {
                    /* last format character: any further arguments are
                     * compiled as strings and joined by BC_INST_CONC
                     */
                    int numconc = 1;
                    while ((more = compilearg(gs, VAL_STRING))) {
                        ++numconc;
                    }
                    if (numconc > 1) {
                        gs.gs.code.push_back(
                            BC_INST_CONC | BC_RET_STRING | (numconc << 8)
                        );
                    }
                }
                ++numargs;
                ++numcargs;
                break;
            case 'i': /* integer */
                plain_arg(VAL_INT, [&]() { gs.gs.gen_val_integer(); });
                break;
            case 'b': /* integer, INT_MIN default */
                plain_arg(VAL_INT, [&]() {
                    gs.gs.gen_val_integer(
                        std::numeric_limits<integer_type>::min()
                    );
                });
                break;
            case 'f': /* float */
                plain_arg(VAL_FLOAT, [&]() { gs.gs.gen_val_float(); });
                break;
            case 'F': /* float, prev-argument default */
                plain_arg(VAL_FLOAT, [&]() {
                    gs.gs.code.push_back(BC_INST_DUP | BC_RET_FLOAT);
                });
                break;
            case 't': /* any arg */
                plain_arg(VAL_ANY, [&]() { gs.gs.gen_val_null(); });
                break;
            case 'E': /* condition */
                plain_arg(VAL_COND, [&]() { gs.gs.gen_val_null(); });
                break;
            case 'e': /* code */
                plain_arg(VAL_CODE, [&]() { gs.gs.gen_block(); });
                break;
            case 'r': /* ident */
                plain_arg(VAL_IDENT, [&]() { gs.gs.gen_val_ident(); });
                break;
            case '$': /* self */
                gs.gs.gen_val_ident(self);
                ++numargs;
                break;
            case 'N': /* number of arguments */
                gs.gs.gen_val_integer(numargs - fakeargs);
                ++numargs;
                break;
            case 'C': /* concatenated string */
                comtype = BC_INST_COM_C;
                rest_args();
                emit_call();
                gs.gs.code.push_back(numargs);
                return;
            case 'V': /* varargs */
                comtype = BC_INST_COM_V;
                rest_args();
                emit_call();
                gs.gs.code.push_back(numargs);
                return;
            case '1': /* vararg repetition */
            case '2':
            case '3':
            case '4':
                if (can_take()) {
                    /* step back so the preceding format characters are
                     * processed again; the loop's ++it follows
                     */
                    int const back = *it - '0' + 1;
                    it -= back;
                    rep = true;
                }
                break;
        }
    }
    emit_call();
}
|
|
|
|
|
|
|
|
/* Compile a call to the alias `id`: every remaining argument is compiled
 * as VAL_ANY, then BC_INST_CALL (carrying the alias index) is emitted,
 * followed by a word holding the argument count. `more` is false on return.
 */
static void compile_alias(parser_state &gs, alias *id, bool &more) {
    std::uint32_t nargs = 0;
    while ((more = compilearg(gs, VAL_ANY))) {
        ++nargs;
    }
    auto &code = gs.gs.code;
    code.push_back(BC_INST_CALL | (id->get_index() << 8));
    code.push_back(nargs);
}
|
|
|
|
|
|
|
|
/* Compile a `local` statement: each remaining argument is compiled as
 * VAL_IDENT and the number of them is stored in the upper bits of the
 * emitted BC_INST_LOCAL instruction.
 */
static void compile_local(parser_state &gs, bool &more) {
    std::uint32_t nlocals = 0;
    while (more && (more = compilearg(gs, VAL_IDENT))) {
        ++nlocals;
    }
    gs.gs.code.push_back(BC_INST_LOCAL | (nlocals << 8));
}
|
|
|
|
|
|
|
|
/* Compile a `do`-style statement. One VAL_CODE argument is compiled if
 * available; `opcode` is emitted when that succeeded and BC_INST_NULL
 * otherwise, in both cases tagged with the requested return type.
 */
static void compile_do(
    parser_state &gs, bool &more, int rettype, int opcode
) {
    more = more && compilearg(gs, VAL_CODE);
    auto const inst = more ? opcode : BC_INST_NULL;
    gs.gs.code.push_back(inst | ret_code(rettype));
}
|
|
|
|
|
|
|
|
/* Compile an `if` statement.
 *
 * Up to three arguments are compiled: the condition (VAL_ANY) and two
 * VAL_CODE branches. When the branches were emitted as literal blocks
 * (their first instruction is BC_INST_BLOCK with the matching length),
 * their header instructions are rewritten in place into jump
 * instructions; otherwise a regular BC_INST_COM call to `id` is emitted.
 */
static void compile_if(
    parser_state &gs, ident *id, bool &more, int rettype
) {
    auto &code = gs.gs.code;

    /* turn the block at `start` (body length `len`) into an inline body:
     * its second word becomes BC_INST_ENTER_RESULT and the return type of
     * its last word is replaced with ours
     */
    auto inline_block = [&](std::size_t start, std::uint32_t len) {
        code[start + 1] = BC_INST_ENTER_RESULT;
        code[start + len] = (
            code[start + len] & ~BC_INST_RET_MASK
        ) | ret_code(rettype);
    };

    if (more) {
        more = compilearg(gs, VAL_ANY);
    }
    if (!more) {
        /* no condition at all */
        code.push_back(BC_INST_NULL | ret_code(rettype));
        return;
    }

    std::size_t const start1 = code.size();
    more = compilearg(gs, VAL_CODE);
    if (!more) {
        /* condition without any branch: drop it and yield null */
        code.push_back(BC_INST_POP);
        code.push_back(BC_INST_NULL | ret_code(rettype));
        return;
    }

    std::size_t const start2 = code.size();
    more = compilearg(gs, VAL_CODE);

    std::uint32_t const inst1 = code[start1];
    std::uint32_t const op1 = inst1 & ~BC_INST_RET_MASK;
    auto const len1 = std::uint32_t(start2 - (start1 + 1));
    bool const first_is_block = (op1 == (BC_INST_BLOCK | (len1 << 8)));

    if (!more) {
        /* only one branch was given */
        if (first_is_block) {
            code[start1] = (len1 << 8) | BC_INST_JUMP_B | BC_INST_FLAG_FALSE;
            inline_block(start1, len1);
            return;
        }
        gs.gs.gen_block();
    } else {
        std::uint32_t const inst2 = code[start2];
        std::uint32_t const op2 = inst2 & ~BC_INST_RET_MASK;
        auto const len2 = std::uint32_t(code.size() - (start2 + 1));
        if (op2 == (BC_INST_BLOCK | (len2 << 8))) {
            if (first_is_block) {
                /* both branches are literal blocks */
                code[start1] = (std::uint32_t(start2 - start1) << 8)
                    | BC_INST_JUMP_B | BC_INST_FLAG_FALSE;
                inline_block(start1, len1);
                code[start2] = (len2 << 8) | BC_INST_JUMP;
                inline_block(start2, len2);
                return;
            }
            if (op1 == (BC_INST_EMPTY | (len1 << 8))) {
                /* empty first branch, literal second branch */
                code[start1] = BC_INST_NULL | (inst2 & BC_INST_RET_MASK);
                code[start2] = (len2 << 8) | BC_INST_JUMP_B | BC_INST_FLAG_TRUE;
                inline_block(start2, len2);
                return;
            }
        }
    }
    /* nothing could be rewritten: call the command normally */
    code.push_back(BC_INST_COM | ret_code(rettype) | (id->get_index() << 8));
}
|
|
|
|
|
|
|
|
/* Compile an `&&` / `||` style statement for the ident `id`.
 *
 * Arguments are compiled as VAL_COND. With no arguments a constant
 * (BC_INST_TRUE for ID_AND, BC_INST_FALSE otherwise) is emitted. If every
 * argument after the first was emitted as a literal block, the block
 * headers are rewritten in place into BC_INST_JUMP_RESULT instructions;
 * otherwise the remaining arguments are compiled and a BC_INST_COM_V call
 * with the argument count is emitted.
 */
static void compile_and_or(
    parser_state &gs, ident *id, bool &more, int rettype
) {
    auto &code = gs.gs.code;
    auto is_and = [&]() {
        return ident_p{*id}.impl().p_type == ID_AND;
    };

    std::uint32_t nconds = 0;
    if (more) {
        more = compilearg(gs, VAL_COND);
    }
    if (!more) {
        code.push_back(
            (is_and() ? BC_INST_TRUE : BC_INST_FALSE) | ret_code(rettype)
        );
        return;
    }
    ++nconds;

    /* `first` marks where the second argument begins, `last` the start of
     * the most recently compiled one
     */
    std::size_t const first = code.size();
    std::size_t last = first;
    while ((more = compilearg(gs, VAL_COND))) {
        ++nconds;
        auto const blen = std::uint32_t(code.size() - (last + 1));
        if ((code[last] & ~BC_INST_RET_MASK) != (BC_INST_BLOCK | (blen << 8))) {
            /* not a literal block; leaves `more` set */
            break;
        }
        last = code.size();
    }

    if (more) {
        /* generic path: compile whatever is left and call the command */
        while ((more = compilearg(gs, VAL_COND))) {
            ++nconds;
        }
        code.push_back(
            BC_INST_COM_V | ret_code(rettype) | (id->get_index() << 8)
        );
        code.push_back(nconds);
        return;
    }

    std::uint32_t const op = is_and()
        ? (BC_INST_JUMP_RESULT | BC_INST_FLAG_FALSE)
        : (BC_INST_JUMP_RESULT | BC_INST_FLAG_TRUE);
    code.push_back(op);
    std::size_t const stop = code.size();
    /* walk the blocks, replacing each header with a jump whose operand is
     * the distance to `stop`
     */
    for (std::size_t pos = first; (pos + 1) < stop;) {
        std::uint32_t const len = code[pos] >> 8;
        code[pos] = std::uint32_t((stop - (pos + 1)) << 8) | op;
        code[pos + 1] = BC_INST_ENTER;
        code[pos + len] = (
            code[pos + len] & ~BC_INST_RET_MASK
        ) | ret_code(rettype);
        pos += len + 1;
    }
}
|
|
|
|
|
2021-04-09 00:41:55 +02:00
|
|
|
void parser_state::parse_block(int rettype, int brak) {
|
2021-04-08 23:33:00 +02:00
|
|
|
charbuf idname{gs.ts};
|
|
|
|
for (;;) {
|
2021-04-09 00:41:55 +02:00
|
|
|
skip_comments();
|
2021-04-08 23:33:00 +02:00
|
|
|
idname.clear();
|
2021-04-09 00:41:55 +02:00
|
|
|
size_t curline = current_line;
|
|
|
|
bool more = compilearg(*this, VAL_WORD, &idname);
|
2021-04-08 23:33:00 +02:00
|
|
|
if (!more) {
|
|
|
|
goto endstatement;
|
|
|
|
}
|
2021-04-09 00:41:55 +02:00
|
|
|
skip_comments();
|
|
|
|
if (current() == '=') {
|
|
|
|
switch (current(1)) {
|
2021-04-08 23:33:00 +02:00
|
|
|
case '/':
|
2021-04-09 00:41:55 +02:00
|
|
|
if (current(2) != '/') {
|
2021-04-08 23:33:00 +02:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
[[fallthrough]];
|
|
|
|
case ';':
|
|
|
|
case ' ':
|
|
|
|
case '\t':
|
|
|
|
case '\r':
|
|
|
|
case '\n':
|
|
|
|
case '\0':
|
2021-04-09 00:41:55 +02:00
|
|
|
next_char();
|
2021-04-08 23:33:00 +02:00
|
|
|
if (!idname.empty()) {
|
|
|
|
idname.push_back('\0');
|
2021-04-09 00:41:55 +02:00
|
|
|
ident &id = ts.istate->new_ident(
|
|
|
|
*ts.pstate, idname.str_term(), IDENT_FLAG_UNKNOWN
|
2021-04-08 23:33:00 +02:00
|
|
|
);
|
|
|
|
switch (id.get_type()) {
|
|
|
|
case ident_type::ALIAS:
|
2021-04-09 00:41:55 +02:00
|
|
|
more = compilearg(*this, VAL_ANY);
|
2021-04-08 23:33:00 +02:00
|
|
|
if (!more) {
|
2021-04-09 00:41:55 +02:00
|
|
|
gs.gen_val_string();
|
2021-04-08 23:33:00 +02:00
|
|
|
}
|
|
|
|
gs.code.push_back(
|
|
|
|
BC_INST_ALIAS | (id.get_index() << 8)
|
|
|
|
);
|
|
|
|
goto endstatement;
|
|
|
|
case ident_type::IVAR: {
|
2021-04-09 00:41:55 +02:00
|
|
|
auto *hid = ts.istate->cmd_ivar;
|
2021-04-08 23:33:00 +02:00
|
|
|
compile_cmd(
|
2021-04-09 00:41:55 +02:00
|
|
|
*this, static_cast<command_impl *>(hid),
|
2021-04-08 23:33:00 +02:00
|
|
|
id, more, rettype, 1
|
|
|
|
);
|
|
|
|
goto endstatement;
|
|
|
|
}
|
|
|
|
case ident_type::FVAR: {
|
2021-04-09 00:41:55 +02:00
|
|
|
auto *hid = ts.istate->cmd_fvar;
|
2021-04-08 23:33:00 +02:00
|
|
|
compile_cmd(
|
2021-04-09 00:41:55 +02:00
|
|
|
*this, static_cast<command_impl *>(hid),
|
2021-04-08 23:33:00 +02:00
|
|
|
id, more, rettype, 1
|
|
|
|
);
|
|
|
|
goto endstatement;
|
|
|
|
}
|
|
|
|
case ident_type::SVAR: {
|
2021-04-09 00:41:55 +02:00
|
|
|
auto *hid = ts.istate->cmd_svar;
|
2021-04-08 23:33:00 +02:00
|
|
|
compile_cmd(
|
2021-04-09 00:41:55 +02:00
|
|
|
*this, static_cast<command_impl *>(hid),
|
2021-04-08 23:33:00 +02:00
|
|
|
id, more, rettype, 1
|
|
|
|
);
|
|
|
|
goto endstatement;
|
|
|
|
}
|
|
|
|
default:
|
|
|
|
break;
|
|
|
|
}
|
2021-04-09 00:41:55 +02:00
|
|
|
gs.gen_val_string(idname.str_term());
|
2021-04-08 23:33:00 +02:00
|
|
|
}
|
2021-04-09 00:41:55 +02:00
|
|
|
more = compilearg(*this, VAL_ANY);
|
2021-04-08 23:33:00 +02:00
|
|
|
if (!more) {
|
2021-04-09 00:41:55 +02:00
|
|
|
gs.gen_val_string();
|
2021-04-08 23:33:00 +02:00
|
|
|
}
|
|
|
|
gs.code.push_back(BC_INST_ALIAS_U);
|
|
|
|
goto endstatement;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if (idname.empty()) {
|
|
|
|
noid:
|
|
|
|
std::uint32_t numargs = 0;
|
|
|
|
for (;;) {
|
2021-04-09 00:41:55 +02:00
|
|
|
more = compilearg(*this, VAL_ANY);
|
2021-04-08 23:33:00 +02:00
|
|
|
if (!more) {
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
++numargs;
|
|
|
|
}
|
|
|
|
gs.code.push_back(BC_INST_CALL_U | (numargs << 8));
|
|
|
|
} else {
|
|
|
|
idname.push_back('\0');
|
2021-04-09 00:41:55 +02:00
|
|
|
ident *id = ts.pstate->get_ident(idname.str_term());
|
2021-04-08 23:33:00 +02:00
|
|
|
if (!id) {
|
|
|
|
if (is_valid_name(idname.str_term())) {
|
2021-04-09 00:41:55 +02:00
|
|
|
gs.gen_val_string(idname.str_term());
|
2021-04-08 23:33:00 +02:00
|
|
|
goto noid;
|
|
|
|
}
|
|
|
|
switch (rettype) {
|
|
|
|
case VAL_ANY: {
|
|
|
|
std::string_view end = idname.str_term();
|
|
|
|
integer_type val = parse_int(end, &end);
|
|
|
|
if (!end.empty()) {
|
2021-04-09 00:41:55 +02:00
|
|
|
gs.gen_val_string(idname.str_term());
|
2021-04-08 23:33:00 +02:00
|
|
|
} else {
|
2021-04-09 00:41:55 +02:00
|
|
|
gs.gen_val_integer(val);
|
2021-04-08 23:33:00 +02:00
|
|
|
}
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default:
|
2021-04-09 00:41:55 +02:00
|
|
|
gs.gen_val(rettype, idname.str_term(), int(curline));
|
2021-04-08 23:33:00 +02:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
gs.code.push_back(BC_INST_RESULT);
|
|
|
|
} else {
|
|
|
|
switch (ident_p{*id}.impl().p_type) {
|
|
|
|
case ID_ALIAS:
|
|
|
|
compile_alias(
|
2021-04-09 00:41:55 +02:00
|
|
|
*this, static_cast<alias *>(id), more
|
2021-04-08 23:33:00 +02:00
|
|
|
);
|
|
|
|
break;
|
|
|
|
case ID_COMMAND:
|
|
|
|
compile_cmd(
|
2021-04-09 00:41:55 +02:00
|
|
|
*this, static_cast<command_impl *>(id), *id, more,
|
2021-04-08 23:33:00 +02:00
|
|
|
rettype
|
|
|
|
);
|
|
|
|
break;
|
|
|
|
case ID_LOCAL:
|
2021-04-09 00:41:55 +02:00
|
|
|
compile_local(*this, more);
|
2021-04-08 23:33:00 +02:00
|
|
|
break;
|
|
|
|
case ID_DO:
|
2021-04-09 00:41:55 +02:00
|
|
|
compile_do(*this, more, rettype, BC_INST_DO);
|
2021-04-08 23:33:00 +02:00
|
|
|
break;
|
|
|
|
case ID_DOARGS:
|
2021-04-09 00:41:55 +02:00
|
|
|
compile_do(*this, more, rettype, BC_INST_DO_ARGS);
|
2021-04-08 23:33:00 +02:00
|
|
|
break;
|
|
|
|
case ID_IF:
|
2021-04-09 00:41:55 +02:00
|
|
|
compile_if(*this, id, more, rettype);
|
2021-04-08 23:33:00 +02:00
|
|
|
break;
|
|
|
|
case ID_BREAK:
|
|
|
|
gs.code.push_back(BC_INST_BREAK | BC_INST_FLAG_FALSE);
|
|
|
|
break;
|
|
|
|
case ID_CONTINUE:
|
|
|
|
gs.code.push_back(BC_INST_BREAK | BC_INST_FLAG_TRUE);
|
|
|
|
break;
|
|
|
|
case ID_RESULT:
|
|
|
|
if (more) {
|
2021-04-09 00:41:55 +02:00
|
|
|
more = compilearg(*this, VAL_ANY);
|
2021-04-08 23:33:00 +02:00
|
|
|
}
|
|
|
|
gs.code.push_back(
|
|
|
|
(more ? BC_INST_RESULT : BC_INST_NULL) |
|
|
|
|
ret_code(rettype)
|
|
|
|
);
|
|
|
|
break;
|
|
|
|
case ID_NOT:
|
|
|
|
if (more) {
|
2021-04-09 00:41:55 +02:00
|
|
|
more = compilearg(*this, VAL_ANY);
|
2021-04-08 23:33:00 +02:00
|
|
|
}
|
|
|
|
gs.code.push_back(
|
|
|
|
(more ? BC_INST_NOT : BC_INST_TRUE) | ret_code(rettype)
|
|
|
|
);
|
|
|
|
break;
|
|
|
|
case ID_AND:
|
|
|
|
case ID_OR:
|
2021-04-09 00:41:55 +02:00
|
|
|
compile_and_or(*this, id, more, rettype);
|
2021-04-08 23:33:00 +02:00
|
|
|
break;
|
|
|
|
case ID_IVAR: {
|
2021-04-09 00:41:55 +02:00
|
|
|
auto *hid = ts.istate->cmd_ivar;
|
2021-04-08 23:33:00 +02:00
|
|
|
compile_cmd(
|
2021-04-09 00:41:55 +02:00
|
|
|
*this, static_cast<command_impl *>(hid),
|
2021-04-08 23:33:00 +02:00
|
|
|
*id, more, rettype
|
|
|
|
);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case ID_FVAR: {
|
2021-04-09 00:41:55 +02:00
|
|
|
auto *hid = ts.istate->cmd_fvar;
|
2021-04-08 23:33:00 +02:00
|
|
|
compile_cmd(
|
2021-04-09 00:41:55 +02:00
|
|
|
*this, static_cast<command_impl *>(hid),
|
2021-04-08 23:33:00 +02:00
|
|
|
*id, more, rettype
|
|
|
|
);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case ID_SVAR: {
|
2021-04-09 00:41:55 +02:00
|
|
|
auto *hid = ts.istate->cmd_svar;
|
2021-04-08 23:33:00 +02:00
|
|
|
compile_cmd(
|
2021-04-09 00:41:55 +02:00
|
|
|
*this, static_cast<command_impl *>(hid),
|
2021-04-08 23:33:00 +02:00
|
|
|
*id, more, rettype
|
|
|
|
);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
endstatement:
|
|
|
|
if (more) {
|
2021-04-09 00:41:55 +02:00
|
|
|
while (compilearg(*this, VAL_POP));
|
2021-04-08 23:33:00 +02:00
|
|
|
}
|
2021-04-09 00:41:55 +02:00
|
|
|
switch (skip_until(")];/\n")) {
|
2021-04-08 23:33:00 +02:00
|
|
|
case '\0':
|
2021-04-09 00:41:55 +02:00
|
|
|
if (current() != brak) {
|
|
|
|
throw error{*ts.pstate, "missing \"%c\"", char(brak)};
|
2021-04-08 23:33:00 +02:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
return;
|
|
|
|
case ')':
|
|
|
|
case ']':
|
2021-04-09 00:41:55 +02:00
|
|
|
if (current() == brak) {
|
|
|
|
next_char();
|
2021-04-08 23:33:00 +02:00
|
|
|
return;
|
|
|
|
}
|
2021-04-09 00:41:55 +02:00
|
|
|
throw error{*ts.pstate, "unexpected \"%c\"", current()};
|
2021-04-08 23:33:00 +02:00
|
|
|
return;
|
|
|
|
case '/':
|
2021-04-09 00:41:55 +02:00
|
|
|
next_char();
|
|
|
|
if (current() == '/') {
|
|
|
|
skip_until('\n');
|
2021-04-08 23:33:00 +02:00
|
|
|
}
|
|
|
|
goto endstatement;
|
|
|
|
default:
|
2021-04-09 00:41:55 +02:00
|
|
|
next_char();
|
2021-04-08 23:33:00 +02:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
void parser_state::gen_main(std::string_view s, int ret_type) {
|
|
|
|
source = s.data();
|
|
|
|
send = s.data() + s.size();
|
2021-04-09 01:03:29 +02:00
|
|
|
gs.code.reserve(gs.code.size() + 8);
|
2021-04-09 00:41:55 +02:00
|
|
|
gs.code.push_back(BC_INST_START);
|
|
|
|
parse_block(VAL_ANY);
|
|
|
|
gs.code.push_back(BC_INST_EXIT | ((ret_type < VAL_ANY) ? (ret_type << BC_INST_RET) : 0));
|
2021-04-08 23:33:00 +02:00
|
|
|
}
|
|
|
|
|
2021-03-23 02:00:11 +01:00
|
|
|
/* list parser public implementation */
|
2016-09-21 21:02:13 +02:00
|
|
|
|
2021-03-23 23:29:32 +01:00
|
|
|
/* Advance to the next list item.
 *
 * Returns false when the input is exhausted or a stray closing bracket is
 * found. Otherwise the item is recorded through two pointer pairs:
 * p_qbeg/p_qend span the item including its delimiters, p_ibeg/p_iend the
 * item without them (both pairs coincide for plain words). A single ';'
 * following the item is consumed as well.
 */
LIBCUBESCRIPT_EXPORT bool list_parser::parse() {
    skip_until_item();
    if (p_input_beg == p_input_end) {
        return false;
    }
    char const head = *p_input_beg;
    switch (head) {
        case '"': {
            char const *quote = p_input_beg;
            p_input_beg = parse_string(*p_state, get_input());
            p_qbeg = quote;
            p_qend = p_input_beg;
            p_ibeg = quote + 1;
            p_iend = p_input_beg - 1;
            break;
        }
        case '(':
        case '[': {
            char const closer = (head == '(') ? ')' : ']';
            /* characters that need attention while scanning the body */
            constexpr std::string_view special{"\"/;()[]"};
            char const *open = p_input_beg++;
            int depth = 1;
            bool closed = false;
            while (!closed) {
                p_input_beg = std::find_first_of(
                    p_input_beg, p_input_end, special.begin(), special.end()
                );
                if (p_input_beg == p_input_end) {
                    /* input ended before the bracket was closed */
                    return true;
                }
                char const c = *p_input_beg++;
                switch (c) {
                    case '"':
                        /* the quote is needed in str parsing */
                        --p_input_beg;
                        p_input_beg = parse_string(*p_state, get_input());
                        break;
                    case '/':
                        if (
                            (p_input_beg != p_input_end) &&
                            (*p_input_beg == '/')
                        ) {
                            /* line comment: jump to the newline */
                            p_input_beg = std::find(
                                p_input_beg, p_input_end, '\n'
                            );
                        }
                        break;
                    case '(':
                    case '[':
                        /* only brackets of our own kind nest */
                        if (c == head) {
                            ++depth;
                        }
                        break;
                    case ')':
                    case ']':
                        closed = (c == closer) && (--depth <= 0);
                        break;
                }
            }
            p_qbeg = open;
            p_qend = p_input_beg;
            p_ibeg = open + 1;
            p_iend = p_input_beg - 1;
            break;
        }
        case ')':
        case ']':
            return false;
        default: {
            char const *word_end = parse_word(*p_state, get_input());
            p_qbeg = p_input_beg;
            p_ibeg = p_input_beg;
            p_qend = word_end;
            p_iend = word_end;
            p_input_beg = word_end;
            break;
        }
    }
    skip_until_item();
    if ((p_input_beg != p_input_end) && (*p_input_beg == ';')) {
        ++p_input_beg;
    }
    return true;
}
|
|
|
|
|
2021-03-23 23:29:32 +01:00
|
|
|
/* Count the remaining items by calling parse() until it returns false;
 * the parser position is advanced accordingly.
 */
LIBCUBESCRIPT_EXPORT std::size_t list_parser::count() {
    std::size_t nitems = 0;
    for (; parse(); ++nitems) {
        /* parse() does all the work */
    }
    return nitems;
}
|
|
|
|
|
2021-03-23 23:29:32 +01:00
|
|
|
/* Return the current item as a string_ref. Items whose quoted span starts
 * with a double quote are passed through unescape_string() first; all
 * other items are returned as the raw item.
 */
LIBCUBESCRIPT_EXPORT string_ref list_parser::get_item() const {
    bool const quoted = (p_qbeg != p_qend) && (*p_qbeg == '"');
    if (!quoted) {
        return string_ref{*p_state, get_raw_item()};
    }
    charbuf unescaped{*p_state};
    unescape_string(std::back_inserter(unescaped), get_raw_item());
    return string_ref{*p_state, unescaped.str()};
}
|
|
|
|
|
2021-03-23 23:29:32 +01:00
|
|
|
/* Move p_input_beg past whitespace (space, tab, CR, LF) and `//` line
 * comments, stopping at the first other character or at the end of input.
 */
LIBCUBESCRIPT_EXPORT void list_parser::skip_until_item() {
    auto is_blank = [](char c) {
        switch (c) {
            case ' ':
            case '\t':
            case '\r':
            case '\n':
                return true;
            default:
                return false;
        }
    };
    for (;;) {
        while ((p_input_beg != p_input_end) && is_blank(*p_input_beg)) {
            ++p_input_beg;
        }
        bool const at_comment =
            ((p_input_end - p_input_beg) >= 2) &&
            (p_input_beg[0] == '/') && (p_input_beg[1] == '/');
        if (!at_comment) {
            return;
        }
        /* skip the comment; the newline is consumed on the next pass */
        p_input_beg = std::find(p_input_beg, p_input_end, '\n');
    }
}
|
2016-09-21 21:02:13 +02:00
|
|
|
|
2021-03-23 23:32:25 +01:00
|
|
|
} /* namespace cubescript */
|