#include #include "cs_util.hh" #include "cs_vm.hh" #include #include namespace cscript { static inline void p_skip_white(ostd::string_range &v) { while (!v.empty() && isspace(*v)) { ++v; } } static inline void p_set_end( const ostd::string_range &v, ostd::string_range *end ) { if (!end) { return; } *end = v; } /* this function assumes the input is definitely a hex digit */ static inline cs_int p_hexd_to_int(char c) { if (c >= 97) { /* a-f */ return (c - 'a') + 10; } else if (c >= 65) { /* A-F */ return (c - 'A') + 10; } /* 0-9 */ return c - '0'; } static inline bool p_check_neg(ostd::string_range &input) { bool neg = (*input == '-'); if (neg || (*input == '+')) { ++input; } return neg; } cs_int cs_parse_int(ostd::string_range input, ostd::string_range *end) { ostd::string_range orig = input; p_skip_white(input); if (input.empty()) { p_set_end(orig, end); return cs_int(0); } bool neg = p_check_neg(input); cs_int ret = 0; ostd::string_range past = input; if (input.size() >= 2) { ostd::string_range pfx = input.slice(0, 2); if ((pfx == "0x") || (pfx == "0X")) { input = input.slice(2, input.size()); past = input; while (!past.empty() && isxdigit(*past)) { ret = ret * 16 + p_hexd_to_int(*past); ++past; } goto done; } else if ((pfx == "0b") || (pfx == "0B")) { input = input.slice(2, input.size()); past = input; while (!past.empty() && ((*past == '0') || (*past == '1'))) { ret = ret * 2 + (*past - '0'); ++past; } goto done; } } while (!past.empty() && isdigit(*past)) { ret = ret * 10 + (*past - '0'); ++past; } done: if (&past[0] == &input[0]) { p_set_end(orig, end); } else { p_set_end(past, end); } if (neg) { return -ret; } return ret; } template static inline bool p_read_exp(ostd::string_range &input, cs_int &fn) { if (input.empty()) { return true; } if ((*input != e1) && (*input != e2)) { return true; } ++input; if (input.empty()) { return false; } bool neg = p_check_neg(input); if (input.empty() || !isdigit(*input)) { return false; } cs_int exp = 0; while (!input.empty() && isdigit(*input)) { exp = exp * 10 + (*input - '0'); ++input; } if (neg) { exp = -exp; } fn += exp; return true; } template static inline bool parse_gen_float( ostd::string_range input, ostd::string_range *end, cs_float &ret ) { auto read_digits = [&input](double r, cs_int &n) { while (!input.empty() && (Hex ? isxdigit(*input) : isdigit(*input))) { if (Hex) { r = r * 16.0 + double(p_hexd_to_int(*input)); } else { r = r * 10.0 + double(*input - '0'); } ++n; ++input; } return r; }; cs_int wn = 0, fn = 0; double r = read_digits(0.0, wn); if (!input.empty() && (*input == '.')) { ++input; r = read_digits(r, fn); } if (!wn && !fn) { return false; } fn = -fn; p_set_end(input, end); /* we have a valid number until here */ if (p_read_exp(input, fn)) { p_set_end(input, end); } if (Hex) { ret = cs_float(ldexp(r, fn * 4)); } else { ret = cs_float(r * pow(10, fn)); } return true; } cs_float cs_parse_float(ostd::string_range input, ostd::string_range *end) { ostd::string_range orig = input; p_skip_white(input); if (input.empty()) { p_set_end(orig, end); return cs_float(0); } bool neg = p_check_neg(input); cs_float ret = cs_float(0); if (input.size() >= 2) { ostd::string_range pfx = input.slice(0, 2); if ((pfx == "0x") || (pfx == "0X")) { input = input.slice(2, input.size()); if (!parse_gen_float(input, end, ret)) { p_set_end(orig, end); return ret; } goto done; } } if (!parse_gen_float(input, end, ret)) { p_set_end(orig, end); return ret; } done: if (neg) { return -ret; } return ret; } /* string manager */ inline cs_strref_state *get_ref_state(char const *ptr) { return const_cast( reinterpret_cast(ptr) ) - 1; } char const *cs_strman::add(ostd::string_range str) { auto it = counts.find(str); /* already present: just increment ref */ if (it != counts.end()) { auto *st = it->second; /* having a null pointer is the same as non-existence */ if (st) { ++st->refcount; return reinterpret_cast(st + 1); } } /* not present: allocate brand new data */ auto ss = str.size(); auto strp = alloc_buf(ss); /* write string data, it's already pre-terminated */ memcpy(strp, str.data(), ss); /* store it */ counts.emplace(ostd::string_range{strp, strp + ss}, get_ref_state(strp)); return strp; } char const *cs_strman::ref(char const *ptr) { auto *ss = get_ref_state(ptr); ++ss->refcount; return ptr; } char const *cs_strman::steal(char *ptr) { auto *ss = get_ref_state(ptr); auto sr = ostd::string_range{ptr, ptr + ss->length}; /* much like add(), but we already have memory */ auto it = counts.find(sr); if (it != counts.end()) { auto *st = it->second; if (st) { ++st->refcount; /* the buffer is superfluous now */ cstate->alloc(ss, ss->length + sizeof(cs_strref_state) + 1, 0); return reinterpret_cast(st + 1); } } ss->refcount = 1; counts.emplace(sr, ss); return ptr; } void cs_strman::unref(char const *ptr) { auto *ss = get_ref_state(ptr); if (!--ss->refcount) { /* refcount zero, so ditch it * this path is a little slow... */ auto sr = ostd::string_range{ptr, ptr + ss->length}; auto it = counts.find(sr); if (it == counts.end()) { /* internal error: this should *never* happen */ throw cs_internal_error{"no refcount"}; } /* we're freeing the key */ counts.erase(it); /* dealloc */ cstate->alloc(ss, ss->length + sizeof(cs_strref_state) + 1, 0); } } char const *cs_strman::find(ostd::string_range str) const { auto it = counts.find(str); if (it == counts.end()) { return nullptr; } return reinterpret_cast(it->second + 1); } ostd::string_range cs_strman::get(char const *ptr) const { auto *ss = get_ref_state(ptr); return ostd::string_range{ptr, ptr + ss->length}; } char *cs_strman::alloc_buf(std::size_t len) const { auto mem = cstate->alloc(nullptr, 0, len + sizeof(cs_strref_state) + 1); if (!mem) { throw cs_internal_error{"allocation failed"}; } /* write length and initial refcount */ auto *sst = static_cast(mem); sst->length = len; sst->refcount = 1; /* pre-terminate */ auto *strp = reinterpret_cast(sst + 1); strp[len] = '\0'; /* now the user can fill it */ return strp; }; /* strref */ cs_strref::cs_strref(cs_shared_state &cs, ostd::string_range str): p_state{&cs} { p_str = cs.strman->add(str); } cs_strref::cs_strref(cs_state &cs, ostd::string_range str): p_state{cs.p_state} { p_str = p_state->strman->add(str); } cs_strref::cs_strref(cs_strref const &ref): p_state{ref.p_state}, p_str{ref.p_str} { p_state->strman->ref(p_str); } /* this can be used by friends to do quick cs_strref creation */ cs_strref::cs_strref(char const *p, cs_shared_state &cs): p_state{&cs} { p_str = p_state->strman->ref(p); } cs_strref::~cs_strref() { p_state->strman->unref(p_str); } cs_strref &cs_strref::operator=(cs_strref const &ref) { p_str = ref.p_str; p_state = ref.p_state; p_state->strman->ref(p_str); return *this; } cs_strref::operator ostd::string_range() const { return p_state->strman->get(p_str); } bool cs_strref::operator==(cs_strref const &s) const { return p_str == s.p_str; } namespace util { OSTD_EXPORT ostd::string_range parse_string( cs_state &cs, ostd::string_range str, size_t &nlines ) { size_t nl = 0; nlines = nl; if (str.empty() || (*str != '\"')) { return str; } ostd::string_range orig = str; ++str; ++nl; while (!str.empty()) { switch (*str) { case '\r': case '\n': case '\"': goto end; case '^': case '\\': { bool needn = (*str == '\\'); ++str; if (str.empty()) { goto end; } if ((*str == '\r') || (*str == '\n')) { char c = *str; ++str; ++nl; if (!str.empty() && (c == '\r') && (*str == '\n')) { ++str; } } else if (needn) { goto end; } else { ++str; } continue; } } ++str; } end: nlines = nl; if (str.empty() || (*str != '\"')) { throw cs_error( cs, "unfinished string '%s'", orig.slice(0, &str[0] - &orig[0]) ); } str.pop_front(); return str; } OSTD_EXPORT ostd::string_range parse_word( cs_state &cs, ostd::string_range str ) { for (;;) { str = ostd::find_one_of(str, ostd::string_range("\"/;()[] \t\r\n")); if (str.empty()) { return str; } switch (*str) { case '"': case ';': case ' ': case '\t': case '\r': case '\n': return str; case '/': if ((str.size() > 1) && (str[1] == '/')) { return str; } break; case '[': str.pop_front(); str = parse_word(cs, str); if (str.empty() || (*str != ']')) { throw cs_error(cs, "missing \"]\""); } break; case '(': str.pop_front(); str = parse_word(cs, str); if (str.empty() || (*str != ')')) { throw cs_error(cs, "missing \")\""); } break; case ']': case ')': return str; } ++str; } return str; } } /* namespace util */ OSTD_EXPORT bool list_parse(cs_list_parse_state &ps, cs_state &cs) { list_find_item(ps); if (ps.input.empty()) { return false; } switch (*ps.input) { case '"': ps.quoted_item = ps.input; ps.input = util::parse_string(cs, ps.input); ps.quoted_item = ps.quoted_item.slice( 0, &ps.input[0] - &ps.quoted_item[0] ); ps.item = ps.quoted_item.slice(1, ps.quoted_item.size() - 1); break; case '(': case '[': { ps.quoted_item = ps.input; ++ps.input; ps.item = ps.input; char btype = *ps.quoted_item; int brak = 1; for (;;) { ps.input = ostd::find_one_of( ps.input, ostd::string_range("\"/;()[]") ); if (ps.input.empty()) { return true; } char c = *ps.input; ++ps.input; switch (c) { case '"': ps.input = util::parse_string(cs, ps.input); break; case '/': if (!ps.input.empty() && (*ps.input == '/')) { ps.input = ostd::find(ps.input, '\n'); } break; case '(': case '[': brak += (c == btype); break; case ')': if ((btype == '(') && (--brak <= 0)) { goto endblock; } break; case ']': if ((btype == '[') && (--brak <= 0)) { goto endblock; } break; } } endblock: ps.item = ps.item.slice(0, &ps.input[0] - &ps.item[0]); ps.item.pop_back(); ps.quoted_item = ps.quoted_item.slice( 0, &ps.input[0] - &ps.quoted_item[0] ); break; } case ')': case ']': return false; default: { ostd::string_range e = util::parse_word(cs, ps.input); ps.quoted_item = ps.item = ps.input.slice(0, &e[0] - &ps.input[0]); ps.input = e; break; } } list_find_item(ps); if (!ps.input.empty() && (*ps.input == ';')) { ++ps.input; } return true; } OSTD_EXPORT std::size_t list_count(cs_list_parse_state &ps, cs_state &cs) { size_t ret = 0; while (list_parse(ps, cs)) { ++ret; } return ret; } OSTD_EXPORT cs_strref list_get_item(cs_list_parse_state &ps, cs_state &cs) { if (!ps.quoted_item.empty() && (*ps.quoted_item == '"')) { auto app = ostd::appender(); util::unescape_string(app, ps.item); return cs_strref{cs, app.get()}; } return cs_strref{cs, ps.item}; } OSTD_EXPORT void list_find_item(cs_list_parse_state &ps) { for (;;) { while (!ps.input.empty()) { char c = *ps.input; if ((c == ' ') || (c == '\t') || (c == '\r') || (c == '\n')) { ++ps.input; } else { break; } } if ((ps.input.size() < 2) || (ps.input[0] != '/') || (ps.input[1] != '/')) { break; } ps.input = ostd::find(ps.input, '\n'); } } OSTD_EXPORT cs_strref value_list_concat( cs_state &cs, cs_value_r vals, ostd::string_range sep ) { auto app = ostd::appender(); for (std::size_t i = 0; i < vals.size(); ++i) { switch (vals[i].get_type()) { case cs_value_type::INT: case cs_value_type::FLOAT: case cs_value_type::STRING: { cs_value v{vals[i]}; ostd::range_put_all(app, cs_value{vals[i]}.force_str()); break; } default: break; } if (i == (vals.size() - 1)) { break; } ostd::range_put_all(app, sep); } return cs_strref{cs, ostd::iter(app.get())}; } } /* namespace cscript */