/* String for OctaSTD. * * This file is part of OctaSTD. See COPYING.md for futher information. */ #ifndef OSTD_STRING_HH #define OSTD_STRING_HH #include #include #include "ostd/utility.hh" #include "ostd/range.hh" #include "ostd/vector.hh" #include "ostd/functional.hh" #include "ostd/type_traits.hh" namespace ostd { static constexpr Size npos = -1; template> class StringBase; template struct CharRangeBase: InputRange< CharRangeBase, FiniteRandomAccessRangeTag, T > { private: struct Nat {}; public: CharRangeBase(): p_beg(nullptr), p_end(nullptr) {}; CharRangeBase(T *beg, T *end): p_beg(beg), p_end(end) {} CharRangeBase(T *beg, Size n): p_beg(beg), p_end(beg + n) {} /* TODO: traits for utf-16/utf-32 string lengths, for now assume char */ template CharRangeBase(U beg, EnableIf< IsConvertible::value && !IsArray::value, Nat > = Nat()): p_beg(beg), p_end((T *)beg + strlen(beg)) {} template CharRangeBase(U (&beg)[N], EnableIf< IsConvertible::value, Nat > = Nat()): p_beg(beg), p_end(beg + N - (beg[N - 1] == '\0')) {} template CharRangeBase(const StringBase &s, EnableIf< IsConvertible::value, Nat > = Nat()): p_beg(s.data()), p_end(s.data() + s.size()) {} template::value >> CharRangeBase(const CharRangeBase &v): p_beg(&v[0]), p_end(&v[v.size()]) {} CharRangeBase &operator=(const CharRangeBase &v) { p_beg = v.p_beg; p_end = v.p_end; return *this; } template CharRangeBase &operator=(const StringBase &s) { p_beg = s.data(); p_end = s.data() + s.size(); return *this; } /* TODO: traits for utf-16/utf-32 string lengths, for now assume char */ CharRangeBase &operator=(T *s) { p_beg = s; p_end = s + strlen(s); return *this; } bool empty() const { return p_beg == p_end; } bool pop_front() { if (p_beg == p_end) return false; ++p_beg; return true; } bool push_front() { --p_beg; return true; } Size pop_front_n(Size n) { Size olen = p_end - p_beg; p_beg += n; if (p_beg > p_end) { p_beg = p_end; return olen; } return n; } Size push_front_n(Size n) { p_beg -= n; return true; } T &front() const { return *p_beg; } bool equals_front(const CharRangeBase &range) const { return p_beg == range.p_beg; } Ptrdiff distance_front(const CharRangeBase &range) const { return range.p_beg - p_beg; } bool pop_back() { if (p_end == p_beg) return false; --p_end; return true; } bool push_back() { ++p_end; return true; } Size pop_back_n(Size n) { Size olen = p_end - p_beg; p_end -= n; if (p_end < p_beg) { p_end = p_beg; return olen; } return n; } Size push_back_n(Size n) { p_end += n; return true; } T &back() const { return *(p_end - 1); } bool equals_back(const CharRangeBase &range) const { return p_end == range.p_end; } Ptrdiff distance_back(const CharRangeBase &range) const { return range.p_end - p_end; } Size size() const { return p_end - p_beg; } CharRangeBase slice(Size start, Size end) const { return CharRangeBase(p_beg + start, p_beg + end); } T &operator[](Size i) const { return p_beg[i]; } bool put(T v) { if (empty()) return false; *(p_beg++) = v; return true; } /* non-range methods */ T *data() { return p_beg; } const T *data() const { return p_beg; } Size to_hash() const { return detail::mem_hash(data(), size()); } private: T *p_beg, *p_end; }; template class StringBase { using StrPair = detail::CompressedPair, A>; ostd::Size p_len, p_cap; StrPair p_buf; template void ctor_from_range(R &range, EnableIf< IsFiniteRandomAccessRange::value && IsSame>>::value, bool > = true) { if (range.empty()) return; RangeSize l = range.size(); reserve(l); p_len = l; range.copy(p_buf.first(), l); p_buf.first()[l] = '\0'; } template void ctor_from_range(R &range, EnableIf< !IsFiniteRandomAccessRange::value || !IsSame>>::value, bool > = true) { if (range.empty()) return; Size i = 0; for (; !range.empty(); range.pop_front()) { reserve(i + 1); allocator_construct(p_buf.second(), &p_buf.first()[i], range.front()); ++i; p_len = i; } p_buf.first()[p_len] = '\0'; } public: using Size = ostd::Size; using Difference = Ptrdiff; using Value = T; using Reference = T &; using ConstReference = const T &; using Pointer = AllocatorPointer; using ConstPointer = AllocatorConstPointer; using Range = CharRangeBase; using ConstRange = CharRangeBase; using Allocator = A; StringBase(const A &a = A()): p_len(0), p_cap(0), p_buf((Pointer)&p_len, a) {} explicit StringBase(Size n, T val = T(), const A &al = A()): StringBase(al) { if (!n) return; p_buf.first() = allocator_allocate(p_buf.second(), n + 1); p_len = p_cap = n; Pointer cur = p_buf.first(), last = p_buf.first() + n; while (cur != last) *cur++ = val; *cur = '\0'; } StringBase(const StringBase &s): p_len(0), p_cap(0), p_buf((Pointer)&p_len, allocator_container_copy(s.p_buf.second())) { if (!s.p_len) return; reserve(s.p_len); p_len = s.p_len; memcpy(p_buf.first(), s.p_buf.first(), (p_len + 1) * sizeof(T)); } StringBase(const StringBase &s, const A &a): p_len(0), p_cap(0), p_buf((Pointer)&p_len, a) { if (!s.p_len) return; reserve(s.p_len); p_len = s.p_len; memcpy(p_buf.first(), s.p_buf.first(), (p_len + 1) * sizeof(T)); } StringBase(StringBase &&s): p_len(s.p_len), p_cap(s.p_cap), p_buf(s.p_buf.first(), move(s.p_buf.second())) { s.p_len = s.p_cap = 0; s.p_buf.first() = (Pointer)&s.p_len; } StringBase(StringBase &&s, const A &a): p_len(0), p_cap(0), p_buf((Pointer)&p_len, a) { if (!s.p_len) return; if (a != s.p_buf.second()) { reserve(s.p_cap); p_len = s.p_len; memcpy(p_buf.first(), s.p_buf.first(), (p_len + 1) * sizeof(T)); return; } p_buf.first() = s.p_buf.first(); p_len = s.p_len; p_cap = s.p_cap; s.p_len = s.p_cap = 0; s.p_buf.first() = &s.p_cap; } StringBase(const StringBase &s, Size pos, Size len = npos, const A &a = A()): StringBase(a) { Size end = (len == npos) ? s.size() : (pos + len); Size nch = (end - pos); reserve(nch); memcpy(p_buf.first(), s.p_buf.first() + pos, nch); p_len += nch; p_buf.first()[p_len] = '\0'; } /* TODO: traits for utf-16/utf-32 string lengths, for now assume char */ StringBase(ConstRange v, const A &a = A()): StringBase(a) { if (!v.size()) return; reserve(v.size()); memcpy(p_buf.first(), &v[0], v.size()); p_buf.first()[v.size()] = '\0'; p_len = v.size(); } template StringBase(U v, const EnableIf< IsConvertible::value && !IsArray::value, A > &a = A()): StringBase(ConstRange(v), a) {} template StringBase(U (&v)[N], const EnableIf< IsConvertible::value, A > &a = A()): StringBase(ConstRange(v), a) {} template::value && IsConvertible, Value>::value >> StringBase(R range, const A &a = A()): StringBase(a) { ctor_from_range(range); } ~StringBase() { allocator_deallocate(p_buf.second(), p_buf.first(), p_cap + 1); } void clear() { p_len = 0; *p_buf.first() = '\0'; } StringBase &operator=(const StringBase &v) { if (this == &v) return *this; clear(); if (AllocatorPropagateOnContainerCopyAssignment::value) { if ((p_buf.second() != v.p_buf.second()) && p_cap) { allocator_deallocate(p_buf.second(), p_buf.first(), p_cap); p_cap = 0; p_buf.first() = &p_len; } p_buf.second() = v.p_buf.second(); } reserve(v.p_cap); p_len = v.p_len; if (p_len) { memcpy(p_buf.first(), v.p_buf.first(), p_len); p_buf.first()[p_len] = '\0'; } else p_buf.first() = &p_len; return *this; } StringBase &operator=(StringBase &&v) { clear(); if (p_cap) allocator_deallocate(p_buf.second(), p_buf.first(), p_cap); if (AllocatorPropagateOnContainerMoveAssignment::value) p_buf.second() = v.p_buf.second(); p_len = v.p_len; p_cap = v.p_cap; p_buf.~StrPair(); new (&p_buf) StrPair(v.disown(), move(v.p_buf.second())); if (!p_cap) p_buf.first() = (Pointer)&p_len; return *this; } StringBase &operator=(ConstRange v) { reserve(v.size()); if (v.size()) memcpy(p_buf.first(), &v[0], v.size()); p_buf.first()[v.size()] = '\0'; p_len = v.size(); return *this; } template::value && IsConvertible, Value>::value >> StringBase &operator=(const R &r) { clear(); ctor_from_range(r); return *this; } void resize(Size n, T v = T()) { if (!n) { clear(); return; } Size l = p_len; reserve(n); p_len = n; for (Size i = l; i < p_len; ++i) { p_buf.first()[i] = T(v); } p_buf.first()[l] = '\0'; } void reserve(Size n) { if (n <= p_cap) return; Size oc = p_cap; if (!oc) { p_cap = max(n, Size(8)); } else { while (p_cap < n) p_cap *= 2; } Pointer tmp = allocator_allocate(p_buf.second(), p_cap + 1); if (oc > 0) { memcpy(tmp, p_buf.first(), (p_len + 1) * sizeof(T)); allocator_deallocate(p_buf.second(), p_buf.first(), oc + 1); } tmp[p_len] = '\0'; p_buf.first() = tmp; } T &operator[](Size i) { return p_buf[i]; } const T &operator[](Size i) const { return p_buf[i]; } T &at(Size i) { return p_buf[i]; } const T &at(Size i) const { return p_buf[i]; } T &front() { return p_buf[0]; } const T &front() const { return p_buf[0]; }; T &back() { return p_buf[size() - 1]; } const T &back() const { return p_buf[size() - 1]; } Value *data() { return p_buf.first(); } const Value *data() const { return p_buf.first(); } Size size() const { return p_len; } Size capacity() const { return p_cap; } Size length() const { /* TODO: unicode */ return size(); } bool empty() const { return (size() == 0); } Value *disown() { Pointer r = p_buf.first(); p_buf.first() = nullptr; p_len = p_cap = 0; return (Value *)r; } void push(T v) { reserve(p_len + 1); p_buf.first()[p_len++] = v; p_buf.first()[p_len] = '\0'; } StringBase &append(const StringBase &s) { reserve(p_len + s.p_len); if (!s.p_len) return *this; memcpy(p_buf.first() + p_len, s.p_buf.first(), s.p_len); p_len += s.p_len; p_buf.first()[p_len] = '\0'; return *this; } StringBase &append(const StringBase &s, Size idx, Size len) { if (!s.p_len) return; Size end = (len == npos) ? s.size() : (idx + len); Size nch = (end - idx); if (!nch) return; reserve(p_len + nch); memcpy(p_buf.first() + p_len, s.p_buf.first() + idx, nch); p_len += nch; p_buf.first()[p_len] = '\0'; return *this; } StringBase &append(const Value *s) { Size len = strlen(s); reserve(p_len + len); if (!len) return *this; memcpy(p_buf.first() + p_len, s, len); p_len += len; p_buf.first()[p_len] = '\0'; return *this; } StringBase &append(Size n, T c) { if (!n) return; reserve(p_len + n); for (Size i = 0; i < n; ++n) p_buf.first()[p_len + i] = c; p_len += n; p_buf.first()[p_len] = '\0'; return *this; } template StringBase &append_range(R range) { Size nadd = 0; for (; !range.empty(); range.pop_front()) { reserve(p_len + nadd + 1); p_buf.first()[p_len + nadd++] = range.front(); } p_len += nadd; p_buf.first()[p_len] = '\0'; return *this; } StringBase &operator+=(const StringBase &s) { return append(s); } StringBase &operator+=(const Value *s) { return append(s); } StringBase &operator+=(T c) { reserve(p_len + 1); p_buf.first()[p_len++] = c; p_buf.first()[p_len] = '\0'; return *this; } int compare(const StringBase &s) const { return strcmp(p_buf.first(), s.data()); } int compare(const Value *p) const { return strcmp(p_buf.first(), p); } Range iter() { return Range(p_buf.first(), size()); } ConstRange iter() const { return ConstRange(p_buf.first(), size()); } ConstRange citer() const { return ConstRange(p_buf.dfirst(), size()); } Range iter_cap() { return Range(p_buf.first(), capacity()); } void swap(StringBase &v) { detail::swap_adl(p_len, v.p_len); detail::swap_adl(p_cap, v.p_cap); detail::swap_adl(p_buf.first(), v.p_buf.first()); if (AllocatorPropagateOnContainerSwap::value) detail::swap_adl(p_buf.second(), v.p_buf.second()); } Size to_hash() const { return iter().to_hash(); } A get_allocator() const { return p_buf.second(); } }; using String = StringBase; using CharRange = CharRangeBase; using ConstCharRange = CharRangeBase; template using AnyString = StringBase; template inline bool operator==(const StringBase &lhs, const StringBase &rhs) { return !lhs.compare(rhs); } template inline bool operator==(const StringBase &lhs, const char *rhs) { return !lhs.compare(rhs); } template inline bool operator==(const char *lhs, const StringBase &rhs) { return !rhs.compare(lhs); } template inline bool operator!=(const StringBase &lhs, const StringBase &rhs) { return !(lhs == rhs); } template inline bool operator!=(const StringBase &lhs, const char *rhs) { return !(lhs == rhs); } template inline bool operator!=(const char *lhs, const StringBase &rhs) { return !(rhs == lhs); } template inline bool operator<(const StringBase &lhs, const StringBase &rhs) { return lhs.compare(rhs) < 0; } template inline bool operator<(const StringBase &lhs, const char *rhs) { return lhs.compare(rhs) < 0; } template inline bool operator<(const char *lhs, const StringBase &rhs) { return rhs.compare(lhs) > 0; } template inline bool operator>(const StringBase &lhs, const StringBase &rhs) { return rhs < lhs; } template inline bool operator>(const StringBase &lhs, const char *rhs) { return rhs < lhs; } template inline bool operator>(const char *lhs, const StringBase &rhs) { return rhs < lhs; } template inline bool operator<=(const StringBase &lhs, const StringBase &rhs) { return !(rhs < lhs); } template inline bool operator<=(const StringBase &lhs, const char *rhs) { return !(rhs < lhs); } template inline bool operator<=(const char *lhs, const StringBase &rhs) { return !(rhs < lhs); } template inline bool operator>=(const StringBase &lhs, const StringBase &rhs) { return !(lhs < rhs); } template inline bool operator>=(const StringBase &lhs, const char *rhs) { return !(lhs < rhs); } template inline bool operator>=(const char *lhs, const StringBase &rhs) { return !(lhs < rhs); } /* string literals */ inline namespace literals { inline namespace string_literals { String operator "" _s(const char *str, Size len) { return String(ConstCharRange(str, len)); } ConstCharRange operator "" _S(const char *str, Size len) { return ConstCharRange(str, len); } } } template AnyString concat(AllocatorArg, const A &alloc, const T &v, ConstCharRange sep, F func) { AnyString ret(alloc); auto range = ostd::iter(v); if (range.empty()) return ret; for (;;) { ret += func(range.front()); range.pop_front(); if (range.empty()) break; ret += sep; } return ret; } template AnyString concat(AllocatorArg, const A &alloc, const T &v, ConstCharRange sep = " ") { AnyString ret(alloc); auto range = ostd::iter(v); if (range.empty()) return ret; for (;;) { ret += range.front(); range.pop_front(); if (range.empty()) break; ret += sep; } return ret; } template String concat(const T &v, ConstCharRange sep, F func) { return concat(allocator_arg, typename String::Allocator(), v, sep, func); } template String concat(const T &v, ConstCharRange sep = " ") { return concat(allocator_arg, typename String::Allocator(), v, sep); } template AnyString concat(AllocatorArg, const A &alloc, std::initializer_list v, ConstCharRange sep, F func) { return concat(allocator_arg, alloc, ostd::iter(v), sep, func); } template AnyString concat(AllocatorArg, const A &alloc, std::initializer_list v, ConstCharRange sep = " ") { return concat(allocator_arg, alloc, ostd::iter(v), sep); } template String concat(std::initializer_list v, ConstCharRange sep, F func) { return concat(ostd::iter(v), sep, func); } template String concat(std::initializer_list v, ConstCharRange sep = " ") { return concat(ostd::iter(v), sep); } namespace detail { template auto test_tostring(int) -> decltype(IsSame().to_string()), String>()); template False test_tostring(...); template using ToStringTest = decltype(test_tostring(0)); template True test_iterable(decltype(ostd::iter(declval())) *); template static False test_iterable(...); template using IterableTest = decltype(test_iterable(0)); } template struct ToString; template struct ToString::value>> { using Argument = RemoveCv>; using Result = String; String operator()(const T &v) const { String ret("{"); ret += concat(ostd::iter(v), ", ", ToString< RemoveConst >> >()); ret += "}"; return ret; } }; template struct ToString::value>> { using Argument = RemoveCv>; using Result = String; String operator()(const T &v) const { return v.to_string(); } }; namespace detail { template void str_printf(String &s, const char *fmt, T v) { char buf[256]; int n = snprintf(buf, sizeof(buf), fmt, v); s.clear(); s.reserve(n); if (n >= (int)sizeof(buf)) snprintf(s.data(), n + 1, fmt, v); else if (n > 0) memcpy(s.data(), buf, n + 1); else { s.clear(); } *((Size *)&s) = n; } } template<> struct ToString { using Argument = bool; using Result = String; String operator()(bool b) { return b ? "true" : "false"; } }; template<> struct ToString { using Argument = char; using Result = String; String operator()(char c) { String ret; ret.push(c); return ret; } }; #define OSTD_TOSTR_NUM(T, fmt) \ template<> struct ToString { \ using Argument = T; \ using Result = String; \ String operator()(T v) { \ String ret; \ detail::str_printf(ret, fmt, v); \ return ret; \ } \ }; OSTD_TOSTR_NUM(sbyte, "%d") OSTD_TOSTR_NUM(int, "%d") OSTD_TOSTR_NUM(int &, "%d") OSTD_TOSTR_NUM(long, "%ld") OSTD_TOSTR_NUM(float, "%f") OSTD_TOSTR_NUM(double, "%f") OSTD_TOSTR_NUM(byte, "%u") OSTD_TOSTR_NUM(uint, "%u") OSTD_TOSTR_NUM(ulong, "%lu") OSTD_TOSTR_NUM(llong, "%lld") OSTD_TOSTR_NUM(ullong, "%llu") OSTD_TOSTR_NUM(ldouble, "%Lf") #undef OSTD_TOSTR_NUM template struct ToString { using Argument = T *; using Result = String; String operator()(Argument v) { String ret; detail::str_printf(ret, "%p", v); return ret; } }; template<> struct ToString { using Argument = const char *; using Result = String; String operator()(const char *s) { return String(s); } }; template<> struct ToString { using Argument = char *; using Result = String; String operator()(char *s) { return String(s); } }; template<> struct ToString { using Argument = String; using Result = String; String operator()(const Argument &s) { return s; } }; template<> struct ToString { using Argument = CharRange; using Result = String; String operator()(const Argument &s) { return String(s); } }; template<> struct ToString { using Argument = ConstCharRange; using Result = String; String operator()(const Argument &s) { return String(s); } }; template struct ToString> { using Argument = Pair; using Result = String; String operator()(const Argument &v) { String ret("{"); ret += ToString>>()(v.first); ret += ", "; ret += ToString>>()(v.second); ret += "}"; return ret; } }; template typename ToString::Result to_string(const T &v) { return ToString>>()(v); } template String to_string(std::initializer_list init) { return to_string(iter(init)); } } /* namespace ostd */ #endif