// Matrix Construct // // Copyright (C) Matrix Construct Developers, Authors & Contributors // Copyright (C) 2016-2018 Jason Volk // // Permission to use, copy, modify, and/or distribute this software for any // purpose with or without fee is hereby granted, provided that the above // copyright notice and this permission notice is present in all copies. The // full license for this software is available in the LICENSE file. #include namespace ircd::fmt { using namespace ircd::spirit; struct spec; struct specifier; constexpr char SPECIFIER { '%' }; constexpr char SPECIFIER_TERMINATOR { '$' }; struct parser extern const parser; extern std::map> specifiers; bool is_specifier(const string_view &name); void handle_specifier(mutable_buffer &out, const uint &idx, const spec &, const arg &); template bool generate_string(char *&out, const generator &gen, const arg &val); template bool visit_type(const arg &val, lambda&& closure); } /// Structural representation of a format specifier. The parse of each /// specifier in the format string creates one of these. struct ircd::fmt::spec { char sign {'+'}; ushort width {0}; ushort precision {0}; string_view name; spec() = default; }; /// Reflects the fmt::spec struct to allow the spirit::qi grammar to directly /// fill in the spec struct. BOOST_FUSION_ADAPT_STRUCT ( ircd::fmt::spec, ( decltype(ircd::fmt::spec::sign), sign ) ( decltype(ircd::fmt::spec::width), width ) ( decltype(ircd::fmt::spec::precision), precision ) ( decltype(ircd::fmt::spec::name), name ) ) /// A format specifier handler module. This allows a new "%foo" to be defined /// with custom handling by overriding. This abstraction is inserted into a /// mapping key'ed by the supplied names leading to an instance of this. /// class ircd::fmt::specifier { std::set names; public: virtual bool operator()(char *&out, const size_t &max, const spec &, const arg &) const = 0; specifier(const std::initializer_list &names); specifier(const std::string &name); virtual ~specifier() noexcept; }; /// Linkage for the lookup mapping of registered format specifiers. decltype(ircd::fmt::specifiers) ircd::fmt::specifiers; /// The format string parser grammar. struct ircd::fmt::parser :qi::grammar { template using rule = qi::rule; const rule<> specsym { lit(SPECIFIER) ,"format specifier" }; const rule<> specterm { lit(SPECIFIER_TERMINATOR) ,"specifier termination" }; const rule name { raw[repeat(1,14)[char_("A-Za-z")]] ,"specifier name" }; rule spec; parser() :parser::base_type{spec} { static const auto is_valid([] (const auto &str, auto &, auto &valid) { valid = is_specifier(str); }); spec %= specsym >> -(char_('+') | char_('-')) >> -ushort_ >> -(lit('.') >> ushort_) >> name[is_valid] >> -specterm; } } const ircd::fmt::parser; namespace ircd { namespace fmt { struct string_specifier :specifier { static const std::tuple < const char *, std::string, std::string_view, ircd::string_view, ircd::json::string, ircd::json::object, ircd::json::array > types; bool operator()(char *&out, const size_t &max, const spec &, const arg &val) const override; using specifier::specifier; } const string_specifier { "s"s }; decltype(string_specifier::types) string_specifier::types {}; struct bool_specifier :specifier { static const std::tuple < bool, char, unsigned char, short, unsigned short, int, unsigned int, long, unsigned long, long long, unsigned long long > types; bool operator()(char *&out, const size_t &max, const spec &, const arg &val) const override; using specifier::specifier; } const bool_specifier { { "b"s } }; decltype(bool_specifier::types) bool_specifier::types {}; struct signed_specifier :specifier { static const std::tuple < bool, char, unsigned char, short, unsigned short, int, unsigned int, long, unsigned long, long long, unsigned long long > types; bool operator()(char *&out, const size_t &max, const spec &, const arg &val) const override; using specifier::specifier; } const signed_specifier { { "d"s, "ld"s, "zd"s } }; decltype(signed_specifier::types) signed_specifier::types {}; struct unsigned_specifier :specifier { static const std::tuple < bool, char, unsigned char, short, unsigned short, int, unsigned int, long, unsigned long, long long, unsigned long long > types; bool operator()(char *&out, const size_t &max, const spec &, const arg &val) const override; using specifier::specifier; } const unsigned_specifier { { "u"s, "lu"s, "zu"s } }; struct hex_lowercase_specifier :specifier { static const std::tuple < bool, char, unsigned char, short, unsigned short, int, unsigned int, long, unsigned long, long long, unsigned long long > types; bool operator()(char *&out, const size_t &max, const spec &, const arg &val) const override; using specifier::specifier; } const hex_lowercase_specifier { { "x"s, "lx"s } }; decltype(hex_lowercase_specifier::types) hex_lowercase_specifier::types {}; decltype(unsigned_specifier::types) unsigned_specifier::types {}; struct float_specifier :specifier { static const std::tuple < char, unsigned char, short, unsigned short, int, unsigned int, long, unsigned long, float, double, long double > types; bool operator()(char *&out, const size_t &max, const spec &, const arg &val) const override; using specifier::specifier; } const float_specifier { { "f"s, "lf"s } }; decltype(float_specifier::types) float_specifier::types {}; struct char_specifier :specifier { bool operator()(char *&out, const size_t &max, const spec &, const arg &val) const override; using specifier::specifier; } const char_specifier { "c"s }; struct pointer_specifier :specifier { bool operator()(char *&out, const size_t &max, const spec &, const arg &val) const override; using specifier::specifier; } const pointer_specifier { "p"s }; } // namespace fmt } // namespace ircd using namespace ircd; fmt::snprintf::snprintf(internal_t, const mutable_buffer &out, const string_view &fmt, const va_rtti &v) try :out{out} ,fmt{[&fmt] { // start the member fmt variable at the first specifier (or end) const auto pos(fmt.find(SPECIFIER)); return pos != fmt.npos? fmt.substr(pos): string_view{}; }()} ,idx{0} { // If out has no size we have nothing to do, not even null terminate it. if(unlikely(empty(out))) return; // If fmt has no specifiers then we can just copy the fmt as best as // possible to the out buffer. if(empty(this->fmt)) { consume(this->out, strlcpy(this->out, fmt)); return; } // Copy everything from fmt up to the first specifier. assert(data(this->fmt) >= data(fmt)); append(const_buffer(data(fmt), data(this->fmt))); // Iterate auto it(begin(v)); for(size_t i(0); i < v.size() && !finished(); ++it, i++) { const void *const &ptr(get<0>(*it)); const std::type_index type(*get<1>(*it)); argument(std::make_tuple(ptr, type)); } } catch(const std::out_of_range &e) { throw invalid_format { "Format string requires more than %zu arguments.", v.size() }; } void fmt::snprintf::argument(const arg &val) { // The format string's front pointer is sitting on the specifier '%' // waiting to be parsed now. fmt::spec spec; auto &start(std::get<0>(this->fmt)); const auto &stop(std::get<1>(this->fmt)); if(qi::parse(start, stop, parser, spec)) handle_specifier(this->out, idx++, spec, val); // The parse advanced the front pointer of this->fmt to after the // specifier. Now we copy characters from here up until the // next specifier. const string_view fmt(start, stop); const auto nextpos(fmt.find(SPECIFIER)); append(const_buffer(fmt.substr(0, nextpos))); this->fmt = const_buffer { nextpos != fmt.npos? fmt.substr(nextpos): string_view{} }; } void fmt::snprintf::append(const const_buffer &src) { consume(out, strlcpy(out, src)); } size_t fmt::snprintf::remaining() const { return out.remaining()? out.remaining() - 1: 0; } bool fmt::snprintf::finished() const { return empty(fmt) || !remaining(); } fmt::specifier::specifier(const std::string &name) :specifier{{name}} { } fmt::specifier::specifier(const std::initializer_list &names) :names{names} { for(const auto &name : this->names) if(is_specifier(name)) throw error { "Specifier '%s' already registered\n", name }; for(const auto &name : this->names) specifiers.emplace(name, this); } fmt::specifier::~specifier() noexcept { for(const auto &name : names) specifiers.erase(name); } bool fmt::is_specifier(const string_view &name) { return specifiers.count(name); } void fmt::handle_specifier(mutable_buffer &out, const uint &idx, const spec &spec, const arg &val) try { const auto &type(get<1>(val)); const auto &handler(*specifiers.at(spec.name)); auto &outp(std::get<0>(out)); const size_t max(size(out)); if(unlikely(!handler(outp, max, spec, val))) throw invalid_type { "`%s' (%s) for format specifier '%s' for argument #%u", demangle(type.name()), type.name(), spec.name, idx }; } catch(const std::out_of_range &e) { throw invalid_format { "Unhandled specifier `%s' for argument #%u in format string", spec.name, idx }; } catch(const illegal &e) { throw illegal { "Specifier `%s' for argument #%u: %s", spec.name, idx, e.what() }; } template bool fmt::visit_type(const arg &val, lambda&& closure) { const auto &ptr(get<0>(val)); const auto &type(get<1>(val)); return type == typeid(T)? closure(*static_cast(ptr)) : false; } bool fmt::pointer_specifier::operator()(char *&out, const size_t &max, const spec &, const arg &val) const { using karma::ulong_; using karma::eps; using karma::maxwidth; static const auto throw_illegal([] { throw illegal("Not a pointer"); }); struct generator :karma::grammar { karma::rule pointer_hex { lit("0x") << karma::hex }; generator(): generator::base_type{pointer_hex} {} } static const generator; const auto &ptr(get<0>(val)); const auto &type(get<1>(val)); const void *const p(*static_cast(ptr)); return karma::generate(out, maxwidth(max)[generator] | eps[throw_illegal], uintptr_t(p)); } bool fmt::char_specifier::operator()(char *&out, const size_t &max, const spec &, const arg &val) const { using karma::eps; using karma::maxwidth; static const auto throw_illegal([] { throw illegal("Not a printable character"); }); struct generator :karma::grammar { karma::rule printable { karma::print ,"character" }; generator(): generator::base_type{printable} {} } static const generator; const auto &ptr(get<0>(val)); const auto &type(get<1>(val)); if(type == typeid(const char)) { const auto &c(*static_cast(ptr)); karma::generate(out, maxwidth(max)[generator] | eps[throw_illegal], c); return true; } else return false; } bool fmt::bool_specifier::operator()(char *&out, const size_t &max, const spec &, const arg &val) const { using karma::eps; using karma::maxwidth; static const auto throw_illegal([] { throw illegal("Failed to print signed value"); }); const auto closure([&](const bool &boolean) { using karma::maxwidth; struct generator :karma::grammar { karma::rule rule { karma::bool_ ,"boolean" }; generator(): generator::base_type{rule} {} } static const generator; return karma::generate(out, maxwidth(max)[generator] | eps[throw_illegal], boolean); }); return !until(types, [&](auto type) { return !visit_type(val, closure); }); } bool fmt::signed_specifier::operator()(char *&out, const size_t &max, const spec &spec, const arg &val) const { static const auto throw_illegal([] { throw illegal("Failed to print signed value"); }); const auto closure([&out, &max, &spec, &val] (const long &integer) { using karma::long_; struct generator :karma::grammar { karma::rule rule { long_ ,"signed long integer" }; _r1_type width; karma::rule aligned_left { karma::left_align(width)[rule] ,"left aligned" }; karma::rule aligned_right { karma::right_align(width)[rule] ,"right aligned" }; karma::rule aligned_center { karma::center(width)[rule] ,"center aligned" }; generator(): generator::base_type{rule} {} } static const generator; const auto &mw(maxwidth(max)); static const auto &ep(eps[throw_illegal]); if(!spec.width) return karma::generate(out, mw[generator] | ep, integer); if(spec.sign == '-') { const auto &g(generator.aligned_left(spec.width)); return karma::generate(out, mw[g] | ep, integer); } const auto &g(generator.aligned_right(spec.width)); return karma::generate(out, mw[g] | ep, integer); }); return !until(types, [&](auto type) { return !visit_type(val, closure); }); } bool fmt::unsigned_specifier::operator()(char *&out, const size_t &max, const spec &spec, const arg &val) const { static const auto throw_illegal([] { throw illegal("Failed to print unsigned value"); }); const auto closure([&out, &max, &spec, &val] (const ulong &integer) { using karma::ulong_; struct generator :karma::grammar { karma::rule rule { ulong_ ,"unsigned long integer" }; _r1_type width; karma::rule aligned_left { karma::left_align(width)[rule] ,"left aligned" }; karma::rule aligned_right { karma::right_align(width)[rule] ,"right aligned" }; karma::rule aligned_center { karma::center(width)[rule] ,"center aligned" }; generator(): generator::base_type{rule} {} } static const generator; const auto &mw(maxwidth(max)); static const auto &ep(eps[throw_illegal]); if(!spec.width) return karma::generate(out, mw[generator] | ep, integer); if(spec.sign == '-') { const auto &g(generator.aligned_left(spec.width)); return karma::generate(out, mw[g] | ep, integer); } const auto &g(generator.aligned_right(spec.width)); return karma::generate(out, mw[g] | ep, integer); }); return !until(types, [&](auto type) { return !visit_type(val, closure); }); } bool fmt::hex_lowercase_specifier::operator()(char *&out, const size_t &max, const spec &s, const arg &val) const { static const auto throw_illegal([] { throw illegal("Failed to print hexadecimal value"); }); const auto closure([&](const uint &integer) { using karma::maxwidth; struct generator :karma::grammar { karma::rule rule { karma::lower[karma::hex] ,"unsigned lowercase hexadecimal" }; generator(): generator::base_type{rule} {} } static const generator; return karma::generate(out, maxwidth(max)[generator] | eps[throw_illegal], integer); }); return !until(types, [&](auto type) { return !visit_type(val, closure); }); } bool fmt::float_specifier::operator()(char *&out, const size_t &max, const spec &s, const arg &val) const { static const auto throw_illegal([] { throw illegal("Failed to print floating point value"); }); thread_local uint _precision_; _precision_ = s.precision; const auto closure([&](const long double &floating) { using karma::double_; using karma::maxwidth; struct generator :karma::grammar { struct policy :karma::real_policies { static uint precision(const long double &) { return _precision_; } static bool trailing_zeros(const long double &) { return _precision_ > 0; } }; karma::rule rule { karma::real_generator() ,"floating point real" }; generator(): generator::base_type{rule} {} } static const generator; return karma::generate(out, maxwidth(max)[generator] | eps[throw_illegal], floating); }); return !until(types, [&](auto type) { return !visit_type(val, closure); }); } bool fmt::string_specifier::operator()(char *&out, const size_t &max, const spec &spec, const arg &val) const { using karma::char_; using karma::eps; using karma::maxwidth; using karma::unused_type; static const auto throw_illegal([] { throw illegal("Not a printable string"); }); struct generator :karma::grammar { karma::rule string { *(karma::print) ,"string" }; _r1_type width; karma::rule aligned_left { karma::left_align(width)[string] ,"left aligned" }; karma::rule aligned_right { karma::right_align(width)[string] ,"right aligned" }; karma::rule aligned_center { karma::center(width)[string] ,"center aligned" }; generator() :generator::base_type{string} {} } static const generator; const auto &mw(maxwidth(max)); static const auto &ep(eps[throw_illegal]); if(!spec.width) return generate_string(out, mw[generator] | ep, val); if(spec.sign == '-') { const auto &g(generator.aligned_left(spec.width)); return generate_string(out, mw[g] | ep, val); } const auto &g(generator.aligned_right(spec.width)); return generate_string(out, mw[g] | ep, val); } template bool fmt::generate_string(char *&out, const generator &gen, const arg &val) { using karma::eps; const auto &ptr(get<0>(val)); const auto &type(get<1>(val)); if(type == typeid(ircd::string_view) || type == typeid(ircd::json::string) || type == typeid(ircd::json::object) || type == typeid(ircd::json::array)) { const auto &str(*static_cast(ptr)); return karma::generate(out, gen, str); } else if(type == typeid(std::string_view)) { const auto &str(*static_cast(ptr)); return karma::generate(out, gen, str); } else if(type == typeid(std::string)) { const auto &str(*static_cast(ptr)); return karma::generate(out, gen, string_view{str}); } else if(type == typeid(const char *)) { const char *const &str{*static_cast(ptr)}; return karma::generate(out, gen, string_view{str}); } // This for string literals which have unique array types depending on their size. // There is no reasonable way to match them. The best that can be hoped for is the // grammar will fail gracefully (most of the time) or not print something bogus when // it happens to be legal. const auto &str(static_cast(ptr)); return karma::generate(out, gen, string_view{str}); }