// // docopt.cpp // docopt // // Created by Jared Grubb on 2013-11-03. // Copyright (c) 2013 Jared Grubb. All rights reserved. // //#define DOCTOPT_USE_BOOST_REGEX 1 #include "docopt.h" #include "docopt_util.h" #include "docopt_private.h" #include "docopt_value.h" #include #include #include #include #include #include #include #include using namespace docopt; DOCOPT_INLINE std::ostream& docopt::operator<<(std::ostream& os, value const& val) { if (val.isBool()) { bool b = val.asBool(); os << (b ? "true" : "false"); } else if (val.isLong()) { long v = val.asLong(); os << v; } else if (val.isString()) { std::string const& str = val.asString(); os << '"' << str << '"'; } else if (val.isStringList()) { auto const& list = val.asStringList(); os << "["; bool first = true; for(auto const& el : list) { if (first) { first = false; } else { os << ", "; } os << '"' << el << '"'; } os << "]"; } else { os << "null"; } return os; } #if 0 #pragma mark - #pragma mark Parsing stuff #endif class Tokens { public: Tokens(std::vector tokens, bool isParsingArgv = true) : fTokens(std::move(tokens)), fIsParsingArgv(isParsingArgv) {} explicit operator bool() const { return fIndex < fTokens.size(); } static Tokens from_pattern(std::string const& source) { static const std::regex re_separators { "(?:\\s*)" // any spaces (non-matching subgroup) "(" "[\\[\\]\\(\\)\\|]" // one character of brackets or parens or pipe character "|" "\\.\\.\\." // elipsis ")" }; static const std::regex re_strings { "(?:\\s*)" // any spaces (non-matching subgroup) "(" "\\S*<.*?>" // strings, but make sure to keep "< >" strings together "|" "[^<>\\s]+" // string without <> ")" }; // We do two stages of regex matching. The '[]()' and '...' are strong delimeters // and need to be split out anywhere they occur (even at the end of a token). We // first split on those, and then parse the stuff between them to find the string // tokens. This is a little harder than the python version, since they have regex.split // and we dont have anything like that. std::vector tokens; std::for_each(std::sregex_iterator{ source.begin(), source.end(), re_separators }, std::sregex_iterator{}, [&](std::smatch const& match) { // handle anything before the separator (this is the "stuff" between the delimeters) if (match.prefix().matched) { std::for_each(std::sregex_iterator{match.prefix().first, match.prefix().second, re_strings}, std::sregex_iterator{}, [&](std::smatch const& m) { tokens.push_back(m[1].str()); }); } // handle the delimter token itself if (match[1].matched) { tokens.push_back(match[1].str()); } }); return Tokens(tokens, false); } std::string const& current() const { if (*this) return fTokens[fIndex]; static std::string const empty; return empty; } std::string the_rest() const { if (!*this) return {}; return join(fTokens.begin()+static_cast(fIndex), fTokens.end(), " "); } std::string pop() { return std::move(fTokens.at(fIndex++)); } bool isParsingArgv() const { return fIsParsingArgv; } struct OptionError : std::runtime_error { using runtime_error::runtime_error; }; private: std::vector fTokens; size_t fIndex = 0; bool fIsParsingArgv; }; // Get all instances of 'T' from the pattern template std::vector flat_filter(Pattern& pattern) { std::vector flattened = pattern.flat([](Pattern const* p) -> bool { return dynamic_cast(p) != nullptr; }); // now, we're guaranteed to have T*'s, so just use static_cast std::vector ret; std::transform(flattened.begin(), flattened.end(), std::back_inserter(ret), [](Pattern* p) { return static_cast(p); }); return ret; } static std::vector parse_section( std::string const& name, std::string const& source ) { #ifndef _MSC_VER // ECMAScript regex only has "?=" for a non-matching lookahead. In order to make sure we always have // a newline to anchor our matching, we have to avoid matching the final newline of each grouping. // Therefore, our regex is adjusted from the docopt Python one to use ?= to match the newlines before // the following lines, rather than after. std::regex const re_section_pattern{ "(?:^|\\n)" // anchored at a linebreak (or start of string) "(" "[^\\n]*" + name + "[^\\n]*(?=\\n?)" // a line that contains the name "(?:\\n[ \\t].*?(?=\\n|$))*" // followed by any number of lines that are indented ")", std::regex::icase }; std::vector ret; std::for_each( std::sregex_iterator( source.begin(), source.end(), re_section_pattern ), std::sregex_iterator(), [&]( std::smatch const& match ) { ret.push_back( trim( match[1].str() ) ); } ); return ret; #else //Parse the sections in a more old-fashioned way in order to avoid stack overflows in Microsoft's regex implementation std::regex const re_section_start_pattern{ "(?:^|\\n)[^\\n]*" + name, std::regex::icase }; std::sregex_iterator const re_end; std::vector ret; auto const source_end = source.end(); std::sregex_iterator section_head( source.begin(), source_end, re_section_start_pattern ); for (; section_head != re_end; ++section_head) { //We found a section header auto section_start = source.begin() + section_head->position(); if (*section_start == '\n') ++section_start; //If it is positioned on a newline, move ahead one char //Add the complete header line to the section auto section_end = std::find( section_start, source_end, '\n' ); if (section_end != source_end) ++section_end; //skip '\n' while (section_end != source_end) { //Add subsequent lines to the section if they're indented if (*section_end != '\t' && *section_end != ' ') break; //Unindented lines end the section section_end = std::find( section_end, source_end, '\n' ); if (section_end != source_end) ++section_end; //skip '\n' } ret.push_back( trim( { section_start,section_end } ) ); } return ret; #endif } static bool is_argument_spec(std::string const& token) { if (token.empty()) return false; if (token[0]=='<' && token[token.size()-1]=='>') return true; if (std::all_of(token.begin(), token.end(), &::isupper)) return true; return false; } template std::vector longOptions(I iter, I end) { std::vector ret; std::transform(iter, end, std::back_inserter(ret), [](typename I::reference opt) { return opt->longOption(); }); return ret; } static PatternList parse_long(Tokens& tokens, std::vector