123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399 |
- /* Distributed under the OSI-approved BSD 3-Clause License. See accompanying
- file Copyright.txt or https://cmake.org/licensing for details. */
- #pragma once
- #include "cmConfigure.h" // IWYU pragma: keep
- #include <cctype>
- #include <cstring>
- #include <initializer_list>
- #include <iterator>
- #include <numeric>
- #include <sstream>
- #include <string>
- #include <utility>
- #include <vector>
- #include <cm/string_view>
- #include "cmRange.h"
- #include "cmValue.h"
- /** String range type: a cmRange over std::vector<std::string>::const_iterator. */
- using cmStringRange = cmRange<std::vector<std::string>::const_iterator>;
/**
 * Returns the length of a string literal.
 *
 * The array extent @c N is deduced from the argument; one is subtracted
 * from it to leave out the terminating NUL character of a literal.
 */
template <size_t N>
constexpr size_t cmStrLen(const char (&)[N])
{
  return N - size_t(1);
}
- /** Callable string comparison struct. */
- struct cmStrCmp
- {
- cmStrCmp(std::string str)
- : Test_(std::move(str))
- {
- }
- bool operator()(cm::string_view sv) const { return this->Test_ == sv; }
- private:
- std::string const Test_;
- };
- /**
- * Test if two strings are identical, ignoring case.
- *
- * Note that this is not guaranteed to work correctly on non-ASCII strings.
- *
- * @param a First string to compare.
- * @param b Second string to compare.
- * @return true if @a a and @a b are identical when case is ignored.
- * The function is only declared here; the comparison rules are defined
- * by the out-of-line implementation.
- */
- bool cmStrCaseEq(cm::string_view a, cm::string_view b);
/** Returns true if the character @a ch is a whitespace character. */
inline bool cmIsSpace(char ch)
{
  // std::isspace takes an 'int' whose value must be representable as
  // 'unsigned char' (or be EOF). Going through 'unsigned char' first keeps
  // a negative 'char' from being sign-extended into an invalid argument.
  auto const code = static_cast<unsigned char>(ch);
  return std::isspace(code) != 0;
}
- /** Returns a copy of @a str that has whitespace removed from the start and
- * the end. Declared here only. NOTE(review): "whitespace" presumably
- * matches cmIsSpace -- confirm against the implementation. */
- std::string cmTrimWhitespace(cm::string_view str);
- /** Returns a copy of @a str that has quotes removed from the start and the
- * end. Declared here only. NOTE(review): which quote characters are
- * recognized is not visible here -- confirm against the implementation. */
- std::string cmRemoveQuotes(cm::string_view str);
- /** Returns a copy of @a str in which quotes are escaped. Declared here
- * only. NOTE(review): the escape sequence used is not visible here --
- * confirm against the implementation. */
- std::string cmEscapeQuotes(cm::string_view str);
- /** Joins elements of a range with separator into a single string. */
- template <typename Range>
- std::string cmJoin(Range const& rng, cm::string_view separator)
- {
- if (rng.empty()) {
- return std::string();
- }
- std::ostringstream os;
- auto it = rng.begin();
- auto const end = rng.end();
- os << *it;
- while (++it != end) {
- os << separator << *it;
- }
- return os.str();
- }
- /** Generic function to join strings range with separator
- * and initial leading string into a single string.
- */
- template <typename Range>
- std::string cmJoinStrings(Range const& rng, cm::string_view separator,
- cm::string_view initial)
- {
- if (rng.empty()) {
- return { std::begin(initial), std::end(initial) };
- }
- std::string result;
- result.reserve(std::accumulate(
- std::begin(rng), std::end(rng),
- initial.size() + (rng.size() - 1) * separator.size(),
- [](std::size_t sum, typename Range::value_type const& item) {
- return sum + item.size();
- }));
- result.append(std::begin(initial), std::end(initial));
- auto begin = std::begin(rng);
- auto end = std::end(rng);
- result += *begin;
- for (++begin; begin != end; ++begin) {
- result.append(std::begin(separator), std::end(separator));
- result += *begin;
- }
- return result;
- }
- /**
- * Faster overloads for std::string ranges.
- * If @a initial is provided, it is prepended to the resulting string
- * without a @a separator between it and the first element.
- * @a initial defaults to an empty view.
- */
- std::string cmJoin(std::vector<std::string> const& rng,
- cm::string_view separator, cm::string_view initial = {});
- std::string cmJoin(cmStringRange const& rng, cm::string_view separator,
- cm::string_view initial = {});
- enum class cmTokenizerMode
- {
- /// Backward-compatible behavior: when no tokens have been found
- /// in the input text, one empty token is returned in the
- /// result container (vector).
- Legacy,
- /// New behavior: when no tokens have been found, an empty vector is returned.
- New
- };
- /**
- * \brief A generic version of a tokenizer.
- *
- * Extract tokens from the input string separated by any
- * of the characters in `sep` and assign them to the
- * given output iterator.
- *
- * The `mode` parameter defines the behavior in the case when
- * no tokens have found in the input text.
- *
- */
- template <typename StringT, typename OutIt, typename Sep = char>
- void cmTokenize(OutIt outIt, cm::string_view str, Sep sep,
- cmTokenizerMode mode)
- {
- auto hasTokens = false;
- // clang-format off
- for (auto start = str.find_first_not_of(sep)
- , end = str.find_first_of(sep, start)
- ; start != cm::string_view::npos
- ; start = str.find_first_not_of(sep, end)
- , end = str.find_first_of(sep, start)
- , hasTokens = true
- ) {
- *outIt++ = StringT{ str.substr(start, end - start) };
- }
- // clang-format on
- if (!hasTokens && mode == cmTokenizerMode::Legacy) {
- *outIt = {};
- }
- }
- /**
- * \brief Extract tokens that are separated by any of the
- * characters in `sep`.
- *
- * Backward compatible signature.
- *
- * \return A vector of strings.
- */
- template <typename Sep = char>
- std::vector<std::string> cmTokenize(
- cm::string_view str, Sep sep, cmTokenizerMode mode = cmTokenizerMode::Legacy)
- {
- using StringType = std::string;
- std::vector<StringType> tokens;
- cmTokenize<StringType>(std::back_inserter(tokens), str, sep, mode);
- return tokens;
- }
- /**
- * \brief Extract tokens that are separated by any of the
- * characters in `sep`.
- *
- * \return A vector of string views.
- */
- template <typename Sep = char>
- std::vector<cm::string_view> cmTokenizedView(
- cm::string_view str, Sep sep, cmTokenizerMode mode = cmTokenizerMode::Legacy)
- {
- using StringType = cm::string_view;
- std::vector<StringType> tokens;
- cmTokenize<StringType>(std::back_inserter(tokens), str, sep, mode);
- return tokens;
- }
- /** Concatenate string pieces into a single string.
- *
- * Each element of @a views pairs the view of one piece with a pointer to
- * a std::string. cmStrCat passes the address of an rvalue string
- * argument in that pointer and nullptr for all other arguments.
- * NOTE(review): how the implementation uses a non-null pointer is not
- * visible here -- confirm against the definition. */
- std::string cmCatViews(
- std::initializer_list<std::pair<cm::string_view, std::string*>> views);
- /** Utility class for cmStrCat. */
- class cmAlphaNum
- {
- public:
- cmAlphaNum(cm::string_view view)
- : View_(view)
- {
- }
- cmAlphaNum(std::string const& str)
- : View_(str)
- {
- }
- cmAlphaNum(std::string&& str)
- : RValueString_(&str)
- {
- }
- cmAlphaNum(const char* str)
- : View_(str ? cm::string_view(str) : cm::string_view())
- {
- }
- cmAlphaNum(char ch)
- : View_(this->Digits_, 1)
- {
- this->Digits_[0] = ch;
- }
- cmAlphaNum(int val);
- cmAlphaNum(unsigned int val);
- cmAlphaNum(long int val);
- cmAlphaNum(unsigned long int val);
- cmAlphaNum(long long int val);
- cmAlphaNum(unsigned long long int val);
- cmAlphaNum(float val);
- cmAlphaNum(double val);
- cmAlphaNum(cmValue value)
- : View_(*value)
- {
- }
- cm::string_view View() const
- {
- if (this->RValueString_) {
- return *this->RValueString_;
- }
- return this->View_;
- }
- std::string* RValueString() const { return this->RValueString_; }
- private:
- std::string* RValueString_ = nullptr;
- cm::string_view View_;
- char Digits_[32];
- };
- /** Concatenate string pieces and numbers into a single string. */
- template <typename A, typename B, typename... AV>
- inline std::string cmStrCat(A&& a, B&& b, AV&&... args)
- {
- static auto const makePair =
- [](const cmAlphaNum& arg) -> std::pair<cm::string_view, std::string*> {
- return { arg.View(), arg.RValueString() };
- };
- return cmCatViews({ makePair(std::forward<A>(a)),
- makePair(std::forward<B>(b)),
- makePair(std::forward<AV>(args))... });
- }
- /** Joins wrapped elements of a range with separator into a single string. */
- template <typename Range>
- std::string cmWrap(cm::string_view prefix, Range const& rng,
- cm::string_view suffix, cm::string_view sep)
- {
- if (rng.empty()) {
- return std::string();
- }
- return cmCatViews({ { prefix, nullptr },
- { cmJoin(rng,
- cmCatViews({ { suffix, nullptr },
- { sep, nullptr },
- { prefix, nullptr } })),
- nullptr },
- { suffix, nullptr } });
- }
- /** Joins wrapped elements of a range with separator into a single string. */
- template <typename Range>
- std::string cmWrap(char prefix, Range const& rng, char suffix,
- cm::string_view sep)
- {
- return cmWrap(cm::string_view(&prefix, 1), rng, cm::string_view(&suffix, 1),
- sep);
- }
- /** Returns true if string @a str starts with the character @a prefix. */
- inline bool cmHasPrefix(cm::string_view str, char prefix)
- {
- return !str.empty() && (str.front() == prefix);
- }
- /** Returns true if string @a str starts with string @a prefix. */
- inline bool cmHasPrefix(cm::string_view str, cm::string_view prefix)
- {
- return str.compare(0, prefix.size(), prefix) == 0;
- }
- /** Returns true if string @a str starts with string @a prefix. */
- inline bool cmHasPrefix(cm::string_view str, cmValue prefix)
- {
- if (!prefix) {
- return false;
- }
- return str.compare(0, prefix->size(), *prefix) == 0;
- }
- /** Returns true if string @a str starts with string @a prefix. */
- template <size_t N>
- inline bool cmHasLiteralPrefix(cm::string_view str, const char (&prefix)[N])
- {
- return cmHasPrefix(str, cm::string_view(prefix, N - 1));
- }
- /** Returns true if string @a str ends with the character @a suffix. */
- inline bool cmHasSuffix(cm::string_view str, char suffix)
- {
- return !str.empty() && (str.back() == suffix);
- }
- /** Returns true if string @a str ends with string @a suffix. */
- inline bool cmHasSuffix(cm::string_view str, cm::string_view suffix)
- {
- return str.size() >= suffix.size() &&
- str.compare(str.size() - suffix.size(), suffix.size(), suffix) == 0;
- }
- /** Returns true if string @a str ends with string @a suffix. */
- inline bool cmHasSuffix(cm::string_view str, cmValue suffix)
- {
- if (!suffix) {
- return false;
- }
- return str.size() >= suffix->size() &&
- str.compare(str.size() - suffix->size(), suffix->size(), *suffix) == 0;
- }
- /** Returns true if string @a str ends with string @a suffix. */
- template <size_t N>
- inline bool cmHasLiteralSuffix(cm::string_view str, const char (&suffix)[N])
- {
- return cmHasSuffix(str, cm::string_view(suffix, N - 1));
- }
- /** Removes an existing suffix character of from the string @a str. */
- inline void cmStripSuffixIfExists(std::string& str, char suffix)
- {
- if (cmHasSuffix(str, suffix)) {
- str.pop_back();
- }
- }
- /** Removes an existing suffix string of from the string @a str. */
- inline void cmStripSuffixIfExists(std::string& str, cm::string_view suffix)
- {
- if (cmHasSuffix(str, suffix)) {
- str.resize(str.size() - suffix.size());
- }
- }
- /** Converts a string to long. Expects that the whole string is an integer.
- * The result is passed back through @a value. NOTE(review): the bool
- * return presumably reports whether the conversion succeeded -- confirm
- * against the implementation. */
- bool cmStrToLong(const char* str, long* value);
- bool cmStrToLong(std::string const& str, long* value);
- /** Converts a string to unsigned long. Expects that the whole string is an
- * integer. The result is passed back through @a value. NOTE(review): the
- * bool return presumably reports whether the conversion succeeded --
- * confirm against the implementation. */
- bool cmStrToULong(const char* str, unsigned long* value);
- bool cmStrToULong(std::string const& str, unsigned long* value);
- /** Converts a string to long long. Expects that the whole string
- * is an integer. The result is passed back through @a value.
- * NOTE(review): the bool return presumably reports whether the
- * conversion succeeded -- confirm against the implementation. */
- bool cmStrToLongLong(const char* str, long long* value);
- bool cmStrToLongLong(std::string const& str, long long* value);
- /** Converts a string to unsigned long long. Expects that the whole string
- * is an integer. The result is passed back through @a value.
- * NOTE(review): the bool return presumably reports whether the
- * conversion succeeded -- confirm against the implementation. */
- bool cmStrToULongLong(const char* str, unsigned long long* value);
- bool cmStrToULongLong(std::string const& str, unsigned long long* value);
|