mijin2/source/mijin/util/string.hpp

327 lines
9.0 KiB
C++

#pragma once
#if !defined(MIJIN_UTIL_STRING_HPP_INCLUDED)
#define MIJIN_UTIL_STRING_HPP_INCLUDED 1
#include <algorithm>
#include <array>
#include <charconv>
#include <iterator>
#include <limits>
#include <locale>
#include <sstream>
#include <string>
#include <string_view>
#include <vector>
#include "./iterators.hpp"
namespace mijin
{
//
// public defines
//
//
// public constants
//
//
// public traits
//
template<typename TString>
using char_type_t = decltype(std::string_view(std::declval<TString>()))::value_type;
//
// public types
//
struct SplitOptions
{
std::size_t limitParts = std::numeric_limits<std::size_t>::max();
bool ignoreEmpty = true;
};
//
// public functions
//
template <typename TRange, typename TValue = typename TRange::value_type>
[[nodiscard]] std::string join(const TRange& elements, const char* const delimiter)
{
std::ostringstream oss;
auto first = std::begin(elements);
auto last = std::end(elements);
if (first != last)
{
std::copy(first, std::prev(last), std::ostream_iterator<TValue>(oss, delimiter));
first = std::prev(last);
}
if (first != last)
{
oss << *first;
}
return oss.str();
}
namespace detail
{
template<typename TChar, typename TTraits>
std::vector<std::basic_string_view<TChar, TTraits>> splitImpl(std::basic_string_view<TChar, TTraits> stringView,
std::basic_string_view<TChar, TTraits> separator,
const SplitOptions& options)
{
using sv_t = std::basic_string_view<TChar, TTraits>;
MIJIN_ASSERT(options.limitParts > 0, "Cannot split to zero parts.");
MIJIN_ASSERT(!separator.empty(), "Separator cannot be empty.");
if (separator.empty())
{
return {};
}
std::vector<sv_t> result;
if (options.limitParts <= 1)
{
result.push_back(stringView);
return result;
}
auto start = stringView.begin();
auto pos = start;
const auto end = stringView.end();
auto seperatorFound = [&]()
{
return pos <= (end - separator.size()) && sv_t(pos, pos + separator.size()) == separator;
};
while (pos != end)
{
if (seperatorFound())
{
if (!options.ignoreEmpty || pos != start)
{
result.emplace_back(start, pos);
}
start = pos = (pos + separator.size());
if (result.size() == options.limitParts - 1)
{
if (options.ignoreEmpty)
{
while (seperatorFound())
{
pos += separator.size();
}
}
result.emplace_back(pos, end);
return result;
}
if (!options.ignoreEmpty && pos == end)
{
// skipped a separator at the very end, add an empty entry
result.emplace_back("");
return result;
}
}
else
{
++pos;
}
}
if (start != end)
{
result.emplace_back(start, end);
}
return result;
}
template<typename TChar, typename TTraitsA, typename TTraitsB>
bool equalsIgnoreCaseImpl(std::basic_string_view<TChar, TTraitsA> stringA, std::basic_string_view<TChar, TTraitsB> stringB) noexcept
{
if (stringA.size() != stringB.size())
{
return false;
}
for (const auto [charA, charB] : zip(stringA, stringB))
{
if (std::tolower(charA) != std::tolower(charB))
{
return false;
}
}
return true;
}
template<typename TChar, typename TTraits>
std::basic_string_view<TChar, TTraits> trimPrefixImpl(std::basic_string_view<TChar, TTraits> stringView,
std::basic_string_view<TChar, TTraits> charsToTrim)
{
stringView.remove_prefix(std::min(stringView.find_first_not_of(charsToTrim), stringView.size()));
return stringView;
}
template<typename TChar, typename TTraits>
std::basic_string_view<TChar, TTraits> trimSuffixImpl(std::basic_string_view<TChar, TTraits> stringView,
std::basic_string_view<TChar, TTraits> charsToTrim)
{
stringView.remove_suffix(stringView.size() - std::min(stringView.find_last_not_of(charsToTrim) + 1, stringView.size()));
return stringView;
}
template<typename TChar, typename TTraits>
std::basic_string_view<TChar, TTraits> trimImpl(std::basic_string_view<TChar, TTraits> stringView,
std::basic_string_view<TChar, TTraits> charsToTrim)
{
return trimPrefixImpl(trimSuffixImpl(stringView, charsToTrim), charsToTrim);
}
template<typename TChar>
static const std::array DEFAULT_TRIM_CHARS_DATA = {TChar(' '), TChar('\t'), TChar('\r'), TChar('\n')};
template<typename TChar>
static const std::basic_string_view<TChar, std::char_traits<TChar>> DEFAULT_TRIM_CHARS
= {DEFAULT_TRIM_CHARS_DATA<TChar>.begin(), DEFAULT_TRIM_CHARS_DATA<TChar>.end()};
}
template<typename TLeft, typename TRight>
[[nodiscard]] auto split(TLeft&& stringView, TRight&& separator, const SplitOptions& options = {})
{
return detail::splitImpl(std::basic_string_view(std::forward<TLeft>(stringView)),
std::basic_string_view(std::forward<TRight>(separator)), options);
}
template<typename TString, typename TChars>
[[nodiscard]]
auto trimPrefix(TString&& string, TChars&& chars)
{
return detail::trimPrefixImpl(std::string_view(std::forward<TString>(string)), std::string_view(std::forward<TChars>(chars)));
}
template<typename TString>
[[nodiscard]]
auto trimPrefix(TString&& string)
{
return trimPrefix(string, detail::DEFAULT_TRIM_CHARS<char_type_t<TString>>);
}
template<typename TString, typename TChars>
[[nodiscard]]
auto trimSuffix(TString&& string, TChars&& chars)
{
return detail::trimSuffixImpl(std::string_view(std::forward<TString>(string)), std::string_view(std::forward<TChars>(chars)));
}
template<typename TString>
[[nodiscard]]
auto trimSuffix(TString&& string)
{
return trimSuffix(string, detail::DEFAULT_TRIM_CHARS<char_type_t<TString>>);
}
template<typename TString, typename TChars>
[[nodiscard]]
auto trim(TString&& string, TChars&& chars)
{
return detail::trimImpl(std::string_view(std::forward<TString>(string)), std::string_view(std::forward<TChars>(chars)));
}
template<typename TString>
[[nodiscard]]
auto trim(TString&& string)
{
return trim(string, detail::DEFAULT_TRIM_CHARS<char_type_t<TString>>);
}
template<typename TLeft, typename TRight>
[[nodiscard]] bool equalsIgnoreCase(TLeft&& left, TRight&& right) noexcept
{
return detail::equalsIgnoreCaseImpl(std::string_view(left), std::string_view(right));
}
template<typename TChar, typename TTraits, typename TAllocator>
constexpr void makeLower(std::basic_string<TChar, TTraits, TAllocator>& string)
{
std::transform(string.begin(), string.end(), string.begin(), [locale = std::locale()](TChar chr)
{
return std::tolower<TChar>(chr, locale);
});
}
template<typename TChar, typename TTraits, typename TAllocator>
constexpr void makeUpper(std::basic_string<TChar, TTraits, TAllocator>& string)
{
std::transform(string.begin(), string.end(), string.begin(), [locale = std::locale()](TChar chr)
{
return std::toupper<TChar>(chr, locale);
});
}
template<typename... TArgs>
[[nodiscard]]
constexpr auto toLower(TArgs&&... args)
{
std::basic_string string(std::forward<TArgs>(args)...);
makeLower(string);
return string;
}
template<typename... TArgs>
[[nodiscard]]
constexpr auto toUpper(TArgs&&... args)
{
std::basic_string string(std::forward<TArgs>(args)...);
makeUpper(string);
return string;
}
template<typename TNumber>
[[nodiscard]]
constexpr bool toNumber(std::string_view stringView, TNumber& outNumber, int base = 10) noexcept
{
const char* start = &*stringView.begin();
const char* end = start + stringView.size();
const std::from_chars_result res = std::from_chars(start, end, outNumber, base);
return res.ec == std::errc{} && res.ptr == end;
}
template<typename TChar, typename TTraits, typename TNumber>
[[nodiscard]]
constexpr bool toNumber(std::basic_string_view<TChar, TTraits> stringView, TNumber& outNumber, int base = 10) noexcept requires (!std::is_same_v<TChar, char>)
{
std::string asString;
asString.resize(stringView.size());
// should only contain number symbols, so just cast down to char
std::transform(stringView.begin(), stringView.end(), asString.begin(), [](TChar chr) { return static_cast<char>(chr); });
return toNumber(asString, outNumber, base);
}
namespace pipe
{
struct Join
{
const char* delimiter;
explicit Join(const char* delimiter_) noexcept : delimiter(delimiter_) {}
};
template<typename TIterable>
auto operator|(TIterable&& iterable, const Join& joiner)
{
return join(std::forward<TIterable>(iterable), joiner.delimiter);
}
}
} // namespace mijin
#endif // !defined(MIJIN_UTIL_STRING_HPP_INCLUDED)