387 lines
		
	
	
		
			11 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
			
		
		
	
	
			387 lines
		
	
	
		
			11 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
| 
 | |
| #pragma once
 | |
| 
 | |
| #if !defined(MIJIN_UTIL_STRING_HPP_INCLUDED)
 | |
| #define MIJIN_UTIL_STRING_HPP_INCLUDED 1
 | |
| 
 | |
| #include <algorithm>
 | |
| #include <array>
 | |
| #include <charconv>
 | |
| #include <iterator>
 | |
| #include <limits>
 | |
| #include <locale>
 | |
| #include <sstream>
 | |
| #include <string>
 | |
| #include <string_view>
 | |
| #include <vector>
 | |
| 
 | |
| #include "./iterators.hpp"
 | |
| #include "../internal/common.hpp"
 | |
| 
 | |
| namespace mijin
 | |
| {
 | |
| 
 | |
| //
 | |
| // public defines
 | |
| //
 | |
| 
 | |
| //
 | |
| // public constants
 | |
| //
 | |
| 
 | |
| //
 | |
| // public traits
 | |
| //
 | |
| 
 | |
| template<typename TString>
 | |
| using char_type_t = decltype(std::string_view(std::declval<TString>()))::value_type;
 | |
| 
 | |
| //
 | |
| // public types
 | |
| //
 | |
| 
 | |
| struct SplitOptions
 | |
| {
 | |
|     std::size_t limitParts = std::numeric_limits<std::size_t>::max();
 | |
|     bool ignoreEmpty = true;
 | |
| };
 | |
| 
 | |
| //
 | |
| // public functions
 | |
| //
 | |
| 
 | |
| template <typename TRange, typename TValue = typename TRange::value_type>
 | |
| [[nodiscard]] std::string join(const TRange& elements, const char* const delimiter)
 | |
| {
 | |
|     std::ostringstream oss;
 | |
|     auto first = std::begin(elements);
 | |
|     auto last = std::end(elements);
 | |
| 
 | |
|     if (first != last)
 | |
|     {
 | |
|         std::copy(first, std::prev(last), std::ostream_iterator<TValue>(oss, delimiter));
 | |
|         first = std::prev(last);
 | |
|     }
 | |
|     if (first != last)
 | |
|     {
 | |
|         oss << *first;
 | |
|     }
 | |
| 
 | |
|     return oss.str();
 | |
| }
 | |
| 
 | |
| namespace detail
 | |
| {
 | |
| template<typename TChar, typename TTraits, typename TOutIterator>
 | |
| void splitImpl(std::basic_string_view<TChar, TTraits> stringView,
 | |
|                std::basic_string_view<TChar, TTraits> separator,
 | |
|                const SplitOptions& options,
 | |
|                TOutIterator outIterator,
 | |
|                std::size_t& numEmitted)
 | |
| {
 | |
|     using sv_t = std::basic_string_view<TChar, TTraits>;
 | |
| 
 | |
|     MIJIN_ASSERT(options.limitParts > 0, "Cannot split to zero parts.");
 | |
|     MIJIN_ASSERT(!separator.empty(), "Separator cannot be empty.");
 | |
| 
 | |
|     if (separator.empty())
 | |
|     {
 | |
|         return;
 | |
|     }
 | |
| 
 | |
|     auto emit = [&](std::string_view result)
 | |
|     {
 | |
|         *outIterator = result;
 | |
|         ++outIterator;
 | |
|         ++numEmitted;
 | |
|     };
 | |
| 
 | |
|     if (options.limitParts <= 1)
 | |
|     {
 | |
|         emit(stringView);
 | |
|         return;
 | |
|     }
 | |
|     auto start = stringView.begin();
 | |
|     auto pos = start;
 | |
|     const auto end = stringView.end();
 | |
| 
 | |
|     auto seperatorFound = [&]()
 | |
|     {
 | |
|         return pos <= (end - separator.size()) && sv_t(pos, pos + separator.size()) == separator;
 | |
|     };
 | |
| 
 | |
|     while (pos != end)
 | |
|     {
 | |
|         if (seperatorFound())
 | |
|         {
 | |
|             if (!options.ignoreEmpty || pos != start)
 | |
|             {
 | |
|                 emit(std::string_view(start, pos));
 | |
|             }
 | |
|             start = pos = (pos + separator.size());
 | |
|             if (numEmitted == options.limitParts - 1)
 | |
|             {
 | |
|                 if (options.ignoreEmpty)
 | |
|                 {
 | |
|                     while (seperatorFound())
 | |
|                     {
 | |
|                         pos += separator.size();
 | |
|                     }
 | |
|                 }
 | |
|                 emit(std::string_view(pos, end));
 | |
|                 return;
 | |
|             }
 | |
|             if (!options.ignoreEmpty && pos == end)
 | |
|             {
 | |
|                 // skipped a separator at the very end, add an empty entry
 | |
|                 emit("");
 | |
|                 return;
 | |
|             }
 | |
|         }
 | |
|         else
 | |
|         {
 | |
|             ++pos;
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     if (start != end)
 | |
|     {
 | |
|         emit(std::string_view(start, end));
 | |
|     }
 | |
| }
 | |
| 
 | |
| template<typename TChar, typename TTraits>
 | |
| std::vector<std::basic_string_view<TChar, TTraits>> splitImpl(std::basic_string_view<TChar, TTraits> stringView,
 | |
|                                                               std::basic_string_view<TChar, TTraits> separator,
 | |
|                                                               const SplitOptions& options)
 | |
| {
 | |
|     std::vector<std::basic_string_view<TChar, TTraits>> result;
 | |
|     std::size_t numEmitted = 0;
 | |
|     splitImpl(stringView, separator, options, std::back_inserter(result), numEmitted);
 | |
|     return result;
 | |
| }
 | |
| 
 | |
| 
 | |
| template<std::size_t count, typename TChar, typename TTraits>
 | |
| std::array<std::basic_string_view<TChar, TTraits>, count> splitFixedImpl(std::basic_string_view<TChar, TTraits> stringView,
 | |
|                                                                          std::basic_string_view<TChar, TTraits> separator,
 | |
|                                                                          SplitOptions options,
 | |
|                                                                          std::size_t* outNumResults)
 | |
| {
 | |
|     options.limitParts = count;
 | |
| 
 | |
|     std::array<std::basic_string_view<TChar, TTraits>, count> result;
 | |
|     std::size_t numEmitted = 0;
 | |
|     splitImpl(stringView, separator, options, result.begin(), numEmitted);
 | |
|     if (outNumResults != nullptr)
 | |
|     {
 | |
|         *outNumResults = numEmitted;
 | |
|     }
 | |
|     return result;
 | |
| }
 | |
| 
 | |
| template<typename TChar, typename TTraitsA, typename TTraitsB>
 | |
| bool equalsIgnoreCaseImpl(std::basic_string_view<TChar, TTraitsA> stringA, std::basic_string_view<TChar, TTraitsB> stringB) MIJIN_NOEXCEPT
 | |
| {
 | |
|     if (stringA.size() != stringB.size())
 | |
|     {
 | |
|         return false;
 | |
|     }
 | |
| 
 | |
|     for (const auto [charA, charB] : zip(stringA, stringB))
 | |
|     {
 | |
|         if (std::tolower(charA) != std::tolower(charB))
 | |
|         {
 | |
|             return false;
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     return true;
 | |
| }
 | |
| 
 | |
| template<typename TChar, typename TTraits>
 | |
| std::basic_string_view<TChar, TTraits> trimPrefixImpl(std::basic_string_view<TChar, TTraits> stringView,
 | |
|                                                       std::basic_string_view<TChar, TTraits> charsToTrim)
 | |
| {
 | |
|     stringView.remove_prefix(std::min(stringView.find_first_not_of(charsToTrim), stringView.size()));
 | |
|     return stringView;
 | |
| }
 | |
| 
 | |
| template<typename TChar, typename TTraits>
 | |
| std::basic_string_view<TChar, TTraits> trimSuffixImpl(std::basic_string_view<TChar, TTraits> stringView,
 | |
|                                                       std::basic_string_view<TChar, TTraits> charsToTrim)
 | |
| {
 | |
|     stringView.remove_suffix(stringView.size() - std::min(stringView.find_last_not_of(charsToTrim) + 1, stringView.size()));
 | |
|     return stringView;
 | |
| }
 | |
| 
 | |
| template<typename TChar, typename TTraits>
 | |
| std::basic_string_view<TChar, TTraits> trimImpl(std::basic_string_view<TChar, TTraits> stringView,
 | |
|                                                 std::basic_string_view<TChar, TTraits> charsToTrim)
 | |
| {
 | |
|     return trimPrefixImpl(trimSuffixImpl(stringView, charsToTrim), charsToTrim);
 | |
| }
 | |
| 
 | |
| template<typename TChar>
 | |
| static const std::array DEFAULT_TRIM_CHARS_DATA = {TChar(' '), TChar('\t'), TChar('\r'), TChar('\n')};
 | |
| 
 | |
| template<typename TChar>
 | |
| static const std::basic_string_view<TChar, std::char_traits<TChar>> DEFAULT_TRIM_CHARS
 | |
|     = {DEFAULT_TRIM_CHARS_DATA<TChar>.begin(), DEFAULT_TRIM_CHARS_DATA<TChar>.end()};
 | |
| }
 | |
| 
 | |
| template<typename TLeft, typename TRight>
 | |
| [[nodiscard]] auto split(TLeft&& stringView, TRight&& separator, const SplitOptions& options = {})
 | |
| {
 | |
|     return detail::splitImpl(std::basic_string_view(std::forward<TLeft>(stringView)),
 | |
|                              std::basic_string_view(std::forward<TRight>(separator)), options);
 | |
| }
 | |
| 
 | |
| template<std::size_t count, typename TLeft, typename TRight>
 | |
| [[nodiscard]] auto splitFixed(TLeft&& stringView, TRight&& separator, SplitOptions options = {}, std::size_t* outNumResults = nullptr)
 | |
| {
 | |
|     return detail::splitFixedImpl<count>(std::basic_string_view(std::forward<TLeft>(stringView)),
 | |
|                                          std::basic_string_view(std::forward<TRight>(separator)), options, outNumResults);
 | |
| }
 | |
| 
 | |
| template<typename TString, typename TChars>
 | |
| [[nodiscard]]
 | |
| auto trimPrefix(TString&& string, TChars&& chars)
 | |
| {
 | |
|     return detail::trimPrefixImpl(std::string_view(std::forward<TString>(string)), std::string_view(std::forward<TChars>(chars)));
 | |
| }
 | |
| 
 | |
| template<typename TString>
 | |
| [[nodiscard]]
 | |
| auto trimPrefix(TString&& string)
 | |
| {
 | |
|     return trimPrefix(string, detail::DEFAULT_TRIM_CHARS<char_type_t<TString>>);
 | |
| }
 | |
| 
 | |
| template<typename TString, typename TChars>
 | |
| [[nodiscard]]
 | |
| auto trimSuffix(TString&& string, TChars&& chars)
 | |
| {
 | |
|     return detail::trimSuffixImpl(std::string_view(std::forward<TString>(string)), std::string_view(std::forward<TChars>(chars)));
 | |
| }
 | |
| 
 | |
| template<typename TString>
 | |
| [[nodiscard]]
 | |
| auto trimSuffix(TString&& string)
 | |
| {
 | |
|     return trimSuffix(string, detail::DEFAULT_TRIM_CHARS<char_type_t<TString>>);
 | |
| }
 | |
| 
 | |
| template<typename TString, typename TChars>
 | |
| [[nodiscard]]
 | |
| auto trim(TString&& string, TChars&& chars)
 | |
| {
 | |
|     return detail::trimImpl(std::string_view(std::forward<TString>(string)), std::string_view(std::forward<TChars>(chars)));
 | |
| }
 | |
| 
 | |
| template<typename TString>
 | |
| [[nodiscard]]
 | |
| auto trim(TString&& string)
 | |
| {
 | |
|     return trim(string, detail::DEFAULT_TRIM_CHARS<char_type_t<TString>>);
 | |
| }
 | |
| 
 | |
| template<typename TLeft, typename TRight>
 | |
| [[nodiscard]] bool equalsIgnoreCase(TLeft&& left, TRight&& right) MIJIN_NOEXCEPT
 | |
| {
 | |
|     return detail::equalsIgnoreCaseImpl(std::string_view(left), std::string_view(right));
 | |
| }
 | |
| 
 | |
| template<typename TChar, typename TTraits, typename TAllocator>
 | |
| constexpr void makeLower(std::basic_string<TChar, TTraits, TAllocator>& string)
 | |
| {
 | |
|     std::transform(string.begin(), string.end(), string.begin(), [locale = std::locale()](TChar chr)
 | |
|     {
 | |
|         return std::tolower<TChar>(chr, locale);
 | |
|     });
 | |
| }
 | |
| 
 | |
| template<typename TChar, typename TTraits, typename TAllocator>
 | |
| constexpr void makeUpper(std::basic_string<TChar, TTraits, TAllocator>& string)
 | |
| {
 | |
|     std::transform(string.begin(), string.end(), string.begin(), [locale = std::locale()](TChar chr)
 | |
|     {
 | |
|         return std::toupper<TChar>(chr, locale);
 | |
|     });
 | |
| }
 | |
| 
 | |
| template<typename... TArgs>
 | |
| [[nodiscard]]
 | |
| constexpr auto toLower(TArgs&&... args)
 | |
| {
 | |
|     std::basic_string string(std::forward<TArgs>(args)...);
 | |
|     makeLower(string);
 | |
|     return string;
 | |
| }
 | |
| 
 | |
| template<typename... TArgs>
 | |
| [[nodiscard]]
 | |
| constexpr auto toUpper(TArgs&&... args)
 | |
| {
 | |
|     std::basic_string string(std::forward<TArgs>(args)...);
 | |
|     makeUpper(string);
 | |
|     return string;
 | |
| }
 | |
| 
 | |
| 
 | |
| template<typename TNumber>
 | |
| [[nodiscard]]
 | |
| constexpr bool toNumber(std::string_view stringView, TNumber& outNumber, int base = 10) MIJIN_NOEXCEPT
 | |
| {
 | |
|     const char* start = &*stringView.begin();
 | |
|     const char* end = start + stringView.size();
 | |
|     const std::from_chars_result res = std::from_chars(start, end, outNumber, base);
 | |
|     return res.ec == std::errc{} && res.ptr == end;
 | |
| }
 | |
| 
 | |
| template<typename TChar, typename TTraits, typename TNumber>
 | |
| [[nodiscard]]
 | |
| constexpr bool toNumber(std::basic_string_view<TChar, TTraits> stringView, TNumber& outNumber, int base = 10) MIJIN_NOEXCEPT requires (!std::is_same_v<TChar, char>)
 | |
| {
 | |
|     std::string asString;
 | |
|     asString.resize(stringView.size());
 | |
|     // should only contain number symbols, so just cast down to char
 | |
|     std::transform(stringView.begin(), stringView.end(), asString.begin(), [](TChar chr) { return static_cast<char>(chr); });
 | |
|     return toNumber(asString, outNumber, base);
 | |
| }
 | |
| 
 | |
| template<typename TChar>
 | |
| [[nodiscard]]
 | |
| constexpr bool isDecimalChar(TChar chr) noexcept
 | |
| {
 | |
|     return (chr >= TChar('0') && chr <= TChar('9'));
 | |
| }
 | |
| 
 | |
| template<typename TChar>
 | |
| [[nodiscard]]
 | |
| constexpr bool isHexadecimalChar(TChar chr) noexcept
 | |
| {
 | |
|     return isDecimalChar(chr)
 | |
|         || (chr >= TChar('A') && chr <= TChar('F'))
 | |
|         || (chr >= TChar('a') && chr <= TChar('f'));
 | |
| }
 | |
| 
 | |
| namespace pipe
 | |
| {
 | |
| struct Join
 | |
| {
 | |
|     const char* delimiter;
 | |
| 
 | |
|     explicit Join(const char* delimiter_) MIJIN_NOEXCEPT : delimiter(delimiter_) {}
 | |
| };
 | |
| 
 | |
| template<typename TIterable>
 | |
| auto operator|(TIterable&& iterable, const Join& joiner)
 | |
| {
 | |
|     return join(std::forward<TIterable>(iterable), joiner.delimiter);
 | |
| }
 | |
| }
 | |
| } // namespace mijin
 | |
| 
 | |
| #endif // !defined(MIJIN_UTIL_STRING_HPP_INCLUDED)
 |