Stroika/_string_8h_source.html

/*

 * Copyright(c) Sophist Solutions, Inc. 1990-2025.  All rights reserved

 */

#ifndef _Stroika_Foundation_Characters_String_h_

#define _Stroika_Foundation_Characters_String_h_ 1


#include "Stroika/Foundation/StroikaPreComp.h"


#include <compare>

#include <iosfwd>

#include <locale>

#include <string>

#include <string_view>


#include "Stroika/Foundation/Characters/Character.h"

#include "Stroika/Foundation/Characters/SDKString.h"

#include "Stroika/Foundation/Common/Compare.h"

#include "Stroika/Foundation/Common/StdCompat.h"

#include "Stroika/Foundation/Containers/Sequence.h"

#include "Stroika/Foundation/Containers/Set.h"

#include "Stroika/Foundation/Memory/SharedByValue.h"

#include "Stroika/Foundation/Memory/StackBuffer.h"

#include "Stroika/Foundation/Traversal/Iterable.h"


/**

 *  \file

 *

 *  \note Code-Status:  <a href="Code-Status.md#Beta">Beta</a>

 *

 * TODO:

 *

 *      @todo   Cleanup SubString (), and String::SubString_ use of SharedByValue<TRAITS>::ReadOnlyReference for

 *              performance. At some level - in String::SubString_ - we have a (hidden) sharedPtr and it would

 *              be safe and performant in that case to re-use that shared_ptr to make a new String envelope.

 *

 *              However, I'm not sure its safe in general to have SharedByValue<TRAITS>::ReadOnlyReference expose

 *              its shared_ptr, which appears needed to make this happen.

 *

 *              Not a biggie opportunity, so we can delay this -- LGP 2014-04-10

 *

 *      @todo   Add PadLeft/PadRight or FillLeft/FillRight() - not sure which name is better. But idea is to

 *              produce a string which is identical to the orig except that IF start len < n, then expand it with

 *              the given arg char repeated on the left or right.

 *

 *      @todo   RFind() API should be embellished to include startAt etc, like regular Find () - but not 100%

 *              sure - think through...

 *

 *      @todo   MAYBE also add ReplaceOne() function (we have ReplaceAll() now) ; see Replace() API in this function? - maybe overload?

 *

 *      @todo   Move DOCS in the top of this file down to the appropriate major classes - and then review the implementation and make sure

 *              it is all correct for each (especially SetStorage () stuff looks questionable)

 *

 */


// Forward declaration of the Containers::Set<T> class template.

// NOTE(review): "Stroika/Foundation/Containers/Set.h" is also #included above; presumably this forward

// declaration guards against include-order cycles - confirm it is still needed.

namespace Stroika::Foundation::Containers {

    template <typename T>

    class Set;

}


namespace Stroika::Foundation::Characters {


    /*

     *  \brief On Windows, affects the behavior of String::As<filesystem::path> ()

     *

     *  On Windows, it's helpful when mapping String to std::filesystem::path to map certain common name

     *  prefixes to things that will be found on Windows.

     *

     *  MSYS creates paths like /c/folder for c:/folder

     *  CYGWIN creates paths like /cygdrive/c/folder for c:/folder

     *

     *  Automatically map these (since Stroika v3.0d6) in As<filesystem::path> () (formerly ToPath).

     *

     *   \see https://www.msys2.org/docs/filesystem-paths/

     *        This API is for getting strings from the commandline, or user input, or configuration files etc, where Cygwin

     *        or MSYS style paths may be present. APIs that talk directly to the OS are more likely to directly produce

     *        filesystem::path than String. Anyhow - because of this, on Windows, it's probably more helpful than not to map

     *        the MSYS/cygdrive style prefixes to a path more likely to actually work right. --LGP 2024-03-06

     *

     *  \note The #ifndef guard lets this macro be predefined before this header is included, to override the

     *        default below (qStroika_Foundation_Common_Platform_Windows).

     *

     *  \note Preprocessor macros are not scoped by namespaces, so the enclosing namespace has no effect on this definition.

     */

#ifndef qStroika_Foundation_Characters_AsPathAutoMapMSYSAndCygwin

#define qStroika_Foundation_Characters_AsPathAutoMapMSYSAndCygwin qStroika_Foundation_Common_Platform_Windows

#endif


}


#if qStroika_Foundation_Characters_AsPathAutoMapMSYSAndCygwin

// Only compiled when the MSYS/Cygwin auto-mapping is enabled: forward declares std::filesystem::path

// (per the trailing comment below, for use in a template specialization).

// NOTE(review): adding declarations to namespace std is formally undefined behavior ([namespace.std]), and it

// only names the real class if the standard library declares path directly in std::filesystem (no intervening

// inline ABI namespace) - confirm this holds for every toolchain on which the macro is enabled.

namespace std::filesystem {

    class path; // forward declare for template specialization

}

#endif


namespace Stroika::Foundation::Characters {


    class RegularExpression;

    class RegularExpressionMatch;


    /**

     *  Flag principally for LimitLength, but used elsewhere as well (e.g. ToString ()).

     *

     *  Selects which part of a string to prefer keeping when the string must be shortened.

     *

     *  \note eDEFAULT is an alias for ePreferKeepLeft.

     *

     *  \note NOTE(review): the per-enumerator meanings noted below are inferred from the enumerator names - confirm

     *        against the LimitLength () documentation/implementation.

     */


    enum class StringShorteningPreference {

        // presumably: keep the leading (left) part of the string, dropping from the right

        ePreferKeepLeft,

        // presumably: keep the trailing (right) part of the string, dropping from the left

        ePreferKeepRight,

        // presumably: keep the middle of the string, dropping from both ends

        ePreferKeepMid,


        // Default preference: same value as ePreferKeepLeft

        eDEFAULT = ePreferKeepLeft,


        // Declares the enum's bounds: first enumerator is ePreferKeepLeft, last is ePreferKeepMid (macro defined elsewhere)

        Stroika_Define_Enum_Bounds (ePreferKeepLeft, ePreferKeepMid)

    };


    // Import the StringShorteningPreference enumerators into the Characters namespace, so they can be written

    // unqualified (e.g. ePreferKeepLeft instead of StringShorteningPreference::ePreferKeepLeft).

    using StringShorteningPreference::ePreferKeepLeft;

    using StringShorteningPreference::ePreferKeepMid;

    using StringShorteningPreference::ePreferKeepRight;


    /**

     *  \brief returns true iff T == u8string, u16string, u32string, or wstring - which std::string types can be unambiguously converted to UNICODE

     *

     *  \note The match is exact (same_as): cv-qualified or reference-qualified variants of these types do not satisfy the concept.

     *

     *  \note std::string (basic_string<char>) is not in the list, so it does not satisfy this concept.

     */

    template <typename T>

    concept IBasicUNICODEStdString = same_as<T, u8string> or same_as<T, u16string> or same_as<T, u32string> or same_as<T, wstring>;


    /**

     *  \brief anything with a 'special .STRINGTYPE conversion' method to UNICODE string, such as filesystem::path

     *

     *  Really, this is a thinly veiled attempt to avoid #include <filesystem> for modularity reasons.

     *

     *  Satisfied if AT LEAST ONE of the member functions wstring (), u8string (), u16string (), or u32string ()

     *  can be called on an object of type T and returns exactly the correspondingly named std string type

     *  (same_as - a merely convertible return type does not count).

     */

    template <typename T>


    concept IStdPathLike2UNICODEString = requires (T t) {

        { t.wstring () } -> same_as<wstring>;

    } or requires (T t) {

        { t.u8string () } -> same_as<u8string>;

    } or requires (T t) {

        { t.u16string () } -> same_as<u16string>;

    } or requires (T t) {

        { t.u32string () } -> same_as<u32string>;

    };


    class String;


    /**

     *  The concept IConvertibleToString is satisfied iff the argument type can be used to construct a (Stroika) String.

     *  Note subtly, const char* is treated (as of Stroika v3) as convertible to String, but the characters must be ASCII, or

     *  an exception will be generated in the constructor.

     *

     *  \note Defined as convertible_to<T, String>, so it requires an IMPLICIT conversion: a type that can only be

     *        used with an 'explicit' String constructor does not satisfy it.

     *

     *  \note NOTE(review): String is only forward declared at this point in the header, so this concept should only

     *        be evaluated after class String is complete - confirm no earlier use exists.

     */

    template <typename T>

    concept IConvertibleToString = convertible_to<T, String>;


    /**

     *  \brief String is like std::u32string, except it is much easier to use, often much more space efficient, and more easily interoperates with other string types

     *

     *  The Stroika String class is conceptually a sequence of (UNICODE) Characters, and so there is

     *  no obvious way to map the Stroika String to a std::string (in general). However, if you specify a codepage

     *  for conversion, or are converting to/from SDKString/SDKChar, or u8string, etc, there is builtin support for that.

     *

     *  EOS Handling:

     *      The Stroika String class supports having embedded NUL-characters. It also supports

     *      easy construction from NUL-terminated character strings.

     *

     *      Since Stroika v3, there is no longer c_str () support, since Stroika doesn't internally

     *      require NUL-terminated strings, and actively encourages different compact representations of

     *      strings (c_str() requires a choice of a particular encoding to make sense).

     *

     *      About spans, and the \0 NUL-termination - generally do NOT include

     *      the NUL-character in your span! Stroika strings will allow this, and treat

     *      it as just another character, but its probably not what you meant.

     *

     *  \note Narrow String handling

     *      Because the character set of strings of type 'char' is ambiguous, if you construct a String

     *      with char (char* etc) - it is somehow 'required' that the characters be ASCII. If using the FromConstantString () API

     *      , or operator""_k, it is checked with Require () - so assertion failure. If you construct

     *      with String::CTOR, it will generate a runtime exception (so more costly runtime checking).

     *

     *  \note Satisfies Concepts:

     *      o   static_assert (regular<String>);

     *

     *  \note   \em Thread-Safety   <a href="Thread-Safety.md#C++-Standard-Thread-Safety">C++-Standard-Thread-Safety</a>

     *

     *  \note   Design note - mutability vs. immutability

     *          http://stroika-bugs.sophists.com/browse/STK-968 (see about deleting deprecated APIs and remnants of mutability) and c_str()

     *

     *          String objects are IMMUTABLE (except for the OBVIOUS meaning case of operator= being allowed).

     *

     *          String reps are IMMUTABLE.

     *

     *          Use StringBuilder for a 'mutable' String (can be used mostly interchangeably with String).

     *

     *          Current Mutating methods (as of v3.0d1x)

     *          o   c_str ()  -- non-const                  deprecated in v3.0d13

     *          o   SetCharAt       - deprecated v3.0d12

     *          o   c_str()           (consider deprecating?)

     *          o   operator=       - deprecated v3.0d12

     *          o   clear()- deprecated v3.0d12

     *          o   Append           - deprecated v3.0d12

     *          o   operator+=       - deprecated v3.0d12

     *          o   erase()          - deprecated v3.0d12

     *

     *          SOMEWHAT ironically, the only of these methods hard to replace is the non-const c_str () - and maybe there

     *          not bad cuz I deprecated? COULD just deprecate ALL of these, and then the class is fully immutable. Probably

     *          easier to understand/reason about.

     *

     *  \note <a href="Design-Overview.md#Comparisons">Comparisons</a>:

     *      o   static_assert (totally_ordered<String>);

     *      o   String::EqualsComparer, String::ThreeWayComparer and String::LessComparer provided with construction parameters to allow case insensitive compares

     */


    class String : public Traversal::Iterable<Character> {

    private:

        using inherited = Iterable<Character>;


    protected:

        class _IRep;


    public:

        /**

         * All the constructors are obvious, except

         *      o   NUL-characters ARE allowed in strings, except for the case of single

         *          charX* argument constructors - which find the length based on

         *          the terminating NUL-character.

         *

         *      o   CTOR (PATHLIKE_TOSTRINGABLE&& s) - IStdPathLike2UNICODEString PATHLIKE_TOSTRINGABLE

         *          carefully excludes conflicting CTOR overloads, and purpose is to allow constructing a String

         *          from anything with a 'special conversion' method to UNICODE string, such as filesystem::path.

         *

         *  \note about lifetime of argument data (basic_string_view<CHAR_T> constructors)

         *        All data is copied out / saved by the end of the constructor for all constructors EXCEPT

         *        the basic_string_view<CHAR_T> constructors - where it is REQUIRED the data last 'forever'.

         *

         *  \pre for String (const basic_string_view<wchar_t>& str) - str[str.length()]=='\0';

         *       c-string nul-terminated (which happens automatically with L"xxx"sv)

         *

         *  \note 'char' (using ASCII = char) constructors:

         *        Because the character-set of strings of type 'char' is ambiguous, if you construct a String

         *        with char (char* etc) - it is runtime checked that the characters are ASCII (except for the basic_string_view

         *        constructors where we check but with assertions).

         *

         *        This mimics the behavior in Stroika v2.1 with String::FromASCII ()

         *

         *  \note the basic_string move Constructors MAY move or copy the underlying std string, but they still maintain

         *        the same requirements on their arguments as the copy basic_string constructors (eg. char must be ascii)

         *

         *  \see also - FromUTF8, FromSDKString, FromNarrowSDKString, FromStringConstant, FromLatin1, which are all like constructors

         *       but with special names to avoid confusion and make clear their arguments, and not participate in overloading. Note, chose

         *       this path instead of FLAG argument and explicit on CTOR, cuz more terse.

         */

        String ();

        explicit String (Character c);

        template <IUNICODECanUnambiguouslyConvertFrom CHAR_T>

        String (const CHAR_T* cString);

        template <Memory::ISpan SPAN_OF_CHAR_T>

        String (SPAN_OF_CHAR_T s)

            requires (IUNICODECanUnambiguouslyConvertFrom<typename SPAN_OF_CHAR_T::value_type>);

        template <IStdBasicStringCompatibleCharacter CHAR_T>

        String (const basic_string<CHAR_T>& s);

        template <IStdBasicStringCompatibleCharacter CHAR_T>

        String (const basic_string_view<CHAR_T>& s);

        template <IStdBasicStringCompatibleCharacter CHAR_T>

        explicit String (basic_string<CHAR_T>&& s);

        template <IUNICODECanUnambiguouslyConvertFrom CHAR_T>

        String (const Iterable<CHAR_T>& src)

            requires (not Memory::ISpan<CHAR_T>);

        template <IStdPathLike2UNICODEString PATHLIKE_TOSTRINGABLE>

        explicit String (PATHLIKE_TOSTRINGABLE&& s);

        String (String&& from) noexcept      = default;

        String (const String& from) noexcept = default;


    private:

        template <IStdPathLike2UNICODEString PATHLIKE_TOSTRINGABLE>

        static String mkSTR_ (PATHLIKE_TOSTRINGABLE&& s);


    private:

        static shared_ptr<_IRep> CTORFromBasicStringView_ (const basic_string_view<ASCII>& str);

        static shared_ptr<_IRep> CTORFromBasicStringView_ (const basic_string_view<char8_t>& str);

        static shared_ptr<_IRep> CTORFromBasicStringView_ (const basic_string_view<char16_t>& str);

        static shared_ptr<_IRep> CTORFromBasicStringView_ (const basic_string_view<char32_t>& str);

        static shared_ptr<_IRep> CTORFromBasicStringView_ (const basic_string_view<wchar_t>& str);


    public:

        ~String () = default;


    protected:

        /**

         *  Convenience alias for the inherited Iterable<Character>::_SafeReadRepAccessor template, instantiated with

         *  String's own _IRep type.

         */

        using _SafeReadRepAccessor = Iterable<Character>::_SafeReadRepAccessor<_IRep>;


    protected:

        /**

         * \pre rep MUST be not-null

         *  However, with move constructor, it maybe null on exit.

         */

        String (const shared_ptr<_IRep>& rep) noexcept;

        String (shared_ptr<_IRep>&& rep) noexcept;


    public:

        nonvirtual String& operator= (String&& rhs) noexcept      = default;

        nonvirtual String& operator= (const String& rhs) noexcept = default;


    public:

        /**

         *  Create a String object from a 'char-based' utf-8 encoded string.

         *

         *  \par Example Usage

         *      \code

         *          EXPECT_TRUE (string{u8"שלום"} == String::FromUTF8 (u8"שלום").AsUTF8 ());

         *      \endcode

         *

         *  \note   This is not generally needed, as you can just use the String::CTOR, but for cases like

         *          std::string-> String - where the conversion needs extra information (an assertion about character encoding of source characters).

         *

         *  \note   Reading improperly encoded text may result in a RuntimeException indicating improperly encoded characters.

         */

        template <typename CHAR_T>

        static String FromUTF8 (span<CHAR_T> from)

            requires (same_as<remove_cv_t<CHAR_T>, char8_t> or same_as<remove_cv_t<CHAR_T>, char>);

        template <typename CHAR_T>

        static String FromUTF8 (const basic_string<CHAR_T>& from)

            requires (same_as<remove_cv_t<CHAR_T>, char8_t> or same_as<remove_cv_t<CHAR_T>, char>);

        template <typename CHAR_T>

        static String FromUTF8 (const CHAR_T* from)

            requires (same_as<remove_cv_t<CHAR_T>, char8_t> or same_as<remove_cv_t<CHAR_T>, char>);


    public:

        /**

         *  Create a String object from a 'SDKChar' (os-setting - current code page) encoded string.

         *  See @SDKChar

         *  See @SDKString

         *

         *  \note   Reading improperly encoded text may result in a RuntimeException indicating improperly encoded characters.

         */

        static String FromSDKString (const SDKChar* from);

        static String FromSDKString (span<const SDKChar> s);

        static String FromSDKString (const SDKString& from);


    public:

        /**

         *  Create a String object from a 'char-based' (os-setting - current code page) encoded string.

         *

         *  \note   Reading improperly encoded text may result in a RuntimeException indicating improperly encoded characters.

         */

        static String FromNarrowSDKString (const char* from);

        static String FromNarrowSDKString (span<const char> s);

        static String FromNarrowSDKString (const string& from);


    public:

        /**

         *  Create a String object from a char based on the encoding from the argument locale.

         *  This throws an exception if there is an error performing the conversion.

         *

         *  \note   Reading improperly encoded text may result in a RuntimeException indicating improperly encoded characters.

         */

        static String FromNarrowString (const char* from, const locale& l);

        static String FromNarrowString (span<const char> s, const locale& l);

        static String FromNarrowString (const string& from, const locale& l);


    public:

        /**

         *   \brief Take the given argument data (constant span) - which must remain unchanged - constant - for the application lifetime - and treat it as a Stroika String object

         *

         *  This allows creation of String objects with fewer memory allocations and less copying, and more efficient storage, in most situations

         *

         *  The resulting String is a perfectly compliant Stroika String (somewhat akin to std::string_view vs std::string).

         *

         *  \par Example:

         *      \code

         *          String  tmp1    =   "FRED";

         *          String  tmp2    =   String{"FRED"};

         *          String  tmp3    =   String::FromStringConstant ("FRED");    // same as 2 above, but faster

         *          String  tmp4    =   "FRED"sv;                               // equivalent to FromStringConstant

         *          String  tmp5    =   "FRED"_k;                               // equivalent to FromStringConstant

         *      \endcode

         *

         *  \em WARNING - BE VERY CAREFUL - be sure arguments have application lifetime (intended use case is C string literals).

         *

         *  \pre argument string MAY contain embedded nul characters (but for char* overloads wrong size inferred).

         *

         *  \note In Stroika v2.1 this was called class String_ExternalMemoryOwnership_ApplicationLifetime.

         *  \note In Stroika v2.1 this was called class String_Constant.

         *  \note In Stroika v2.1 this required NUL-char termination, but no longer

         *

         *  \note FromStringConstant with 'char' - REQUIRES that the char elements are ASCII (someday this may be lifted, and the characters interpreted as Latin1)

         *        For the case of char, we also do not check/require the nul-termination bit.

         */

        template <size_t SIZE, IUNICODECanUnambiguouslyConvertFrom CHAR_T>

        static String FromStringConstant (const CHAR_T (&cString)[SIZE]);

        template <IUNICODECanUnambiguouslyConvertFrom CHAR_T>

        static String FromStringConstant (const basic_string_view<CHAR_T>& str);

        template <IUNICODECanUnambiguouslyConvertFrom CHAR_T>

        static String FromStringConstant (span<const CHAR_T> str);

        static String FromStringConstant (span<const ASCII> s);    // better impl in CPP file

        static String FromStringConstant (span<const char16_t> s); // ""

        static String FromStringConstant (span<const wchar_t> s);  // "" (inl file)

        static String FromStringConstant (span<const char32_t> s); // ""


    public:

        /**

         *  Create a String object from UNICODE Latin-1 Supplement (https://en.wikipedia.org/wiki/Latin-1_Supplement)

         *

         *  This is roughly, but not exactly, the same as the ISO-Latin-1 single-byte character set (https://en.wikipedia.org/wiki/ISO/IEC_8859-1)

         *

         *  \note if character code point >= 256, this will throw an exception - not defined for that range (only checked if sizeof (CHAR_T) > 1)

         *

         *  @aliases From8bitASCII () or FromExtendedASCII ()

         */

        template <IUNICODECanUnambiguouslyConvertFrom CHAR_T>

        static String FromLatin1 (const CHAR_T* cString);

        template <IUNICODECanUnambiguouslyConvertFrom CHAR_T>

        static String FromLatin1 (span<const CHAR_T> s);

        template <IStdBasicStringCompatibleCharacter CHAR_T>

        static String FromLatin1 (const basic_string<CHAR_T>& s);


    public:

        /**

         *  \brief appends 'rhs' string to this string (without modifying this string) and returns the combined string

         *

         *  @see    Append() for a similar function that modifies 'this'

         */

        template <typename T>

        nonvirtual String Concatenate (T&& rhs) const

            requires (is_convertible_v<T, String>);


    private:

        nonvirtual String Concatenate_ (const String& rhs) const;


    public:

        /**

         *  Returns the number of characters in the String. Note that this may not be the same as bytes,

         *  does not include NUL termination, and doesn't in any way respect NUL termination (meaning

         *  a nul-character is allowed in a Stroika string).

         *

         * @aliases GetLength ()

         */

        nonvirtual size_t size () const noexcept;


    public:

        /**

         *  \brief STL-style test for whether this String has no characters.

         *

         *  \note NOTE(review): presumably equivalent to (size () == 0) - confirm against the implementation

         *        (not visible in this part of the header).

         */

        nonvirtual bool empty () const noexcept;


    public:

        /**

         *  \brief return (read-only) Character at index 'i'

         *

         *  @aliases operator[] (size_t i) const     (which documents itself as an alias of GetCharAt)

         *

         *  \note Declared noexcept, so a bad index cannot be reported by throwing.

         *        NOTE(review): presumably \pre (i < size ()) - confirm against the implementation.

         */

        nonvirtual const Character GetCharAt (size_t i) const noexcept;


    public:

        /**

         *  \brief return (read-only) Character object

         *

         *  @aliases GetCharAt (size_t i) const;

         *

         *  \note returns const due to https://stroika.atlassian.net/browse/STK-376 - so cannot accidentally have illusion of assignment being legal

         */

        nonvirtual const Character operator[] (size_t i) const noexcept;


    public:

        /**

         *  InsertAt() constructs a new string by taking this string, and inserting the argument

         *  characters.

         *

         *  \em Note that for repeated insertions, this is much less efficient than just

         *      using StringBuilder.

         *

         *  \note that if at == this->size (), you are appending.

         */

        nonvirtual String InsertAt (Character c, size_t at) const;

        nonvirtual String InsertAt (const String& s, size_t at) const;

        nonvirtual String InsertAt (span<const Character> s, size_t at) const;

        nonvirtual String InsertAt (span<Character> s, size_t at) const;


    public:

        /**

         * Remove the characters at 'charAt' (RemoveAt/1) or between 'from' and 'to' (const method - doesn't modify this)

         *

         * It is an error if this implies removing characters off the end of the string.

         *

         *  \par Example Usage

         *      \code

         *          String mungedData = "04 July 2014";

         *          if (optional<pair<size_t, size_t>> i = mungedData.Find (RegularExpression{"0[^\b]"})) {

         *              mungedData = mungedData.RemoveAt (*i);

         *          }

         *      \endcode

         *

         *  \pre (charAt < size ())

         *  \pre (from <= to)

         *  \pre (to <= size ())

         *

         *  \em Note that this is quite inefficient: consider using StringBuilder

         */

        nonvirtual String RemoveAt (size_t charAt) const;

        nonvirtual String RemoveAt (size_t from, size_t to) const;

        nonvirtual String RemoveAt (pair<size_t, size_t> fromTo) const;


    public:

        /**

         *  Remove the first occurrence of Character 'c' (or of 'subString') from the string. Not an error if none

         *  found. Doesn't modify this (const method) - returns resulting string.

         *

         *  \em Note that this is quite inefficient: consider using StringBuilder

         */

        nonvirtual String RemoveFirstIf (Character c) const;

        nonvirtual String RemoveFirstIf (const String& subString) const;


    public:

        /**

         *  Remove all occurrences of Character 'c' (or of 'subString') from this string

         *  (walking front to back - if removal creates one, it too is removed).

         *  Not an error if none found. Doesn't modify this (const method) - returns resulting string.

         */

        nonvirtual String RemoveAll (Character c) const;

        nonvirtual String RemoveAll (const String& subString) const;


    public:

        /**

         *  OVERLOADS WITH size_t:

         *

         *  Produce a substring of this string, starting at 'from', and up to 'to' (or end of string

         *  for one-arg overload).

         *

         *  *NB* This function treats the second argument differently than String::substr () -

         *  which respects the STL basic_string API. This function treats the second argument

         *  as a 'to', STL substr() treats it as a count. This amounts to the same thing for the

         *  very common cases of substr(N) - because second argument is defaulted, and,

         *  substr (0, N) - because then the count and end are the same.

         *

         *  \pre  (from <= to);

         *  \pre  (to <= size ());     // for 2-arg variant

         *

         *  \par Example Usage

         *      \code

         *          String tmp { "This is good" };

         *          Assert (tmp.SubString (5) == "is good");

         *      \endcode

         *

         *  \par Example Usage

         *      \code

         *          const String kTest_ { "a=b"sv };

         *          const String kLbl2LookFor_ { "a="_k };

         *          if (resultLine.Find (kLbl2LookFor_)) {

         *              String  tmp { resultLine.SubString (kLbl2LookFor_.length ()) };

         *          }

         *          Assert (tmp == "b");

         *      \endcode

         *

         *  OVERLOADS WITH ptrdiff_t:

         *

         *  This is like SubString() except that if from/to are negative, they are treated as relative to the end

         *  of the String.

         *

         *  So for example, SubString (0, -1) is equivalent to SubString (0, size () - 1) - and so is an

         *  error if the string is empty.

         *

         *  Similarly, SubString (-5) is equivalent to SubString (size ()-5, size ()) - so can be used

         *  to grab the end of a string.

         *

         *  \pre  (adjustedFrom <= adjustedTo);

         *  \pre  (adjustedTo <= size ());     // for 2-arg variant

         *

         *  \note \em Design Note

         *      We chose not to overload SubString() with this functionality because it would have been too easy

         *      to mask bugs.

         *

         *  \note \em Design Note

         *      This was originally inspired by Python arrays. From https://docs.python.org/2/tutorial/introduction.html:

         *          Indices may also be negative numbers, to start counting from the right

         *

         *  @aliases

         *      This API is identical to the javascript String.slice () method/behavior

         *      @see http://www.ecma-international.org/publications/files/ECMA-ST/Ecma-262.pdf

         *           15.5.4.13 String.prototype.slice (start, end)

         *

         *  @aliases

         *      This API - when called with negative indexes - used to be called CircularSubString ().

         *

         *  @see substr

         *  @see SafeSubString

         */

        template <typename SZ>

        nonvirtual String SubString (SZ from) const;

        template <typename SZ1, typename SZ2>

        nonvirtual String SubString (SZ1 from, SZ2 to) const;


    public:

        /**

         *  Like SubString(), but no requirements on from/to. These are just adjusted to the edge of the string

         *  if they exceed those endpoints. And if arguments are <0, they are interpreted as end-relative.

         *

         *  @aliases

         *      This API - when called with negative indexes - used to be called SafeCircularSubString ().

         *

         *  @see substr

         *  @see SubString

         */

        template <typename SZ>

        nonvirtual String SafeSubString (SZ from) const;

        template <typename SZ1, typename SZ2>

        nonvirtual String SafeSubString (SZ1 from, SZ2 to) const;


    public:

        /**

         * \brief Return a substring of this string, starting at 'argument' n. If n > size(), return empty string.

         *

         *  \note   This hides inherited Skip, and returns a subtype of what it returns, and is just slightly more

         *          efficient, but otherwise completely compatible behavior.

         */

        nonvirtual String Skip (size_t n) const;


    public:

        /**

         *  Return 'count' copies of this String (concatenated after one another).

         */

        nonvirtual String Repeat (unsigned int count) const;


    public:

        /**

         *  Returns true if the argument character or string is found anywhere inside this string.

         *  This is equivalent to

         *      return Matches (".*" + X + ".*");    // If X had no characters which look like they are part of

         *                                            // a regular expression

         *

         *  @see Match

         */

        nonvirtual bool Contains (Character c, CompareOptions co = eWithCase) const;

        nonvirtual bool Contains (const String& subString, CompareOptions co = eWithCase) const;


    public:

        /**

         *  NOTE(review): presumably returns true iff at least one of the Characters in 'cs' is found anywhere in this

         *  string, compared according to 'co' - confirm against the implementation (not visible in this part of the header).

         *

         *  @see Contains

         */

        nonvirtual bool ContainsAny (Iterable<Character> cs, CompareOptions co = eWithCase) const;


    public:

        /**

         *  Returns true iff this string starts with the given character or substring.

         *

         *  Similar to:

         *      return Matches (X + ".*");

         *  except for the fact that StartsWith () doesn't interpret 'X' as a regular expression

         *

         *  \pre not subString.empty () -- for the subString overload (because otherwise "".StartsWith("") would be ill-defined)

         *

         *  @see Match

         *  @see EndsWith

         */

        nonvirtual bool StartsWith (const Character& c, CompareOptions co = eWithCase) const;

        nonvirtual bool StartsWith (const String& subString, CompareOptions co = eWithCase) const;


    public:

        /**

         *  Returns true iff this string ends with the given character or substring.

         *

         *  Similar to:

         *      return Matches (".*" + X);

         *  except for the fact that EndsWith () doesn't interpret 'X' as a regular expression

         *

         *  \pre not subString.empty () -- for the subString overload (because otherwise "".EndsWith("") would be ill-defined)

         *

         *  @see Match

         *  @see StartsWith

         */

        nonvirtual bool EndsWith (const Character& c, CompareOptions co = eWithCase) const;

        nonvirtual bool EndsWith (const String& subString, CompareOptions co = eWithCase) const;


    public:

        /**

         *  \brief Return *this if it ends with argument character, or append 'c' so that it ends with a 'c'.

         *

         *  \note this is too special-purpose to be a very sensible API, but I find it useful pretty often. So what-the-heck.

         */

        nonvirtual String AssureEndsWith (const Character& c, CompareOptions co = eWithCase) const;


    public:

        /**

         *  Apply the given regular expression, and return true if it matches this string. This only

         *  returns true if the expression matches the ENTIRE string - all the way to the end.

         *  @see FindEach() or @see Find - to find a set of things which match.

         *

         *  \par Example Usage

         *      \code

         *          Assert (String{"abc"}.Matches ("abc"));

         *          Assert (not (String{"abc"}.Matches ("bc")));

         *          Assert (String{"abc"}.Matches (".*bc"));

         *          Assert (not String{"abc"}.Matches ("b.*c"));

         *      \endcode

         *

         *  \par Example Usage

         *      \code

         *          static const RegularExpression kSonosRE_{"([0-9.:]*)( - .*)"_RegEx};

         *          static const String            kTestStr_{"192.168.244.104 - Sonos Play:5"};

         *          optional<String> match1;

         *          optional<String> match2;

         *          EXPECT_TRUE (kTestStr_.Matches (kSonosRE_, &match1, &match2) and match1 == "192.168.244.104" and match2 == " - Sonos Play:5");

         *          EXPECT_EQ (kTestStr_.Matches<1> (kSonosRE_), make_tuple ("192.168.244.104"_k));

         *          EXPECT_EQ (kTestStr_.Matches<2> (kSonosRE_), make_tuple ("192.168.244.104"_k, " - Sonos Play:5"_k));

         *      \endcode

         *

         *  \par Example Usage

         *      \code

         *          // https://tools.ietf.org/html/rfc3986#appendix-B

         *          static const RegularExpression kParseURLRegExp_{"^(([^:/?#]+):)?(//([^/?#]*))?([^?#]*)(\\?([^#]*))?(#(.*))?"_RegEx};

         *          optional<String>               scheme;

         *          optional<String>               authority;

         *          optional<String>               path;

         *          optional<String>               query;

         *          optional<String>               fragment;

         *          if (rawURL.Matches (kParseURLRegExp_, nullptr, &scheme, nullptr, &authority, &path, nullptr, &query, nullptr, &fragment)) {

         *              DbgTrace ("***good - scheme={}"_f, scheme);

         *              DbgTrace ("***good - authority={}"_f, authority);

         *              DbgTrace ("***good - path={}"_f, path);

         *              DbgTrace ("***good - query={}"_f, query);

         *              DbgTrace ("***good - fragment={}"_f, fragment);

         *          }

         *      \endcode

         *

         *  \par Example Usage

         *      \code

         *          // Praat 6.4.23 (October 27 2024)

         *          String processRunnerOutput = "Praat 6.4.23 (October 27 2024)";

         *          String version;

         *          return processRunnerOutput.Matches ("(\\w+)\\s([\\w\\.]+).*"_RegEx, nullptr, &version)? version: "???"sv;

         *          return get<0> (processRunnerOutput.Matches<1> ("\\w+\\s([\\w\\.]+).*"_RegEx).value_or(make_tuple("???"_k)));       // Or better

         *      \endcode

         *

         *  Details on the regular expression language/format can be found at:

         *      http://en.wikipedia.org/wiki/C%2B%2B11#Regular_expressions

         *

         *  \note If any 'sub-match' arguments are passed to Matches, they MUST be of type optional<String>*, String*, or nullptr.

         *        Passing nullptr allows matched parameters to not be returned, but still identified positionally (by index).

         *

         *  @see Contains

         *  @see StartsWith

         *  @see EndsWith

         *  @see Find

         *  @see FindEach

         */

        nonvirtual bool Matches (const RegularExpression& regEx) const;

        nonvirtual bool Matches (const RegularExpression& regEx, Containers::Sequence<String>* matches) const;

        template <Common::IAnyOf<optional<String>*, String*, nullptr_t>... OPTIONAL_STRINGS>

        nonvirtual bool Matches (const RegularExpression& regEx, OPTIONAL_STRINGS&&... subMatches) const;

        template <size_t I>

        nonvirtual optional<Common::RepeatedTuple_t<I, String>> Matches (const RegularExpression& regEx) const;


    public:

        /**

         *  Find returns the index of the first occurrence of the given Character/substring argument in

         *  this string. Find () always returns a valid string index, which is followed by the

         *  given substring, or nullopt otherwise.

         *

         *  Find () can optionally be provided a 'startAt' offset to begin the search at.

         *

         *  And the overload taking a RegularExpression - returns BOTH the location where the match

         *  is found, as well as the end of the match.

         *

         *  Note - for the special case of Find(empty-string) - the return value is 0 if this string

         *  is non-empty, and nullopt if this string was empty.

         *

         *  @aliases - could have been called IndexOf ()

         *

         *  \pre (startAt <= size ());

         *

         *  \par Example Usage

         *      \code

         *          const String kTest_{ "a=b" };

         *          const String kLbl2LookFor_ { "a=" };

         *          if (kTest_.Find (kLbl2LookFor_)) {

         *              String  tmp { kTest_.SubString (kLbl2LookFor_.length ()) };

         *              Assert (tmp == "b");

         *          }

         *      \endcode

         *

         *  @see FindEach ()

         *  @see FindEachString ()

         *  @see Tokenize

         */

        nonvirtual optional<size_t> Find (Character c, CompareOptions co = eWithCase) const;

        nonvirtual optional<size_t> Find (Character c, size_t startAt, CompareOptions co = eWithCase) const;

        nonvirtual optional<size_t> Find (const String& subString, CompareOptions co = eWithCase) const;

        nonvirtual optional<size_t> Find (const String& subString, size_t startAt, CompareOptions co = eWithCase) const;

        nonvirtual optional<pair<size_t, size_t>> Find (const RegularExpression& regEx, size_t startAt = 0) const;

        nonvirtual Traversal::Iterator<Character> Find (const function<bool (Character item)>& that) const;


    public:

        /**

         *  This is just like Find, but captures all the matching results in an iterable result.

         *  The reason the overload for RegularExpression's returns a list of pair<size_t,size_t> is because

         *  the endpoint of the match is ambiguous. For fixed string Find, the end of match is computable

         *  from the arguments.

         *

         *  FindEach () can be more handy to use than directly using Find () in scenarios where you want

         *  to iterate over each match:

         *      e.g.:

         *          for (auto i : s.FindEach ("xxx")) {....}

         *

         *  Also, to count matches, you can use:

         *      size_t nMatches = FindEach (matchexp).size ();

         *

         *  Note: FindEach handles the special case of an empty match as ignored, so FindEach(empty-str-or-regexp)

         *  always returns an empty list. Also - for the String case, it returns distinct matches, so if you

         *  search String{"AAAA"}.FindEach ("AA"), you will get 2 answers ({0, 2}).

         *

         *  @see Find ()

         *  @see FindEachString ()

         *  @see Matches ()

         */

        nonvirtual Containers::Sequence<pair<size_t, size_t>> FindEach (const RegularExpression& regEx) const;

        nonvirtual Containers::Sequence<size_t> FindEach (const String& string2SearchFor, CompareOptions co = eWithCase) const;


    public:

        /**

         *  \par Example Usage

         *      \code

         *          const String                        kTest_{ "a=b,"sv };

         *          const RegularExpression             kRE_{ "a=(.*)[, ]" };

         *          Sequence<String>                    tmp1{ kTest_.FindEachString (kRE_) };

         *          Assert (tmp1.size () == 1 and tmp1[0] == "a=b,");

         *          Sequence<RegularExpressionMatch>    tmp2 { kTest_.FindEachMatch (kRE_) };

         *          Assert (tmp2.size () == 1 and tmp2[0].GetFullMatch () == "a=b," and tmp2[0].GetSubMatches () == Sequence<String>{"b"});

         *      \endcode

         *

         *  @see Find ()

         *  @see FindEachString ()

         *  @see Matches ()

         */

        nonvirtual Containers::Sequence<RegularExpressionMatch> FindEachMatch (const RegularExpression& regEx) const;


    public:

        /**

         *  \par Example Usage

         *      \code

         *          const String            kTest_ { "a=b, c=d"_k };

         *          const RegularExpression kRE_ { "(.)=(.)" };

         *          Assert ((kTest_.FindEachString (kRE_) ==  vector<String>{"a=b", "c=d"}));

         *      \endcode

         *

         *  @see Find ()

         *  @see FindEachMatch ()

         *  @see Matches ()

         */

        nonvirtual Containers::Sequence<String> FindEachString (const RegularExpression& regEx) const;


    public:

        /**

         * RFind (substring) returns the index of the last occurrence of the given substring in

         * this string. This function always returns a valid string index, which is followed by the

         * given substring, or optional<size_t> {} otherwise.

         *

         *  @aliases RIndexOf ()

         */

        nonvirtual optional<size_t> RFind (Character c) const noexcept;

        nonvirtual optional<size_t> RFind (const String& subString) const;


    public:

        /**

         *  Replace the range of this string with the given replacement. Const method: just creates new string as described.

         */

        nonvirtual String Replace (size_t from, size_t to, const String& replacement) const;

        nonvirtual String Replace (pair<size_t, size_t> fromTo, const String& replacement) const;


    public:

        /**

         * Apply the given regular expression, with 'with' and replace each match. This doesn't

         * modify this string, but returns the replacement string.

         *

         * CHECK - BUT I THINK WE DEFINE THIS TO REPLACE ALL? OR MAKE PARAM?

         * See regex_replace () for definition of the regEx language

         *

         *   Require (not string2SearchFor.empty ());

         *

         *  \par Example Usage

         *      \code

         *          mungedData = mungedData.ReplaceAll (RegularExpression{ "\\b0+" }, "");    // strip all leading zeros

         *      \endcode

         *

         *  \par Example Usage

         *      \code

         *          String a = "a b   \n\t c";

         *          EXPECT_EQ (a.ReplaceAll (RegularExpression{"\\s+"sv}, " "sv), "a b c");

         *          EXPECT_EQ (a.ReplaceAll ("\\s+"_RegEx, " "sv), "a b c");

         *      \endcode

         *

         *  Note - it IS legal to have with contain the original search for string, or even

         *  to have it 'created' as part of where it gets

         *  inserted. The implementation will only replace those that pre-existed.

         *

         *  \note To perform a regular expression replace-all, which is case insensitive, create the regular expression with CompareOptions::eCaseInsensitive

         *

         *  \note ReplaceAll could have been called 'SafeString' or 'FilteredString' (was at one point - replaces that functionality)

         */

        nonvirtual String ReplaceAll (const RegularExpression& regEx, const String& with) const;

        nonvirtual String ReplaceAll (const String& string2SearchFor, const String& with, CompareOptions co = eWithCase) const;

        nonvirtual String ReplaceAll (const function<bool (Character)>& replaceCharP, const String& with) const;

        nonvirtual String ReplaceAll (const Containers::Set<Character>& charSet, const String& with) const;


    public:

        /**

         *  Replace any CR or LF or CRLF sequences with plain NL-terminated text.

         */

        nonvirtual String NormalizeTextToNL () const;


    public:

        /**

         *  \brief Replace sequences of whitespace characters (space, tab, newline etc) with a single space (or argument space character).

         *

         *  \note  see Qt 'QString::simplified ()'. Idea is Trim () (right and left) - plus replace contiguous substrings of Character::IsSpace () characters with a

         *         single (given) space character.

         */

        nonvirtual String NormalizeSpace (Character useSpaceCharacter = ' ') const;


    public:

        /**

         *  Break this String into constituent parts. This is a simplistic API but at least handy as is.

         *

         *  The caller can specify the token separators by set, by lambda. This defaults to the lambda "isWhitespace".

         *

         *  This is often called 'Split' in other APIs. This is NOT (as is now) a replacement for flex, but just for

         *  simple, but common string splitting needs (though if I had a regexp param, it may approach the power of flex).

         *

         *  \note If this->length () == 0, this method returns a list of length 0;

         *  \note Its fine for the split character/characters to be missing, in which case this

         *        returns a list of length 1

         *

         *  \par Example Usage

         *      \code

         *          String  t { "ABC DEF G" };

         *          Assert (t.Tokenize ().length () == 3);

         *          Assert (t.Tokenize ()[1] == "DEF");

         *      \endcode

         *

         *  \par Example Usage

         *      \code

         *          String  t { "foo=   7" };

         *          auto    tt = t.Tokenize ({ '=' });

         *          Assert (tt.length () == 2);

         *          Assert (tt[1] == "   7");

         *          Assert (tt[1].Trim () == "7");

         *      \endcode

         *

         *  \par Example Usage

         *      \code

         *          String  t { "foo=   7" };

         *          auto    tt = t.Tokenize ({ '=', ' ' });

         *          Assert (tt.length () == 2);

         *          Assert (tt[1] == "7");

         *      \endcode

         *

         *  @see Find

         *

         *  TODO:

         *      @todo   Review:

         *                  http://qt-project.org/doc/qt-5.0/qtcore/qstring.html#split

         *              especially:

         *                  QString line = "forename\tmiddlename  surname \t \t phone";

         *                  QRegularExpression sep("\\s+");

         *                  str = line.section(sep, 2, 2); // str == "surname"

         *                  str = line.section(sep, -3, -2); // str == "middlename  surname"

         *              Make sure our Find/Tokenize is at least this simple, and maybe diff between find and split

         *              is FIND the regular expression names the things looked for and SPLIT() uses regexp to name the separators?

         *              Add something like the above to the String demo app (when it exists)

         */

        nonvirtual Containers::Sequence<String> Tokenize () const;

        nonvirtual Containers::Sequence<String> Tokenize (const function<bool (Character)>& isTokenSeperator) const;

        nonvirtual Containers::Sequence<String> Tokenize (const RegularExpression& isSeparator) const;

        nonvirtual Containers::Sequence<String> Tokenize (const Containers::Set<Character>& delimiters) const;


    public:

        /**

         *  \brief break the String into a series of lines;

         *

         *  \note could almost be done with Tokenize(), except for the one-sided nl-specific trimming.

         *

         *  \note removes line-endings (\r\n, or \n, or \r).

         */

        nonvirtual Containers::Sequence<String> AsLines () const;


    public:

        /**

         *  \brief Breaks this string into Lines, with AsLines (), and applies the argument filter (as if with .Map<>) producing a subset of the lines which match

         *

         *  note this is useful to replace 'shell script' logic where you might run some command and grep through its output for all

         *  matching lines.

         *

         *  \par Example Usage

         *      \code

         *          String firstALineOrEmpty = String{"...e.g. from output of ProcessRunner..."}.Grep ("a:").NthValue (0);

         *      \endcode

         */

        nonvirtual Containers::Sequence<String> Grep (const String& fgrepArg) const;

        nonvirtual Containers::Sequence<String> Grep (const RegularExpression& egrepArg) const;


    public:

        /**

         *  \brief Useful to replace 'awk print $3' - replace with Col(2) - zero based

         *

         *  default separator = "\\s+"_RegEx;

         *

         *  \par Example Usage

         *      \code

         *          Assert (String{"ffmpeg version 7.1"}.Col (2) == "7.1");

         *      \endcode

         *

         */

        nonvirtual optional<String> Col (size_t i) const;

        nonvirtual optional<String> Col (size_t i, const RegularExpression& separator) const;


    public:

        /**

         *  \brief see Col(i) - but with default value of empty string

         */

        nonvirtual String ColValue (size_t i, const String& valueIfMissing = {}) const;


    public:

        /**

         * String LTrim () scans the characters from left to right, and applies the given

         * 'shouldBeTrimmed' function (defaults to IsWhitespace). All such characters are removed,

         * and the resulting string is returned. This does not modify the current string it is

         * applied to - just returns the trimmed string.

         */

        nonvirtual String LTrim (bool (*shouldBeTrimmed) (Character) = Character::IsWhitespace) const;


    public:

        /**

         * String RTrim () scans the characters from right to left, and applies the given

         * 'shouldBeTrimmed' function (defaults to IsWhitespace). All such characters are removed,

         * and the resulting string is returned. This does not modify the current string it is

         * applied to - just returns the trimmed string.

         *

         *  \par Example Usage

         *      \code

         *          String name = origName.RTrim ([] (Character c) { return c == '\\';});        // Trim a trailing backslash(s), if present

         *      \endcode

         */

        nonvirtual String RTrim (bool (*shouldBeTrimmed) (Character) = Character::IsWhitespace) const;


    public:

        /**

         * String Trim () is logically equivalent to RTrim (shouldBeTrimmed).LTrim (shouldBeTrimmed).

         */

        nonvirtual String Trim (bool (*shouldBeTrimmed) (Character) = Character::IsWhitespace) const;


    public:

        /**

         * Walk the entire string, and produce a new string consisting of all characters for which

         * the predicate 'removeCharIf' returned false.

         */

        nonvirtual String StripAll (bool (*removeCharIf) (Character)) const;


    public:

        /**

         *  Combine the given array into a single string (typically comma space) separated.

         *  If given a list of length n, this adds n-1 separators.

         *

         *  \note .Net version - https://docs.microsoft.com/en-us/dotnet/api/system.string.join?redirectedfrom=MSDN&view=net-6.0#System_String_Join_System_String_System_String___

         *  \note Java version - https://docs.oracle.com/javase/8/docs/api/java/lang/String.html#join-java.lang.CharSequence-java.lang.CharSequence...-

         *  \note Javascript   - https://developer.mozilla.org/en-US/docs/Web/JavaScript/Reference/Global_Objects/Array/join

         *

         *  \note - CONSIDER LOSING this as 'Iterable<>::Join' just appears to work better -- LGP 2025-01-21

         */

        static String Join (const Iterable<String>& list, const String& separator = ", "sv);


    public:

        /**

         * Return a new string based on this string where each upper case character is replaced by its

         * lower case equivalent. Note that non-upper-case characters (such as punctuation) are unchanged.

         */

        nonvirtual String ToLowerCase () const;


    public:

        /**

         * Return a new string based on this string where each lower case character is replaced by its

         * upper case equivalent. Note that non-lower-case characters (such as punctuation) are unchanged.

         */

        nonvirtual String ToUpperCase () const;


    public:

        /**

         * Return true if the string contains zero non-whitespace characters.

         */

        nonvirtual bool IsWhitespace () const;


    public:

        /**

         *  \brief return the first maxLen (or fewer if string shorter) characters of this string (adding ellipsis if truncated)

         *

         *  This function is for GUI/display purposes. It returns the given string, trimmed down

         *  to at most maxLen characters, and removes whitespace (on 'to trim' side - given by keepLeft flag -

         *  if needed to get under maxLen).

         *

         *  Note in the 3-arg overload, the ellipsis string MAY be the empty string.

         */

        nonvirtual String LimitLength (size_t maxLen, StringShorteningPreference keepPref = StringShorteningPreference::ePreferKeepLeft) const;

        nonvirtual String LimitLength (size_t maxLen, StringShorteningPreference keepLeft, const String& ellipsis) const;


    public:

        /**

         *  CopyTo () copies the contents of this string to the target buffer.

         *  CopyTo () does NOT nul-terminate the target buffer

         *

         *  Returns span of CHAR_T objects written - a subspan of the argument span

         *

         *  \pre s.size () >= UTFConvert::ComputeTargetBufferSize<CHAR_T> (...this-string-data...);

         *

         *  \see See also GetData<CHAR_T> (buf) - similar functionality - except caller doesn't need to know size of buffer to allocate

         */

        template <IUNICODECanAlwaysConvertTo CHAR_T>

        nonvirtual span<CHAR_T> CopyTo (span<CHAR_T> s) const

            requires (not is_const_v<CHAR_T>);


    public:

        /**

         * Convert String losslessly into a standard C++ type.

         *

         *  Only specifically specialized variants supported: IBasicUNICODEStdString<T> or same_as<T,String>

         *      o   wstring

         *      o   u8string

         *      o   u16string

         *      o   u32string

         *      o   String    (return *this; handy sometimes in templated usage; harmless)

         *    as well as:

         *      o   filesystem::path (or anything with .wstring() -> wstring method) - note see qStroika_Foundation_Characters_AsPathAutoMapMSYSAndCygwin

         *

         *  DEPRECATED AS OF v3.0d1 because As is const method - could do non-const As<> overload for these, but that would be confusing

         *      o   const wchar_t*

         *      o   const Character*

         *

         *  \note

         *      o   As<u8string> () equivalent to AsUTF8 () call

         *      o   As<u16string> () equivalent to AsUTF16 () call

         *      o   As<u32string> () equivalent to AsUTF32 () call

         *

         *  \note   We tried to also have template<typename T> explicit operator T () const; - conversion operator - but

         *          We got too frequent confusion in complex combinations of templates, like with:

         *          Set<String> x ( *optional<String> {String{}} );       // fails cuz calls operator Set<String> ()!

         *          Set<String> x { *optional<String> {String{}} };       // works as expected

         */

        template <typename T>

        nonvirtual T As () const

            requires (IBasicUNICODEStdString<T> or same_as<T, String> or constructible_from<T, wstring>);


    public:

        /**

         *  Create a narrow string object from this, based on the encoding from the argument locale.

         *  This throws an exception if there is an error performing the conversion, and the 'into' overload

         *  leaves 'into' in an undefined (but safe) state.

         */

        nonvirtual string AsNarrowString (const locale& l) const;

        nonvirtual string AsNarrowString (const locale& l, AllowMissingCharacterErrorsFlag) const;


    public:

        /**

         * Convert String losslessly into a standard C++ type.

         * Only specifically specialized variants are supported.

         *

         *  SUPPORTED result type "T": values are:

         *      string

         *      u8string

         */

        template <typename T = u8string>

        nonvirtual T AsUTF8 () const

            requires (same_as<T, string> or same_as<T, u8string>);


    public:

        /**

         * Convert String losslessly into a standard C++ type u16string.

         *

         *  \par Example Usage:

         *      \code

         *          String s = u"hi mom";

         *          u16string su    =   s.AsUTF16 ();

         *      \endcode

         *

         *  \note - the resulting string may have a different length than this->size() due to surrogates

         *

         *  \note wstring is also accepted for T, but only when sizeof (wchar_t) == sizeof (char16_t)

         */

        template <typename T = u16string>

        nonvirtual T AsUTF16 () const

            requires (same_as<T, u16string> or (sizeof (wchar_t) == sizeof (char16_t) and same_as<T, wstring>));


    public:

        /**

         * Convert String losslessly into a standard C++ type u32string.

         *

         *  \par Example Usage:

         *      \code

         *          String s = u"hi mom";

         *          u32string su    =   s.AsUTF32 ();

         *      \endcode

         *

         *  \note - As of Stroika 2.1d23 - the resulting string may have a different length than this->size() due to surrogates,

         *          but eventually the intent is to fix Stroika's string class so this is not true, and it returns the length of the string

         *          in size () with surrogates removed (in other words uses ucs32 representation). But not there yet.

         */

        template <typename T = u32string>

        nonvirtual T AsUTF32 () const

            requires (same_as<T, u32string> or (sizeof (wchar_t) == sizeof (char32_t) and same_as<T, wstring>));


    public:

        /**

         *  See docs on SDKChar for meaning (character set).

         *

         *  Note - many UNICODE Strings cannot be represented in the SDKString character set (especially if narrow - depends a lot).

         *  But in that case, AsSDKString () will throw, unless AllowMissingCharacterErrorsFlag is specified.

         */

        nonvirtual SDKString AsSDKString () const;

        nonvirtual SDKString AsSDKString (AllowMissingCharacterErrorsFlag) const;


    public:

        /**

         *  See docs on SDKChar for meaning (character set). If SDKChar is a wide character, there is probably still a

         *  default 'code page' to interpret narrow characters (Windows CP_ACP). This is a string in that character set.

         *

         *  Note - many UNICODE Strings cannot be represented in the SDKString character set (especially if narrow - depends a lot).

         *  But in that case, AsNarrowSDKString () will throw, unless AllowMissingCharacterErrorsFlag is specified.

         */

        nonvirtual string AsNarrowSDKString () const;

        nonvirtual string AsNarrowSDKString (AllowMissingCharacterErrorsFlag) const;


    public:

        /**

         * Convert String losslessly into a standard C++ type.

         * Any T providing empty () and push_back (ASCII) is accepted (see Supported Types below).

         * The source string MUST contain only valid ASCII characters - otherwise this throws RuntimeErrorException<>

         *

         *  \par Example Usage:

         *      \code

         *          string a1    =  String{"hi mom"}.AsASCII ();    // OK

         *          string a2    =  String{u"שלום"}.AsASCII ();     // throws

         *      \endcode

         *

         *  \note - this is a (compatible) change of behavior: before Stroika v2.1d23, this would assert out on invalid ASCII.

         *

         *  Supported Types:

         *      o   Memory::StackBuffer<char>

         *      o   string

         *      o   u8string        (note any ASCII string is also legit utf-8)

         */

        template <typename T = string>

        nonvirtual T AsASCII () const

            requires requires (T* into) {

                { into->empty () } -> same_as<bool>;

                { into->push_back (ASCII{0}) };

            };


    public:

        /**

         * Convert String losslessly into a standard C++ type.

         * Any T providing empty () and push_back (ASCII) is accepted (see Supported Types(T) below).

         * If this source contains any invalid ASCII characters, this returns nullopt, and else a valid engaged string.

         *

         *  Supported Types(T):

         *      o   Memory::StackBuffer<char>

         *      o   string

         *      o   u8string (note any valid ASCII string is also valid utf-8)

         */

        template <typename T = string>

        nonvirtual optional<T> AsASCIIQuietly () const

            requires requires (T* into) {

                { into->empty () } -> same_as<bool>;

                { into->push_back (ASCII{0}) };

            };


    public:

        /**

         *  \brief Summary data for raw contents of rep - each rep will support at least one of these span forms

         *

         *  Each rep will support a span of at least one code-point type (ascii, utf8, utf16, or utf32)

         *

         *  This API is guaranteed to support a span of at least one of these types (maybe more). The caller may

         *  specify the code-point type preferred.

         *

         *  \note eAscii is a subset of eSingleByteLatin1, so when the type eAscii is returned, EITHER fSingleByteLatin1 or fAscii

         *        may be used.

         *

         *  This API is public, but best to avoid depending on internals of String API - like PeekSpanData - since

         *  this reasonably likely to change in future versions.

         */


        struct PeekSpanData {


            /**

             *  Names the element type of the span stored in this PeekSpanData.

             */

            enum StorageCodePointType {

                /**

                 *  ASCII is useful to track in storage (though same size as eSingleByteLatin1) - because requests

                 *  to convert to UTF-8 are free - ASCII is legit UTF8 (not true for eSingleByteLatin1)

                 */

                eAscii,

                /**

                 *  Latin1 - 8 bit representation of characters. But 256 of them - more than plain ascii.

                 *  And cheap/easy to convert to UNICODE (since code points of wider characters exactly the same values).

                 */

                eSingleByteLatin1,

                /**

                 *  Data is a span of char16_t elements (see fChar16).

                 */

                eChar16,

                /**

                 *  Data is a span of char32_t elements (see fChar32).

                 */

                eChar32

            };


            /**

             *  Storage type of the data; NOTE(review): presumably this is the discriminator saying which union member

             *  below is valid - confirm against GetPeekSpanData ()/PeekData () implementations.

             */

            StorageCodePointType fInCP;

            /**

             *  One span per StorageCodePointType enumerator. Being a union, the members share storage, so only

             *  read the member corresponding to the stored representation.

             */

            union {

                span<const ASCII>    fAscii;

                span<const Latin1>   fSingleByteLatin1;

                span<const char16_t> fChar16;

                span<const char32_t> fChar32;

            };

        };


    public:

        /**

         *  \brief return the constant character data inside the string in the form of a case variant union of different span types (at least one will be there)

         *         templated type arg just used to pick a preferred type.

         *

         *  \note CHAR_TYPE == char implies eAscii

         *

         *  \note Reason for the two step API - getting the PeekSpanData, and then using - is because getting

         *        the data is most expensive part (virtual function), and the packaged PeekSpanData gives enuf

         *        info to do the next steps (quickly inline usually)

         *

         *  This API is public, but best to avoid depending on internals of String API - like PeekSpanData - since

         *  this reasonably likely to change in future versions.

         */

        template <IUNICODECanUnambiguouslyConvertFrom CHAR_TYPE = ASCII>

        nonvirtual PeekSpanData GetPeekSpanData () const;


    public:

        /**

         *  \brief return the constant character data inside the string in the form of a span or nullopt if not available for that CHAR_TYPE

         *

         *  This API is public, but best to avoid depending on internals of String API - like PeekSpanData - since

         *  this reasonably likely to change in future versions.

         *

         *  \note It is generally true that the data IsASCII (span) IFF PeekData<ASCII> returns non-nullopt. But this is

         *        not ACTUALLY always true. Generally, Stroika constructs strings like this. But callers may manually construct

         *        a String with backend rep u32string, for example (e.g. because of move construct) - and that might just happen

         *        to be all ascii. You can count on this: IF you get back a value from PeekData<ASCII> - it must be all ASCII. But

         *        the converse is not always true (an all-ASCII string may still yield nullopt from PeekData<ASCII>).

         */

        template <IUNICODECanUnambiguouslyConvertFrom CHAR_TYPE>

        static optional<span<const CHAR_TYPE>> PeekData (const PeekSpanData& pds);

        template <IUNICODECanUnambiguouslyConvertFrom CHAR_TYPE>

        nonvirtual optional<span<const CHAR_TYPE>> PeekData () const;


    public:

        /**

         *  \brief return the constant character data inside the string (rep) in the form of a span, possibly quickly and directly, and possibly copied into possiblyUsedBuffer

         *

         *  This API will typically return a span of data which is internal pointers into the data of the rep (and so its invalidated on the

         *  next change to the string).

         *

         *  BUT - it maybe a span of data stored into the argument possiblyUsedBuffer (which is why it must be provided - cannot be nullptr).

         *  If you want the freedom to not pass in this buffer, see the PeekData API.

         *

         *  \note - CHAR_T must satisfy the concept IUNICODECanAlwaysConvertTo - SAFELY - because the string MIGHT contain characters not in any

         *          unsafe char class (like ASCII or Latin1), and so there might not be a way to do the conversion. Use

         *          PeekData () to do that - where it can return nullopt if no conversion possible.

         *

         *  \par Example Usage

         *      \code

         *          Memory::StackBuffer<char8_t> maybeIgnoreBuf1;

         *          span<const char8_t>          thisData = GetData (&maybeIgnoreBuf1);

         *      \endcode

         *

         *  \note Prior to Stroika v3.0d1, GetData() took no arguments, and returned pair<const CHAR_TYPE*, const CHAR_TYPE*>

         *        which is pretty similar, but not quite the same. To adapt any existing code calling that older version of the API

         *        just add a Memory::StackBuffer<T> b; and pass &b to GetData(); And the return span is not the same as pair<> but

         *        easily convertible.

         */

        template <IUNICODECanAlwaysConvertTo CHAR_TYPE, size_t STACK_BUFFER_SZ>

        static span<const CHAR_TYPE> GetData (const PeekSpanData& pds, Memory::StackBuffer<CHAR_TYPE, STACK_BUFFER_SZ>* possiblyUsedBuffer);

        template <IUNICODECanAlwaysConvertTo CHAR_TYPE, size_t STACK_BUFFER_SZ>

        nonvirtual span<const CHAR_TYPE> GetData (Memory::StackBuffer<CHAR_TYPE, STACK_BUFFER_SZ>* possiblyUsedBuffer) const;


    public:

        struct EqualsComparer;


    public:

        struct LessComparer;


    public:

        struct ThreeWayComparer;


    public:

        /**

         *  Return true if case sensitive compare of the two IConvertibleToString objects have the same characters.

         *  Indirects to EqualsComparer{eWithCase} (...)

         *

         *  \note Both the plain (non-template) declaration of operator== and the 'requires (not ...)' clause on the template

         *        overload appear to be required on all major compilers, due to quirks of the operator== rewrite rules, but I don't fully understand why --LGP 2024-11-18.

         */

        nonvirtual bool operator== (const String& rhs) const;

        template <IConvertibleToString T>

        nonvirtual bool operator== (T&& rhs) const

            requires (not same_as<remove_cvref_t<T>, String>);


    public:

        /**

         *  Return strong_ordering of case sensitive (three-way) compare of the two IConvertibleToString objects.

         *  Indirects to ThreeWayComparer{eWithCase} (...)

         *

         *  \see operator== ()

         */

        nonvirtual strong_ordering operator<=> (const String& rhs) const;

        template <IConvertibleToString T>

        nonvirtual strong_ordering operator<=> (T&& rhs) const

            requires (not same_as<remove_cvref_t<T>, String>);


    public:

        /**

         *  @aliases basic_string<char>::npos

         *

         *  This is only used for 'STL-compatibility' APIs, like substr (), find (), rfind (), etc.

         */

        static constexpr size_t npos = static_cast<size_t> (-1);


    public:

        /**

         *  @aliases size

         */

        nonvirtual size_t length () const noexcept;


    public:

        /**

         *  \note BREAKING change between Stroika 2.1 and v3 - const c_str/0 no longer guaranteed to return non-null

         *

         *        Mitigating this, the non-const c_str() still will return non-null, and the const overload taking

         *        StackBuffer<wchar_t> will also guarantee returning non-null.

         *

         *        In the case of the overloads taking no arguments, the lifetime of the returned pointer is until the

         *        next change to this string.  In the case of the StackBuffer overload, the guarantee extends for the lifetime

         *        of the argument buffer (typically just the next few lines of code).

         *

         *  This will always return a value which is NUL-terminated.

         *

         *  Note also - the c_str () function CAN now be somewhat EXPENSIVE, causing a mutation of the String object, so use

         *  one of the const overloads where possible (or where performance matters).

         *

         *  \note Why does c_str (StackBuffer) return a tuple?

         *        Sometimes you just want a plain const wchar_t* you can use with an old C pointer based API. But that

         *        fails/asserts out if you happen to have an empty string and try to get the pointer. Sometimes - you just need

         *        the pointer!

         *

         *        And why the string-view part? Because sometimes you want the LENGTH. Sure - you can just compute it again. But

         *        that is costly. Sure you can just use the original string length. BUT THAT WOULD BE A BUG once I support

         *        surrogates properly (at least on windows where wchar_t isn't char32_t).

         */

        nonvirtual tuple<const wchar_t*, wstring_view> c_str (Memory::StackBuffer<wchar_t>* possibleBackingStore) const;


    public:

        /**

         *  Follow the basic_string<>::find () API

         *

         *  need more overloads.

         *

         *  Returns String::npos if not found, else the zero based index.

         */

        nonvirtual size_t find (Character c, size_t startAt = 0) const;

        nonvirtual size_t find (const String& s, size_t startAt = 0) const;


    public:

        /**

         *  Follow the basic_string<>::rfind () API

         *

         *   need more overloads.

         *

         *   Returns String::npos if not found, else the zero based index.

         */

        nonvirtual size_t rfind (Character c) const;


    public:

        /**

         *  mimic https://en.cppreference.com/w/cpp/string/basic_string/front

         *

         *  \pre not empty ()

         */

        nonvirtual Character front () const;


    public:

        /**

         *  mimic https://en.cppreference.com/w/cpp/string/basic_string/back

         *

         *  \pre not empty ()

         */

        nonvirtual Character back () const;


    public:

        /**

         *  Compatible with STL::basic_string::substr() - which interprets second argument as count. Not the same

         *  as Stroika::String::SubString (where the second argument is a 'to')

         *

         *  @see SubString

         *

         *  From http://en.cppreference.com/w/cpp/string/basic_string/substr

         *      Returns a substring [pos, pos+count). If the requested substring extends

         *      past the end of the string, or if count == npos, the returned substring is [pos, size()).

         *      std::out_of_range if pos > size()

         */

        nonvirtual String substr (size_t from, size_t count = npos) const;


    public:

        ///////////////// DEPRECATED FUNCTIONS /////////////////

        [[deprecated ("Since Stroika v3.0d13 - if you must use c_str() - use the overload taking StackBuffer arg), or use As<wstring> "

                      "().c_str ()")]] const wchar_t*

                                                                               c_str ();

        [[deprecated ("Since Stroika v3.0d12 use StringBuilder::SetAt")]] void SetCharAt (Character c, size_t i);

        [[deprecated ("Since Stroika v3.0d12 use StringBuilder")]] void        erase (size_t from = 0);

        [[deprecated ("Since Stroika v3.0d12 use StringBuilder")]] void        erase (size_t from, size_t count);

        [[deprecated ("Since Stroika v3.0d12 use StringBuilder")]] void        push_back (wchar_t c);

        [[deprecated ("Since Stroika v3.0d12 use StringBuilder")]] void        push_back (Character c);

        [[deprecated ("Since Stroika v3.0d12 use StringBuilder")]] void        Append (Character c);

        [[deprecated ("Since Stroika v3.0d12 use StringBuilder")]] void        Append (const String& s);

        [[deprecated ("Since Stroika v3.0d12 use StringBuilder")]] void        Append (const wchar_t* s);

        [[deprecated ("Since Stroika v3.0d12 use StringBuilder")]] void        Append (const wchar_t* from, const wchar_t* to);

        [[deprecated ("Since Stroika v3.0d12 use StringBuilder")]] void        Append (const Character* from, const Character* to);

        template <typename CHAR_T>

        [[deprecated ("Since Stroika v3.0d12 use StringBuilder")]] void Append (span<const CHAR_T> s)

            requires (same_as<CHAR_T, Character> or same_as<CHAR_T, char32_t>);

        [[deprecated ("Since Stroika v3.0d12 use StringBuilder")]] String&    operator+= (Character appendage);

        [[deprecated ("Since Stroika v3.0d12 use StringBuilder")]] String&    operator+= (const String& appendage);

        [[deprecated ("Since Stroika v3.0d12 use StringBuilder")]] String&    operator+= (const wchar_t* appendageCStr);

        /**
         *  (DEPRECATED) Replace the contents of this String with a default-constructed String.
         *
         *  Callers should simply assign instead:  s = String{};
         */
        [[deprecated ("Since Stroika v3.0d12 - just assign String{} instead")]] void clear ()
        {
            *this = String{};
        }

        /**
         *  (DEPRECATED) Out-parameter flavor of As<T> (): stores the result of this->As<T> () in *into.
         *
         *  \note 'into' is dereferenced unconditionally, so it must point at a valid T.
         */
        template <typename T>
        [[deprecated ("Since Stroika v3.0d2, just use 0 arg version)")]] void As (T* into) const
            requires (IBasicUNICODEStdString<T> or same_as<T, String>)
        {
            T& destination = *into;
            destination    = this->As<T> ();
        }

        [[deprecated ("Since Stroika v3.0d2, just use 1 arg version)")]] void AsNarrowString (const locale& l, string* into) const

        {

            *into = this->AsNarrowString (l);

        }

        template <typename T = u8string>

        [[deprecated ("Since Stroika v3.0d2 - use AsUTF8/0")]] void AsUTF8 (T* into) const

            requires (same_as<T, string> or same_as<T, u8string>)

        {

            *into = this->AsUTF8 ();

        }

        template <typename T = u16string>

        [[deprecated ("Since Stroika v3.0d2 - use AsUTF16/0")]] void AsUTF16 (T* into) const

            requires (same_as<T, u16string> or (sizeof (wchar_t) == sizeof (char16_t) and same_as<T, wstring>))

        {

            *into = AsUTF16 ();

        }

        template <typename T = u32string>

        [[deprecated ("Since Stroika v3.0d2 - use AsUTF32/0")]] void AsUTF32 (T* into) const

            requires (same_as<T, u32string> or (sizeof (wchar_t) == sizeof (char32_t) and same_as<T, wstring>))

        {

            *into = AsUTF32 ();

        }

        /**
         *  (DEPRECATED) Out-parameter flavor of AsSDKString (): stores the result of the zero-argument
         *  AsSDKString () in *into.
         *
         *  \note 'into' is dereferenced unconditionally, so it must point at a valid SDKString.
         */
        [[deprecated ("Since Stroika v3.0d2 - just use /0")]] void AsSDKString (SDKString* into) const
        {
            SDKString& destination = *into;
            destination            = AsSDKString ();
        }

        /**
         *  (DEPRECATED) Stores SDK2Narrow (AsSDKString ()) in *into.
         *
         *  \note 'into' is dereferenced unconditionally, so it must point at a valid string.
         */
        [[deprecated ("Since Stroika v3.0d2 - just use /0")]] void AsNarrowSDKString (string* into) const
        {
            string& destination = *into;
            destination         = SDK2Narrow (AsSDKString ());
        }

        /**
         *  (DEPRECATED) Out-parameter flavor of AsASCII: forwards to AsASCIIQuietly (into) and, if that
         *  returns false, calls ThrowInvalidAsciiException_ () (declared [[noreturn]]).
         *
         *  T may be string or Memory::StackBuffer<char> (see the requires clause).
         */
        template <typename T = string>
        [[deprecated ("Since v3.0d2 use /0")]] void AsASCII (T* into) const
            requires (same_as<T, string> or same_as<T, Memory::StackBuffer<char>>)
        {
            const bool converted = AsASCIIQuietly (into);
            if (converted) {
                return;
            }
            ThrowInvalidAsciiException_ ();
        }

        /**
         *  (DEPRECATED) Out-parameter flavor of AsASCIIQuietly ().
         *
         *  If the zero-argument overload produces a value, it is stored in *into and true is returned;
         *  otherwise *into is left untouched and false is returned.
         *
         *  T may be string or Memory::StackBuffer<char> (see the requires clause).
         */
        template <typename T = string>
        [[deprecated ("Since v3.0d2 use /0 overload")]] bool AsASCIIQuietly (T* into) const
            requires (same_as<T, string> or same_as<T, Memory::StackBuffer<char>>)
        {
            // Request T explicitly: a bare AsASCIIQuietly () yields that overload's default result type, which is
            // not assignable to *into when T is Memory::StackBuffer<char>.
            // NOTE(review): assumes the zero-argument AsASCIIQuietly is templated on its result type - confirm.
            if (auto converted = this->AsASCIIQuietly<T> ()) {
                *into = *converted;
                return true;
            }
            return false;
        }

        /**
         *  (DEPRECATED) bool-flag flavor of LimitLength: keepLeft == true maps to
         *  StringShorteningPreference::ePreferKeepLeft, false to StringShorteningPreference::ePreferKeepRight,
         *  and the call is forwarded to the StringShorteningPreference overload.
         */
        [[deprecated ("Since Stroika v3.0d5 use StringShorteningPreference argument")]] String LimitLength (size_t maxLen, bool keepLeft) const
        {
            if (keepLeft) {
                return LimitLength (maxLen, StringShorteningPreference::ePreferKeepLeft);
            }
            return LimitLength (maxLen, StringShorteningPreference::ePreferKeepRight);
        }

        /**
         *  (DEPRECATED) bool-flag flavor of LimitLength taking an explicit ellipsis: keepLeft == true maps to
         *  StringShorteningPreference::ePreferKeepLeft, false to StringShorteningPreference::ePreferKeepRight,
         *  and the call (with ellipsis passed through unchanged) is forwarded to the StringShorteningPreference overload.
         */
        [[deprecated ("Since Stroika v3.0d5 use StringShorteningPreference argument")]] String LimitLength (size_t maxLen, bool keepLeft,
                                                                                                            const String& ellipsis) const
        {
            if (keepLeft) {
                return LimitLength (maxLen, StringShorteningPreference::ePreferKeepLeft, ellipsis);
            }
            return LimitLength (maxLen, StringShorteningPreference::ePreferKeepRight, ellipsis);
        }

        template <typename CHAR_T>

        [[deprecated ("Since Stroika v3.0d1, String{}")]] static String FromASCII (span<const CHAR_T> s)

        {

            return String{s};

        }

        template <typename CHAR_T>

        [[deprecated ("Since Stroika v3.0d1, String{}")]] static String FromASCII (const CHAR_T* cString)

        {

            return String{cString};

        }

        template <IStdBasicStringCompatibleCharacter CHAR_T>

        [[deprecated ("Since Stroika v3.0d1, String{}")]] static String FromASCII (const basic_string<CHAR_T>& str)

        {

            return String{str};

        }

        [[deprecated ("Since Stroika v3.0d1, use span{} overload for this")]] static String FromASCII (const char* from, const char* to)

        {

            return String{span{from, to}};

        }

        [[deprecated ("Since Stroika v3.0d1, use span{} overload for this")]] static String FromASCII (const wchar_t* from, const wchar_t* to)

        {

            return String{span{from, to}};

        }

        /**
         *  (DEPRECATED) Pointer-pair flavor of InsertAt for wchar_t data.
         *
         *  Sizes a StackBuffer<Character> via UTFConvert::ComputeTargetBufferSize<Character>, converts [from, to)
         *  into it with UTFConvert::kThe.ConvertSpan, and forwards the converted span to the span-based InsertAt.
         */
        [[deprecated ("Since Stroika v3.0d1, use span overloads")]] String InsertAt (const wchar_t* from, const wchar_t* to, size_t at) const
        {
            const span<const wchar_t>      source{from, to};
            Memory::StackBuffer<Character> buf{Memory::eUninitialized, UTFConvert::ComputeTargetBufferSize<Character> (source)};
            return InsertAt (UTFConvert::kThe.ConvertSpan (source, span{buf}), at);
        }

        [[deprecated ("Since Stroika v3.0d1, use span overloads")]] String InsertAt (const Character* from, const Character* to, size_t at) const

        {

            return InsertAt (span{from, to}, at);

        }

        [[deprecated ("Since Stroika v3.0d1, use span{} overload for this")]] static String FromLatin1 (const char* start, const char* end)

        {

            return FromLatin1 (span{start, end});

        }

        [[deprecated ("Since Stroika v3.0d1, use span{} constructor for this")]] static String FromNarrowString (const char* from,

                                                                                                                 const char* to, const locale& l)

        {

            return FromNarrowString (span{from, to}, l);

        }

        [[deprecated ("Since Stroika v3.0d1, use span{} constructor for this")]] static String FromNarrowSDKString (const char* from, const char* to)

        {

            return FromNarrowSDKString (span{from, to});

        }

        template <IUNICODECanAlwaysConvertTo CHAR_T>

        [[deprecated ("Since Stroika v3.0d1, use span{} constructor for this")]] String (const CHAR_T* from, const CHAR_T* to)

            : String{span<const CHAR_T>{from, to}}

        {

        }

        [[deprecated (

            "Since Stroika v3.0d1 - use As<wstring> ().c_str () or other c_str() overload (*UNSAFE TO USE*)")]] nonvirtual const wchar_t*

        c_str () const noexcept;

        [[deprecated ("Since Stroika v3.0 - use span{} overloads")]] inline static String FromSDKString (const SDKChar* from, const SDKChar* to)

        {

            return FromSDKString (span{from, to});

        }

        [[deprecated ("Since Stroika v3.0 - use span{} overloads")]] static String FromUTF8 (const char* from, const char* to)

        {

            return FromUTF8 (span{from, to});

        }

        [[deprecated ("Since Stroika v3.0 - use span{} overloads")]] static String FromUTF8 (const char8_t* from, const char8_t* to)

        {

            return FromUTF8 (span{from, to});

        }

        template <typename T = string>

        [[deprecated ("Since Stroika v3.0d1 - use Character::AsAsciiQuietly")]] static bool AsASCIIQuietly (const wchar_t* fromStart,

                                                                                                            const wchar_t* fromEnd, T* into)

        {

            return Character::AsASCIIQuietly (span<const wchar_t>{fromStart, fromEnd}, into);

        }

        [[deprecated (

            "Since Stroika v3.0d1 due to http://stroika-bugs.sophists.com/browse/STK-965 - NOT IMPLEMENTED")]] nonvirtual const wchar_t*

                                                                           data () const;

        [[deprecated ("Since Stroika v3.0d8 - use RemoveFirstIf")]] String Remove (Character c) const

        {

            return RemoveFirstIf (c);

        }

        [[deprecated ("Since Stroika v3.0d8 - use RemoveFirstIf")]] String Remove (const String& subString) const

        {

            return RemoveFirstIf (subString);

        }


    private:

        static shared_ptr<_IRep> mkEmpty_ ();


    private:

        /**

         *  If the argument CHAR_T is restrictive (such as ASCII/char) - this CHECKS and THROWS (Character::CheckASCII).

         *  This function also reads the data, and sees if it can downshift 'CHAR_T' to something more restrictive, and produces

         *  a possibly smaller rep.

         *

         *  For some overloads (e.g. && move) - the data is 'stolen/moved'.

         *

         *  See mk_nocheck_ for a simpler - DO WHAT I SAID - operation.

         */

        template <IUNICODECanUnambiguouslyConvertFrom CHAR_T>

        static shared_ptr<_IRep> mk_ (span<const CHAR_T> s);

        template <IUNICODECanUnambiguouslyConvertFrom CHAR_T>

        static shared_ptr<_IRep> mk_ (Iterable<CHAR_T> it);

        template <IUNICODECanUnambiguouslyConvertFrom CHAR_T>

        static shared_ptr<_IRep> mk_ (span<CHAR_T> s);

        template <IStdBasicStringCompatibleCharacter CHAR_T>

        static shared_ptr<_IRep> mk_ (basic_string<CHAR_T>&& s);


    private:

        /*

         *  Note the mk_nocheck_ - just does the mk of the buffer, but assuming the arguments are legit and will fit (though it may

         *  assert in DEBUG builds this is true).

         *

         *  This just blindly allocates the buffer of the given size/type for the given arguments.

         */

        template <typename CHAR_T>

        static shared_ptr<_IRep> mk_nocheck_ (span<const CHAR_T> s)

            requires (same_as<CHAR_T, ASCII> or same_as<CHAR_T, Latin1> or same_as<CHAR_T, char16_t> or same_as<CHAR_T, char32_t>);


    private:

        template <unsigned_integral T>

        nonvirtual size_t SubString_adjust_ (T fromOrTo, size_t myLength) const;

        template <signed_integral T>

        nonvirtual size_t SubString_adjust_ (T fromOrTo, size_t myLength) const;


    private:

        nonvirtual String SubString_ (const _SafeReadRepAccessor& thisAccessor, size_t from, size_t to) const;


    protected:

        nonvirtual void _AssertRepValidType () const;


    private:

        [[noreturn]] static void ThrowInvalidAsciiException_ (); // avoid include

    };


    static_assert (totally_ordered<String>);


#if qStroika_Foundation_Characters_AsPathAutoMapMSYSAndCygwin

    template <>

    std::filesystem::path String::As<std::filesystem::path> () const;

#endif


    /**

     *  operator<< ostream adapters work as you would expect and allow writing Stroika strings easily to ostreams such as cout.

     *

     *  \note uses AsNarrowSDKString (eIgnoreErrors)

     *

     *  The only catch - is that Stroika strings are UNICODE based, and so may not fit perfectly with 'char' based basic_ostream<>.

     *  To address this, Stroika strings are mapped to 'narrow sdk strings' - ignoring any errors. As this is generally not a very

     *  good practice to do (lossy) - and generally just done for debugging/diagnostic output, this was deemed acceptable (as of Stroika v3.0d6).

     */

    wostream& operator<< (wostream& out, const String& s);

    ostream&  operator<< (ostream& out, const String& s);


#if qStroika_HasComponent_googletest

    // For googletest compatibility

    void PrintTo (const String& s, std::ostream* os);

#endif


    /**

     * Protected helper Rep class.

     *

     *  \note   Important design note - String reps are IMMUTABLE. Changes to string like +=, create new string reps (so costly).

     *          Use StringBuilder for that purpose in performance sensitive code.

     */


    class String::_IRep : public Iterable<Character>::_IRep {

    public:

        /**

         *  Return the ith character in the string.

         *

         *  NOTE(review): declared noexcept, so presumably index < length is a precondition rather than a checked error - confirm.

         */

        virtual Character GetAt (size_t index) const noexcept = 0;


    public:

        /**

         *  Each rep will support a span of at least one code-point storage type (one of the kinds enumerated by

         *  PeekSpanData::StorageCodePointType: eAscii, eSingleByteLatin1, eChar16, eChar32).

         *

         *  This API is guaranteed to support a span of at least one of these types (maybe more). The caller may

         *  specify the code-point type preferred.

         *

         *  NOTE(review): 'preferred' looks like a hint only (it is optional and marked [[maybe_unused]]); presumably

         *  the fInCP field of the result reports which type was actually provided - confirm.

         */

        virtual PeekSpanData PeekData ([[maybe_unused]] optional<PeekSpanData::StorageCodePointType> preferred) const noexcept = 0;


    public:

        /*

         *  Return a pointer to mostly standard (wide, nul-terminated) C string,

         *  whose lifetime extends to the next non-const call on this rep, or nullptr.

         *

         *  It is only 'mostly' standard because it is allowed to have nul-chars embedded in it. But it will

         *  always have str[len] == 0;

         *

         *  \note Since Stroika v3.0d1, this can return nullptr (in which case the String library will allocate a new backend)

         *

         *  \post returnResult == nullptr or returnResult[len] == '\0';

         */

        virtual const wchar_t* c_str_peek () const noexcept = 0;


    private:

        // String is granted access to this rep's private members.
        friend class String;

    };


    // Some docs/testing: compile-time checks documenting which types do (and do not) satisfy IConvertibleToString.

    static_assert (not IConvertibleToString<int>);

    static_assert (not IConvertibleToString<char>); // would have been sensible to allow, but easily generates confusing results: because that means String x = 3 would work (confusing with overloads)

    static_assert (IConvertibleToString<string>);

    static_assert (IConvertibleToString<wstring>);

    static_assert (IConvertibleToString<u8string>);

    static_assert (IConvertibleToString<u16string>);

    static_assert (IConvertibleToString<u32string>);

    static_assert (not IConvertibleToString<optional<String>>);


    namespace Private_ {

        // This is just anything that can be treated as a 'span<const Character>'

        // clang-format off

        template <typename T>

        concept ICanBeTreatedAsSpanOfCharacter_ =

            derived_from<remove_cvref_t<T>, String>

            or same_as<remove_cvref_t<T>, u8string>

            or same_as<remove_cvref_t<T>, u8string_view>

            or same_as<remove_cvref_t<T>, u16string>

            or same_as<remove_cvref_t<T>, u16string_view>

            or same_as<remove_cvref_t<T>, u32string>

            or same_as<remove_cvref_t<T>, u32string_view>

            or same_as<remove_cvref_t<T>, wstring>

            or same_as<remove_cvref_t<T>, wstring_view>

            or same_as<remove_cvref_t<T>, const Character*>

            or same_as<remove_cvref_t<T>, const char8_t*>

            or same_as<remove_cvref_t<T>, const char16_t*>

            or same_as<remove_cvref_t<T>, const char32_t*>

            or same_as<remove_cvref_t<T>, const wchar_t*>

            ;

        // clang-format on


        template <ICanBeTreatedAsSpanOfCharacter_ USTRING, size_t STACK_BUFFER_SZ>

        span<const Character> AsSpanOfCharacters_ (USTRING&& s, Memory::StackBuffer<Character, STACK_BUFFER_SZ>* mostlyIgnoredBuf);

    }


    /**

     *

     *  \par Example Usage

     *      \code

     *          constexpr String::EqualsComparer kStringCIComparer_ {Characters::CompareOptions::eCaseInsensitive};

     *          if (kStringCIComparer_ (filename.extension (), ".HFCC"sv)) {

     *              compiledName = filename;

     *          }

     *      \endcode

     *

     *  \note There is no String::Equals() method, because it would look queer if it took one string argument, and if it was static

     *        it would essentially look like the above comparer, so little point.

     */


    struct String::EqualsComparer : Common::ComparisonRelationDeclarationBase<Common::ComparisonRelationType::eEquals> {

        /**

         *  optional CompareOptions to CTOR allows for case insensitive compares

         *  (defaults to eWithCase).

         */

        constexpr EqualsComparer (CompareOptions co = eWithCase);


        /**

         *  Equality test between any two arguments satisfying IConvertibleToString.

         *

         *  Taking the arguments as forwarding references (rather than as String) is a slight performance improvement.

         *  NOTE(review): presumably this avoids constructing String temporaries and honors fCompareOptions - the

         *  implementation is not visible here; confirm.

         */

        template <IConvertibleToString LT, IConvertibleToString RT>

        nonvirtual bool operator() (LT&& lhs, RT&& rhs) const;


        // Public data member. NOTE(review): presumably holds the CompareOptions passed to the constructor - confirm.
        CompareOptions fCompareOptions;


    private:

        // Private helpers, constrained to types satisfying Private_::ICanBeTreatedAsSpanOfCharacter_.
        // NOTE(review): presumably Cmp_ is the fast-path dispatcher and Cmp_Generic_ the fallback - confirm.
        template <Private_::ICanBeTreatedAsSpanOfCharacter_ LT, Private_::ICanBeTreatedAsSpanOfCharacter_ RT>

        bool Cmp_ (LT&& lhs, RT&& rhs) const;

        template <Private_::ICanBeTreatedAsSpanOfCharacter_ LT, Private_::ICanBeTreatedAsSpanOfCharacter_ RT>

        bool Cmp_Generic_ (LT&& lhs, RT&& rhs) const;

    };


    /**

     *  \brief three-way (strong_ordering) comparison function object for String-convertible arguments;

     *         declared as a Common::ComparisonRelationType::eThreeWayCompare relation.

     */

    struct String::ThreeWayComparer : Common::ComparisonRelationDeclarationBase<Common::ComparisonRelationType::eThreeWayCompare> {

        /**

         *  optional CompareOptions to CTOR allows for case insensitive compares

         *  (defaults to eWithCase).

         */

        constexpr ThreeWayComparer (CompareOptions co = eWithCase);


        /**

         *  Three-way compare of any two arguments satisfying IConvertibleToString, returning a strong_ordering.

         *

         *  Taking the arguments as forwarding references (rather than as String) is a slight performance improvement.

         *  NOTE(review): presumably this avoids constructing String temporaries and honors fCompareOptions - the

         *  implementation is not visible here; confirm.

         */

        template <IConvertibleToString LT, IConvertibleToString RT>

        nonvirtual strong_ordering operator() (LT&& lhs, RT&& rhs) const;


        // Public data member. NOTE(review): presumably holds the CompareOptions passed to the constructor - confirm.
        CompareOptions fCompareOptions;


    private:

        // Private helpers, constrained to types satisfying Private_::ICanBeTreatedAsSpanOfCharacter_.
        // NOTE(review): presumably Cmp_ is the fast-path dispatcher and Cmp_Generic_ the fallback - confirm.
        template <Private_::ICanBeTreatedAsSpanOfCharacter_ LT, Private_::ICanBeTreatedAsSpanOfCharacter_ RT>

        strong_ordering Cmp_ (LT&& lhs, RT&& rhs) const;

        template <Private_::ICanBeTreatedAsSpanOfCharacter_ LT, Private_::ICanBeTreatedAsSpanOfCharacter_ RT>

        strong_ordering Cmp_Generic_ (LT&& lhs, RT&& rhs) const;

    };


    /**

     *  \brief very similar to ThreeWayComparer but returns true if less

     */


    struct String::LessComparer : Common::ComparisonRelationDeclarationBase<Common::ComparisonRelationType::eStrictInOrder> {

        // Optional CompareOptions (default eWithCase). NOTE(review): presumably forwarded to fComparer_ - confirm.
        constexpr LessComparer (CompareOptions co = eWithCase);


        // NOTE(review): unlike EqualsComparer/ThreeWayComparer, the arguments here are unconstrained and taken
        // by value (not IConvertibleToString forwarding references) - confirm this asymmetry is intentional.
        template <typename T1, typename T2>

        nonvirtual bool operator() (T1 lhs, T2 rhs) const;


    private:

        // Three-way comparer held by value. NOTE(review): presumably operator() reports whether it orders lhs before rhs - confirm.
        ThreeWayComparer fComparer_;

    };


    static_assert (Common::IInOrderComparer<String::LessComparer, String>);


    inline namespace Literals {

        /**

         *  \brief shorthand for String::FromStringConstant { ARGUMENT }

         *

         *  \par Example:

         *      \code

         *          String s1 = "some-string"_k;

         *          String s2 = String::FromStringConstant ("some-string");

         *          String s3 = "some-string"sv;           // in most cases this will also work fine, and is preferable (since sv is part of C++ standard)

         *      \endcode

         *

         *  \note _k is STILL sometimes useful and better than sv, since the TYPE returned by _k IS a String

         *        (sv yields a string_view), so it will work in some overload contexts where sv would fail.

         *

         *  \note operator""_k with char*, requires that the argument string MUST BE ASCII (someday maybe lifted to allow Latin1)

         */

        String operator""_k (const ASCII* s, size_t len);

        String operator""_k (const wchar_t* s, size_t len);

        String operator""_k (const char8_t* s, size_t len);

        String operator""_k (const char16_t* s, size_t len);

        String operator""_k (const char32_t* s, size_t len);

    }


    /**

     *  Basic operator overload with the obvious meaning, and simply indirect to @String::Concatenate (const String& rhs)

     *

     *  \note Design Note

     *      Don't use member function so "x" + String{u"x"} works.

     *      Insist that EITHER LHS or RHS is a string (else operator applies too widely).

     *

     *  Both arguments must be convertible to a String, and at least one must be String or derived from String

     */

    template <IConvertibleToString LHS_T, IConvertibleToString RHS_T>

    String operator+ (LHS_T&& lhs, RHS_T&& rhs)

        requires (derived_from<remove_cvref_t<LHS_T>, String> or derived_from<remove_cvref_t<RHS_T>, String>);


    /**

     *  \brief StringCombiner is a simple function object used to combine two strings visually - used in Iterable<>::Join ()

     *

     *  This can combine strings in the obvious way (concatenation) - but defaults to separating them with a comma (', ').

     *

     *  \note the functional api - is to be given two strings, and a flag saying if the combination is the last one in the list,

     *        since in English, this is frequently rendered somewhat differently than the rest.

     */

    template <typename STRING = String>


    struct StringCombiner {

        // Separator text; defaults to ", ".
        STRING           fSeparator{", "sv};

        // Optional alternate separator. NOTE(review): presumably used in place of fSeparator when isLast is true - confirm in implementation.
        optional<STRING> fSpecialSeparatorForLastPair;

        // Combine lhs and rhs into one STRING; isLast flags that this is the final combination in the list.
        STRING           operator() (const STRING& lhs, const STRING& rhs, bool isLast) const;

    };


    /**

     *  kDefaultStringCombiner is just StringCombiner{}, rendered as a function object, so that it can be externed/imported

     *  in the Iterable code without imposing a dependency on the String code.

     */

    extern const function<String (String, String, bool)> kDefaultStringCombiner;


}


namespace Stroika::Foundation::Traversal {

    // specialized as performance optimization

    template <>

    Characters::String Iterable<Characters::String>::Join (const Characters::String& separator, const optional<Characters::String>& finalSeparator) const;

}


namespace std {

    // Specialization of std::hash for Stroika's String, so String can be used wherever a std::hash<T> is required
    // (for example as the default hasher of the standard unordered containers).
    template <>

    struct hash<Stroika::Foundation::Characters::String> {

        // Returns the hash value for arg. Only declared here; the definition is not visible in this section.
        size_t operator() (const Stroika::Foundation::Characters::String& arg) const;

    };

}


namespace Stroika::Foundation::Memory {

    class BLOB; // Forward declare to avoid mutual include issues

}


namespace Stroika::Foundation::DataExchange {

    // Primary template is only forward declared here; this header supplies just the String specialization below.
    template <typename T>

    struct DefaultSerializer; // Forward declare to avoid mutual include issues

    // Specialization for String: a function object mapping a String to a Memory::BLOB.
    // NOTE(review): the byte encoding used for the BLOB is chosen by the out-of-view definition - confirm there.
    template <>

    struct DefaultSerializer<Stroika::Foundation::Characters::String> {

        // Memory::BLOB is only forward declared at this point, so this can be a declaration only.
        Memory::BLOB operator() (const Stroika::Foundation::Characters::String& arg) const;

    };

}


/**
 *  Teach the wide-character flavor of std::format how to render a Stroika String.
 *
 *  Both parsing of the format-spec and the actual output are forwarded to the formatter for std::wstring;
 *  the String argument is converted with As<std::wstring> () before being handed over.
 *
 *  \note SUPER PRIMITIVE ROUGH FIRST DRAFT
 */
template <>
struct qStroika_Foundation_Characters_FMT_PREFIX_::formatter<Stroika::Foundation::Characters::String, wchar_t> {
    // The wstring formatter that does the real work (holds whatever state its parse () records).
    qStroika_Foundation_Characters_FMT_PREFIX_::formatter<std::wstring, wchar_t> fDelegate2_;

    // Let the delegate consume the format-spec, and report the position it stopped at.
    template <typename ParseContext>
    constexpr auto parse (ParseContext& ctx) -> typename ParseContext::iterator
    {
        typename ParseContext::iterator endOfSpec = fDelegate2_.parse (ctx);
        return endOfSpec;
    }

    // Convert the String to a std::wstring and let the delegate write it to ctx's output.
    template <typename FmtContext>
    auto format (Stroika::Foundation::Characters::String s, FmtContext& ctx) const -> typename FmtContext::iterator
    {
        const std::wstring asWide = s.As<std::wstring> ();
        return fDelegate2_.format (asWide, ctx);
    }
};


/**
 *  std::format support for String with narrow (char) format strings.
 *
 *  No format-spec options are interpreted: parse () just locates the '}' that closes the replacement field, and
 *  format () writes the String converted with String::AsNarrowSDKString ().
 */
template <>
struct qStroika_Foundation_Characters_FMT_PREFIX_::formatter<Stroika::Foundation::Characters::String, char> {
    bool ignoreerrors{true}; // maybe set from thread-local variable, or parse() settings, or both

    /**
     *  Skip over the (ignored) format-spec.
     *
     *  \return iterator referring to the first '}' in [ctx.begin (), ctx.end ()), or ctx.end () if there is none
     *          (a missing '}' is not reported as an error here).
     *
     *  \note The current character is tested BEFORE advancing. The std Formatter requirements allow an empty
     *        format-spec to be presented with *ctx.begin () == '}'; advancing first would step over that brace,
     *        and would also dereference the iterator without first comparing it against ctx.end ().
     */
    template <typename ParseContext>
    constexpr typename ParseContext::iterator parse (ParseContext& ctx)
    {
        auto it = ctx.begin ();
        while (it != ctx.end () and *it != '}') {
            ++it;
        }
        return it;
    }

    /**
     *  Write 's' (converted to a narrow SDK string) to ctx.out (), and return the advanced output iterator.
     *
     *  When ignoreerrors is set, the conversion is done with the eIgnoreErrors overload of AsNarrowSDKString ();
     *  otherwise the no-argument overload is used.
     */
    template <typename FmtContext>
    typename FmtContext::iterator format (Stroika::Foundation::Characters::String s, FmtContext& ctx) const
    {
        using namespace Stroika::Foundation::Characters;
        // really want to delegate to wchar_t version (with vformat) but no documented easy way to extract format_args from ctx (though its in there)
        const auto narrow = ignoreerrors ? s.AsNarrowSDKString (eIgnoreErrors) : s.AsNarrowSDKString ();
#if __cpp_lib_ranges >= 202207L
        return std::ranges::copy (narrow, ctx.out ()).out;
#else
        return format_to (ctx.out (), "{}", narrow);
#endif
    }
};


/*

 ********************************************************************************

 ***************************** Implementation Details ***************************

 ********************************************************************************

 */

#include "String.inl"


#endif /*_Stroika_Foundation_Characters_String_h_*/

Character.h

Compare.h

Stroika_Define_Enum_Bounds
#define Stroika_Define_Enum_Bounds(FIRST_ITEM, LAST_ITEM)
Definition Enumeration.h:109

Iterable.h

SharedByValue.h

StackBuffer.h

StdCompat.h

Stroika::Foundation::Characters::Character
Definition Character.h:218

Stroika::Foundation::Characters::Character::IsWhitespace
constexpr bool IsWhitespace() const noexcept
Definition Character.inl:394

Stroika::Foundation::Characters::RegularExpression
RegularExpression is a compiled regular expression which can be used to match on a String class.
Definition RegularExpression.h:25

Stroika::Foundation::Characters::RegularExpressionMatch
Definition RegularExpression.h:129

Stroika::Foundation::Characters::String::_IRep
Definition String.h:1737

Stroika::Foundation::Characters::String::_IRep::GetAt
virtual Character GetAt(size_t index) const noexcept=0

Stroika::Foundation::Characters::String::_IRep::PeekData
virtual PeekSpanData PeekData(optional< PeekSpanData::StorageCodePointType > preferred) const noexcept=0

Stroika::Foundation::Characters::StringBuilder
Similar to String, but intended to more efficiently construct a String. Mutable type (String is large...
Definition StringBuilder.h:73

Stroika::Foundation::Characters::String
String is like std::u32string, except it is much easier to use, often much more space efficient,...
Definition String.h:201

Stroika::Foundation::Characters::String::Contains
nonvirtual bool Contains(Character c, CompareOptions co=eWithCase) const
Definition String.inl:697

Stroika::Foundation::Characters::String::AsUTF8
nonvirtual T AsUTF8() const

Stroika::Foundation::Characters::String::length
nonvirtual size_t length() const noexcept
Definition String.inl:1051

Stroika::Foundation::Characters::String::ToUpperCase
nonvirtual String ToUpperCase() const
Definition String.cpp:1744

Stroika::Foundation::Characters::String::FromNarrowString
static String FromNarrowString(const char *from, const locale &l)
Definition String.inl:340

Stroika::Foundation::Characters::String::Matches
nonvirtual bool Matches(const RegularExpression &regEx) const
Definition String.cpp:1133

Stroika::Foundation::Characters::String::IsWhitespace
nonvirtual bool IsWhitespace() const
Definition String.cpp:1782

Stroika::Foundation::Characters::String::NormalizeTextToNL
nonvirtual String NormalizeTextToNL() const
Definition String.cpp:1201

Stroika::Foundation::Characters::String::Join
static String Join(const Iterable< String > &list, const String &separator=", "sv)
Definition String.cpp:1692

Stroika::Foundation::Characters::String::FromStringConstant
static String FromStringConstant(const CHAR_T(&cString)[SIZE])
Take the given argument data (constant span) - which must remain unchanged - constant - for the appli...
Definition String.inl:386

Stroika::Foundation::Characters::String::ColValue
nonvirtual String ColValue(size_t i, const String &valueIfMissing={}) const
see Col(i) - but with default value of empty string
Definition String.inl:715

Stroika::Foundation::Characters::String::NormalizeSpace
nonvirtual String NormalizeSpace(Character useSpaceCharacter=' ') const
Replace sequences of whitespace characters (space, tab, newline etc) with a single space (or argument...
Definition String.cpp:1229

Stroika::Foundation::Characters::String::FindEach
nonvirtual Containers::Sequence< pair< size_t, size_t > > FindEach(const RegularExpression &regEx) const
Definition String.cpp:966

Stroika::Foundation::Characters::String::c_str
nonvirtual tuple< const wchar_t *, wstring_view > c_str(Memory::StackBuffer< wchar_t > *possibleBackingStore) const
Definition String.inl:1055

Stroika::Foundation::Characters::String::operator==
nonvirtual bool operator==(const String &rhs) const
Definition String.inl:1115

Stroika::Foundation::Characters::String::Repeat
nonvirtual String Repeat(unsigned int count) const
Definition String.cpp:1424

Stroika::Foundation::Characters::String::FromSDKString
static String FromSDKString(const SDKChar *from)
Definition String.inl:447

Stroika::Foundation::Characters::String::LimitLength
nonvirtual String LimitLength(size_t maxLen, StringShorteningPreference keepPref=StringShorteningPreference::ePreferKeepLeft) const
return the first maxLen (or fewer if string shorter) characters of this string (adding ellipsis if tr...
Definition String.inl:745

Stroika::Foundation::Characters::String::RemoveAll
nonvirtual String RemoveAll(Character c) const
Definition String.cpp:823

Stroika::Foundation::Characters::String::FindEachMatch
nonvirtual Containers::Sequence< RegularExpressionMatch > FindEachMatch(const RegularExpression &regEx) const
Definition String.cpp:984

Stroika::Foundation::Characters::String::RemoveFirstIf
nonvirtual String RemoveFirstIf(Character c) const
Definition String.cpp:807

Stroika::Foundation::Characters::String::AsUTF32
nonvirtual T AsUTF32() const

Stroika::Foundation::Characters::String::AsNarrowSDKString
nonvirtual string AsNarrowSDKString() const
Definition String.inl:834

Stroika::Foundation::Characters::String::Col
nonvirtual optional< String > Col(size_t i) const
Useful to replace 'awk print $3' - replace with Col(2) - zero based.
Definition String.cpp:1362

Stroika::Foundation::Characters::String::InsertAt
nonvirtual String InsertAt(Character c, size_t at) const
Definition String.inl:719

Stroika::Foundation::Characters::String::rfind
nonvirtual size_t rfind(Character c) const
Definition String.inl:1075

Stroika::Foundation::Characters::String::FromNarrowSDKString
static String FromNarrowSDKString(const char *from)
Definition String.inl:470

Stroika::Foundation::Characters::String::AsNarrowString
nonvirtual string AsNarrowString(const locale &l) const
Definition String.cpp:1838

Stroika::Foundation::Characters::String::Concatenate
nonvirtual String Concatenate(T &&rhs) const
appends 'rhs' string to this string (without modifying this string) and returns the combined string

Stroika::Foundation::Characters::String::AsSDKString
nonvirtual SDKString AsSDKString() const
Definition String.inl:806

Stroika::Foundation::Characters::String::size
nonvirtual size_t size() const noexcept
Definition String.inl:534

Stroika::Foundation::Characters::String::EndsWith
nonvirtual bool EndsWith(const Character &c, CompareOptions co=eWithCase) const
Definition String.cpp:1088

Stroika::Foundation::Characters::String::ToLowerCase
nonvirtual String ToLowerCase() const
Definition String.cpp:1706

Stroika::Foundation::Characters::String::ReplaceAll
nonvirtual String ReplaceAll(const RegularExpression &regEx, const String &with) const
Definition String.cpp:1155

Stroika::Foundation::Characters::String::npos
static constexpr size_t npos
Definition String.h:1399

Stroika::Foundation::Characters::String::Replace
nonvirtual String Replace(size_t from, size_t to, const String &replacement) const
Definition String.cpp:1045

Stroika::Foundation::Characters::String::String
String()
Definition String.inl:266

Stroika::Foundation::Characters::String::SubString
nonvirtual String SubString(SZ from) const

Stroika::Foundation::Characters::String::Trim
nonvirtual String Trim(bool(*shouldBeTrimmed)(Character)=Character::IsWhitespace) const
Definition String.cpp:1592

Stroika::Foundation::Characters::String::operator<=>
nonvirtual strong_ordering operator<=>(const String &rhs) const
Definition String.inl:1105

Stroika::Foundation::Characters::String::back
nonvirtual Character back() const
Definition String.inl:1079

Stroika::Foundation::Characters::String::StartsWith
nonvirtual bool StartsWith(const Character &c, CompareOptions co=eWithCase) const
Definition String.cpp:1059

Stroika::Foundation::Characters::String::StripAll
nonvirtual String StripAll(bool(*removeCharIf)(Character)) const
Definition String.cpp:1664

Stroika::Foundation::Characters::String::AsASCII
nonvirtual T AsASCII() const

Stroika::Foundation::Characters::String::AssureEndsWith
nonvirtual String AssureEndsWith(const Character &c, CompareOptions co=eWithCase) const
Return *this if it ends with argument character, or append 'c' so that it ends with a 'c'.
Definition String.cpp:1123

Stroika::Foundation::Characters::String::CopyTo
nonvirtual span< CHAR_T > CopyTo(span< CHAR_T > s) const

Stroika::Foundation::Characters::String::AsUTF16
nonvirtual T AsUTF16() const

Stroika::Foundation::Characters::String::GetPeekSpanData
nonvirtual PeekSpanData GetPeekSpanData() const
return the constant character data inside the string in the form of a case variant union of different...

Stroika::Foundation::Characters::String::SafeSubString
nonvirtual String SafeSubString(SZ from) const

Stroika::Foundation::Characters::String::AsLines
nonvirtual Containers::Sequence< String > AsLines() const
break the String into a series of lines;
Definition String.cpp:1306

Stroika::Foundation::Characters::String::LTrim
nonvirtual String LTrim(bool(*shouldBeTrimmed)(Character)=Character::IsWhitespace) const
Definition String.cpp:1443

Stroika::Foundation::Characters::String::front
nonvirtual Character front() const
Definition String.inl:1086

Stroika::Foundation::Characters::String::Grep
nonvirtual Containers::Sequence< String > Grep(const String &fgrepArg) const
Breaks this string into Lines, with AsLines (), and applies the argument filter (as if with ....
Definition String.cpp:1341

Stroika::Foundation::Characters::String::FindEachString
nonvirtual Containers::Sequence< String > FindEachString(const RegularExpression &regEx) const
Definition String.cpp:1001

Stroika::Foundation::Characters::String::Skip
nonvirtual String Skip(size_t n) const
Return a substring of this string, starting at 'argument' n. If n > size(), return empty string.
Definition String.inl:604

Stroika::Foundation::Characters::String::RFind
nonvirtual optional< size_t > RFind(Character c) const noexcept
Definition String.cpp:1011

Stroika::Foundation::Characters::String::GetData
static span< const CHAR_TYPE > GetData(const PeekSpanData &pds, Memory::StackBuffer< CHAR_TYPE, STACK_BUFFER_SZ > *possiblyUsedBuffer)
return the constant character data inside the string (rep) in the form of a span, possibly quickly an...
Definition String.inl:967

Stroika::Foundation::Characters::String::Tokenize
nonvirtual Containers::Sequence< String > Tokenize() const
Definition String.cpp:1234

Stroika::Foundation::Characters::String::RemoveAt
nonvirtual String RemoveAt(size_t charAt) const
Definition String.inl:608

Stroika::Foundation::Characters::String::AsASCIIQuietly
nonvirtual optional< T > AsASCIIQuietly() const

Stroika::Foundation::Characters::String::FromLatin1
static String FromLatin1(const CHAR_T *cString)
Definition String.inl:355

Stroika::Foundation::Characters::String::PeekData
static optional< span< const CHAR_TYPE > > PeekData(const PeekSpanData &pds)
return the constant character data inside the string in the form of a span or nullopt if not availabl...
Definition String.inl:910

Stroika::Foundation::Characters::String::FromUTF8
static String FromUTF8(span< CHAR_T > from)
Definition String.inl:420

Stroika::Foundation::Characters::String::RTrim
nonvirtual String RTrim(bool(*shouldBeTrimmed)(Character)=Character::IsWhitespace) const
Definition String.cpp:1508

Stroika::Foundation::Characters::String::Find
nonvirtual optional< size_t > Find(Character c, CompareOptions co=eWithCase) const
Definition String.inl:685

Stroika::Foundation::Characters::String::substr
nonvirtual String substr(size_t from, size_t count=npos) const
Definition String.inl:1092

Stroika::Foundation::Characters::String::As
nonvirtual T As() const

Stroika::Foundation::Characters::String::find
nonvirtual size_t find(Character c, size_t startAt=0) const
Definition String.inl:1067

Stroika::Foundation::Containers::Set
Set<T> is a container of T, where once an item is added, additionally adds () do nothing.
Definition Library/Sources/Stroika/Foundation/Containers/Set.h:105

Stroika::Foundation::Memory::BLOB
Definition BLOB.h:68

Stroika::Foundation::Memory::InlineBuffer
Logically halfway between std::array and std::vector; Smart 'direct memory array' - which when needed...
Definition InlineBuffer.h:93

Stroika::Foundation::Traversal::Iterable
Iterable<T> is a base class for containers which easily produce an Iterator<T> to traverse them.
Definition Iterable.h:237

Stroika::Foundation::Traversal::Iterable< Character >::Iterable
Iterable(const Iterable &) noexcept=default
Iterable are safely copyable (by value). Since Iterable uses COW, this just copies the underlying poi...

Stroika::Foundation::Characters::IBasicUNICODEStdString
returns true iff T == u8string, u16string, u32string, or wstring - which std::string types can be una...
Definition String.h:116

Stroika::Foundation::Characters::IConvertibleToString
Definition String.h:142

Stroika::Foundation::Characters::IStdPathLike2UNICODEString
anything with a 'special .STRINGTYPE conversion' method to UNICODE string, such as filesystem::path
Definition String.h:124

Stroika::Foundation::Characters::IUNICODECanUnambiguouslyConvertFrom
IUNICODECanUnambiguouslyConvertFrom is any 'character representation type' where array of them unambi...
Definition Character.h:179

Stroika::Foundation::Common::IInOrderComparer
Definition Compare.h:223

Stroika::Foundation::Memory::ISpan
Definition Foundation/Memory/Common.h:43

Stroika::Foundation::Characters
Definition Character.h:31

Stroika::Foundation::Characters::ASCII
char ASCII
Stroika's string/character classes treat 'char' as being an ASCII character.
Definition Character.h:59

Stroika::Foundation::Characters::SDKChar
conditional_t< qTargetPlatformSDKUseswchar_t, wchar_t, char > SDKChar
Definition SDKChar.h:71

Stroika::Foundation::Characters::StringShorteningPreference
StringShorteningPreference
Definition String.h:99

Stroika::Foundation::Characters::SDKString
basic_string< SDKChar > SDKString
Definition SDKString.h:38

Stroika::Foundation::Characters::operator+
String operator+(LHS_T &&lhs, RHS_T &&rhs)
Definition String.inl:1294

Stroika::Foundation::Characters::kDefaultStringCombiner
const function< String(String, String, bool)> kDefaultStringCombiner
Definition String.inl:1319

Stroika::Foundation::Characters::AllowMissingCharacterErrorsFlag
AllowMissingCharacterErrorsFlag
Definition SDKString.h:54

Stroika::Foundation::Characters::operator<<
wostream & operator<<(wostream &out, const String &s)
Definition String.cpp:2035

Stroika::Foundation::Containers
Definition String.h:55

Stroika::Foundation::DataExchange
Definition String.h:1954

std
STL namespace.

Stroika::Foundation::Characters::String::EqualsComparer
Definition String.h:1820

Stroika::Foundation::Characters::String::LessComparer
very similar to ThreeWayComparer but returns true if less
Definition String.h:1867

Stroika::Foundation::Characters::String::PeekSpanData
Summary data for raw contents of rep - each rep will support at least one of these span forms.
Definition String.h:1270

Stroika::Foundation::Characters::String::PeekSpanData::StorageCodePointType
StorageCodePointType
Definition String.h:1271

Stroika::Foundation::Characters::String::PeekSpanData::eSingleByteLatin1
@ eSingleByteLatin1
Definition String.h:1281

Stroika::Foundation::Characters::String::PeekSpanData::eAscii
@ eAscii
Definition String.h:1276

Stroika::Foundation::Characters::StringCombiner
StringCombiner is a simple function object used to combine two strings visually - used in Iterable<>:...
Definition String.h:1923

Stroika::Foundation::Common::ComparisonRelationDeclarationBase
Definition Compare.h:267

Stroika::Foundation::DataExchange::DefaultSerializer
function object which serializes type T to a BLOB (or BLOB like) object
Definition DefaultSerializer.h:62