df/d79/a02402_source.html

 // StringUtils.cpp


 // Implements the various string helper functions:


 #include "Globals.h"


 #include "fmt/printf.h"


 #ifdef _MSC_VER

     // Under MSVC, link to WinSock2 (needed by RawBEToUTF8's byteswapping)

     #pragma comment(lib, "ws2_32.lib")

 #endif


 static unsigned char HexToDec(char a_HexChar)

 {

     switch (a_HexChar)

     {

         case '0': return 0;

         case '1': return 1;

         case '2': return 2;

         case '3': return 3;

         case '4': return 4;

         case '5': return 5;

         case '6': return 6;

         case '7': return 7;

         case '8': return 8;

         case '9': return 9;

         case 'a': return 10;

         case 'b': return 11;

         case 'c': return 12;

         case 'd': return 13;

         case 'e': return 14;

         case 'f': return 15;

         case 'A': return 10;

         case 'B': return 11;

         case 'C': return 12;

         case 'D': return 13;

         case 'E': return 14;

         case 'F': return 15;

     }

     return 0xff;

 }


 AStringVector StringSplit(const AString & str, const AString & delim)

 {

     AStringVector results;

     size_t cutAt = 0;

     size_t Prev = 0;

     while ((cutAt = str.find_first_of(delim, Prev)) != str.npos)

     {

         results.push_back(str.substr(Prev, cutAt - Prev));

         Prev = cutAt + 1;

     }

     if (Prev < str.length())

     {

         results.push_back(str.substr(Prev));

     }

     return results;

 }


 AStringVector StringSplitWithQuotes(const AString & str, const AString & delim)

 {

     AStringVector results;


     size_t cutAt = 0;

     size_t Prev = 0;

     size_t cutAtQuote = 0;


     while ((cutAt = str.find_first_of(delim, Prev)) != str.npos)

     {

         if (cutAt == Prev)

         {

             // Empty string due to multiple whitespace / whitespace at the beginning of the input

             // Just skip it

             Prev = Prev + 1;

             continue;

         }

         AString current = str.substr(Prev, cutAt - Prev);

         if ((current.front() == '"') || (current.front() == '\''))

         {

             Prev += 1;

             cutAtQuote = str.find_first_of(current.front(), Prev);

             if (cutAtQuote != str.npos)

             {

                 current = str.substr(Prev, cutAtQuote - Prev);

                 cutAt = cutAtQuote + 1;

             }

         }


         results.push_back(std::move(current));

         Prev = cutAt + 1;

     }


     if (Prev < str.length())

     {

         AString current = str.substr(Prev);


         // If the remant is wrapped in matching quotes, remove them:

         if (

             (current.length() >= 2) &&

             ((current.front() == '"') || (current.front() == '\'')) &&

             (current.front() == current.back())

         )

         {

             current = current.substr(1, current.length() - 2);

         }


         results.push_back(current);

     }


     return results;

 }


 AString StringJoin(const AStringVector & a_Strings, const AString & a_Delimeter)

 {

     if (a_Strings.empty())

     {

         return {};

     }


     // Do a dry run to gather the size

     const auto DelimSize = a_Delimeter.size();

     size_t ResultSize = a_Strings[0].size();

     std::for_each(a_Strings.begin() + 1, a_Strings.end(),

         [&](const AString & a_String)

         {

             ResultSize += DelimSize;

             ResultSize += a_String.size();

         }

     );


     // Now do the actual join

     AString Result;

     Result.reserve(ResultSize);

     Result.append(a_Strings[0]);

     std::for_each(a_Strings.begin() + 1, a_Strings.end(),

         [&](const AString & a_String)

         {

             Result += a_Delimeter;

             Result += a_String;

         }

     );

     return Result;

 }


 AStringVector StringSplitAndTrim(const AString & str, const AString & delim)

 {

     AStringVector results;

     size_t cutAt = 0;

     size_t Prev = 0;

     while ((cutAt = str.find_first_of(delim, Prev)) != str.npos)

     {

         results.push_back(TrimString(str.substr(Prev, cutAt - Prev)));

         Prev = cutAt + 1;

     }

     if (Prev < str.length())

     {

         results.push_back(TrimString(str.substr(Prev)));

     }

     return results;

 }


 AString TrimString(const AString & str)

 {

     size_t len = str.length();

     size_t start = 0;

     while (start < len)

     {

         if (static_cast<unsigned char>(str[start]) > 32)

         {

             break;

         }

         ++start;

     }

     if (start == len)

     {

         return "";

     }


     size_t end = len;

     while (end >= start)

     {

         if (static_cast<unsigned char>(str[end]) > 32)

         {

             break;

         }

         --end;

     }


     return str.substr(start, end - start + 1);

 }


 AString & InPlaceLowercase(AString & s)

 {

     std::transform(s.begin(), s.end(), s.begin(), ::tolower);

     return s;

 }


 AString & InPlaceUppercase(AString & s)

 {

     std::transform(s.begin(), s.end(), s.begin(), ::toupper);

     return s;

 }


 AString StrToLower(const AString & s)

 {

     AString res;

     res.resize(s.size());

     std::transform(s.begin(), s.end(), res.begin(), ::tolower);

     return res;

 }


 AString StrToUpper(const AString & s)

 {

     AString res;

     res.resize(s.size());

     std::transform(s.begin(), s.end(), res.begin(), ::toupper);

     return res;

 }


 int NoCaseCompare(const AString & s1, const AString & s2)

 {

     #ifdef _MSC_VER

         return _stricmp(s1.c_str(), s2.c_str());

     #else

         return strcasecmp(s1.c_str(), s2.c_str());

     #endif  // else _MSC_VER

 }


 size_t RateCompareString(const AString & s1, const AString & s2)

 {

     size_t MatchedLetters = 0;

     size_t s1Length = s1.length();


     if (s1Length > s2.length())

     {

         // Definitely not a match

         return 0;

     }


     for (size_t i = 0; i < s1Length; i++)

     {

         char c1 = static_cast<char>(toupper(s1[i]));

         char c2 = static_cast<char>(toupper(s2[i]));

         if (c1 == c2)

         {

             ++MatchedLetters;

         }

         else

         {

             break;

         }

     }

     return MatchedLetters;

 }


 void ReplaceString(AString & iHayStack, const AString & iNeedle, const AString & iReplaceWith)

 {

     // find always returns the current position for an empty needle; prevent endless loop

     if (iNeedle.empty())

     {

         return;

     }


     size_t pos1 = iHayStack.find(iNeedle);

     while (pos1 != AString::npos)

     {

         iHayStack.replace( pos1, iNeedle.size(), iReplaceWith);

         pos1 = iHayStack.find(iNeedle, pos1 + iReplaceWith.size());

     }

 }


 void ReplaceURL(AString & iHayStack, const AString & iNeedle, const AString & iReplaceWith)

 {

     auto ReplaceWith = URLEncode(iReplaceWith);

     ReplaceString(iHayStack, iNeedle, ReplaceWith);

 }


 AString & RawBEToUTF8(const char * a_RawData, size_t a_NumShorts, AString & a_UTF8)

 {

     a_UTF8.clear();

     a_UTF8.reserve(3 * a_NumShorts / 2);  // a quick guess of the resulting size

     for (size_t i = 0; i < a_NumShorts; i++)

     {

         a_UTF8.append(UnicodeCharToUtf8(GetBEUShort(&a_RawData[i * 2])));

     }

     return a_UTF8;

 }


 AString UnicodeCharToUtf8(unsigned a_UnicodeChar)

 {

     if (a_UnicodeChar < 0x80)

     {

         return AString{static_cast<char>(a_UnicodeChar)};

     }

     else if (a_UnicodeChar < 0x800)

     {

         return AString

         {

             static_cast<char>(192 + a_UnicodeChar / 64),

             static_cast<char>(128 + a_UnicodeChar % 64),

         };

     }

     else if (a_UnicodeChar - 0xd800 < 0x800)

     {

         // Error

         return AString();

     }

     else if (a_UnicodeChar < 0x10000)

     {

         return AString

         {

             static_cast<char>(224 + a_UnicodeChar / 4096),

             static_cast<char>(128 + (a_UnicodeChar / 64) % 64),

             static_cast<char>(128 + a_UnicodeChar % 64)

         };

     }

     else if (a_UnicodeChar < 0x110000)

     {

         return AString

         {

             static_cast<char>(240 + a_UnicodeChar / 262144),

             static_cast<char>(128 + (a_UnicodeChar / 4096) % 64),

             static_cast<char>(128 + (a_UnicodeChar / 64) % 64),

             static_cast<char>(128 + a_UnicodeChar % 64),

         };

     }

     else

     {

         // Error

         return AString();

     }

 }


 #ifdef __GNUC__

 #pragma GCC diagnostic push

 #pragma GCC diagnostic ignored "-Wimplicit-fallthrough"

 #endif

 // UTF-8 conversion code adapted from:

 //  https://stackoverflow.com/questions/2867123/convert-utf-16-to-utf-8-under-windows-and-linux-in-c


 // Begin of Unicode, Inc.'s code / information


 /*

 Notice from the original file:

 * Copyright 2001-2004 Unicode, Inc.

 *

 * Disclaimer

 *

 * This source code is provided as is by Unicode, Inc. No claims are

 * made as to fitness for any particular purpose. No warranties of any

 * kind are expressed or implied. The recipient agrees to determine

 * applicability of information provided. If this file has been

 * purchased on magnetic or optical media from Unicode, Inc., the

 * sole remedy for any claim will be exchange of defective media

 * within 90 days of receipt.

 *

 * Limitations on Rights to Redistribute This Code

 *

 * Unicode, Inc. hereby grants the right to freely use the information

 * supplied in this file in the creation of products supporting the

 * Unicode Standard, and to make copies of this file in any form

 * for internal or external distribution as long as this notice

 * remains attached.

 */


 #define UNI_MAX_BMP         0x0000FFFF

 #define UNI_MAX_UTF16       0x0010FFFF

 #define UNI_SUR_HIGH_START  0xD800

 #define UNI_SUR_LOW_START   0xDC00

 #define UNI_SUR_LOW_END     0xDFFF


 static const Byte trailingBytesForUTF8[256] =

 {

     0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,

     0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,

     0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,

     0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,

     0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,

     0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,

     1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,

     2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,  3, 3, 3, 3, 3, 3, 3, 3, 4, 4, 4, 4, 5, 5, 5, 5

 };


 static const unsigned int offsetsFromUTF8[6] =

 {

     0x00000000UL, 0x00003080UL, 0x000E2080UL,

     0x03C82080UL, 0xFA082080UL, 0x82082080UL

 };


 static bool isLegalUTF8(const unsigned char * source, int length)

 {

     unsigned char a;

     const unsigned char * srcptr = source + length;

     switch (length)

     {

         default: return false;

         // Everything else falls through when "true"...

         case 4: if (((a = (*--srcptr)) < 0x80) || (a > 0xbf)) return false;

         case 3: if (((a = (*--srcptr)) < 0x80) || (a > 0xbf)) return false;

         case 2:

         {

             if ((a = (*--srcptr)) > 0xbf)

             {

                 return false;

             }

             switch (*source)

             {

                 // no fall-through in this inner switch

                 case 0xe0: if (a < 0xa0) return false; break;

                 case 0xed: if (a > 0x9f) return false; break;

                 case 0xf0: if (a < 0x90) return false; break;

                 case 0xf4: if (a > 0x8f) return false; break;

                 default:   if (a < 0x80) return false;

             }

         }

         case 1: if ((*source >= 0x80) && (*source < 0xc2)) return false;

     }

     return (*source <= 0xf4);

 }


 std::u16string UTF8ToRawBEUTF16(const AString & a_UTF8)

 {

     std::u16string UTF16;

     UTF16.reserve(a_UTF8.size() * 2);


     const unsigned char * source    = reinterpret_cast<const unsigned char *>(a_UTF8.data());

     const unsigned char * sourceEnd = source + a_UTF8.size();

     const int halfShift  = 10;  // used for shifting by 10 bits

     const unsigned int halfBase = 0x0010000UL;

     const unsigned int halfMask = 0x3ffUL;


     while (source < sourceEnd)

     {

         unsigned int ch = 0;

         unsigned short extraBytesToRead = trailingBytesForUTF8[*source];

         if (source + extraBytesToRead >= sourceEnd)

         {

             return UTF16;

         }

         // Do this check whether lenient or strict

         if (!isLegalUTF8(source, extraBytesToRead + 1))

         {

             return UTF16;

         }


         // The cases all fall through. See "Note A" below.

         switch (extraBytesToRead)

         {

             case 5: ch += *source++; ch <<= 6; /* remember, illegal UTF-8 */

             case 4: ch += *source++; ch <<= 6; /* remember, illegal UTF-8 */

             case 3: ch += *source++; ch <<= 6;

             case 2: ch += *source++; ch <<= 6;

             case 1: ch += *source++; ch <<= 6;

             case 0: ch += *source++;

         }

         ch -= offsetsFromUTF8[extraBytesToRead];


         if (ch <= UNI_MAX_BMP)

         {

             // Target is a character <= 0xFFFF

             if ((ch >= UNI_SUR_HIGH_START) && (ch <= UNI_SUR_LOW_END))

             {

                 // UTF-16 surrogate values are illegal in UTF-32

                 ch = ' ';

             }

             unsigned short v = htons(static_cast<unsigned short>(ch));

             UTF16.push_back(static_cast<char16_t>(v));

         }

         else if (ch > UNI_MAX_UTF16)

         {

             // Invalid value, replace with a space

             unsigned short v = htons(' ');

             UTF16.push_back(static_cast<char16_t>(v));

         }

         else

         {

             // target is a character in range 0xFFFF - 0x10FFFF.

             ch -= halfBase;

             auto v1 = htons(static_cast<uint16_t>((ch >> halfShift) + UNI_SUR_HIGH_START));

             auto v2 = htons(static_cast<uint16_t>((ch & halfMask) + UNI_SUR_LOW_START));

             UTF16.push_back(static_cast<char16_t>(v1));

             UTF16.push_back(static_cast<char16_t>(v2));

         }

     }

     return UTF16;

 }


 /*

 ---------------------------------------------------------------------

 Note A.

 The fall-through switches in UTF-8 reading code save a

 temp variable, some decrements & conditionals.  The switches

 are equivalent to the following loop:

 {

     int tmpBytesToRead = extraBytesToRead + 1;

     do

     {

         ch += *source++;

         --tmpBytesToRead;

         if (tmpBytesToRead)

         {

             ch <<= 6;

         }

     } while (tmpBytesToRead > 0);

 }

 ---------------------------------------------------------------------

 */


 // End of Unicode, Inc.'s code / information

 #ifdef __GNUC__

 #pragma GCC diagnostic pop

 #endif


 #define HEX(x) static_cast<char>((x) > 9 ? (x) + 'A' - 10 : (x) + '0')


 AString & CreateHexDump(AString & a_Out, const void * a_Data, size_t a_Size, size_t a_BytesPerLine)

 {

     fmt::memory_buffer Output;

     /* If formatting the data from the comment above:

         Hex holds:   "31 32 33 34 35 36 37 38 39 30 61 62 63 64 65 66 "

         Chars holds: "1234567890abcdef" */

     fmt::memory_buffer Hex, Chars;


     if (a_Size > 0)

     {

         // Same as std::ceil(static_cast<float>(a_Size) / a_BytesPerLine);

         const size_t NumLines = a_Size / a_BytesPerLine + (a_Size % a_BytesPerLine != 0);

         const size_t CharsPerLine = 14 + 4 * a_BytesPerLine;

         Output.reserve(NumLines * CharsPerLine);

     }


     for (size_t i = 0; i < a_Size; i += a_BytesPerLine)

     {

         size_t k = std::min(a_Size - i, a_BytesPerLine);

         for (size_t j = 0; j < k; j++)

         {

             Byte c = (static_cast<const Byte *>(a_Data))[i + j];

             Hex.push_back(HEX(c >> 4));

             Hex.push_back(HEX(c & 0xf));

             Hex.push_back(' ');

             Chars.push_back((c >= ' ') ? static_cast<char>(c) : '.');

         }  // for j


         // Write Hex with a dynamic fixed width

         auto HexStr = fmt::string_view(Hex.data(), Hex.size());

         auto CharsStr = fmt::string_view(Chars.data(), Chars.size());

         fmt::format_to(

             Output, "{0:08x}: {1:{2}}   {3}\n",

             i, HexStr, a_BytesPerLine * 3, CharsStr

         );


         Hex.clear();

         Chars.clear();

     }  // for i

     a_Out.append(Output.data(), Output.size());

     return a_Out;

 }


 AString EscapeString(const AString & a_Message)

 {

     AString EscapedMsg;

     size_t len = a_Message.size();

     size_t last = 0;

     EscapedMsg.reserve(len);

     for (size_t i = 0; i < len; i++)

     {

         char ch = a_Message[i];

         switch (ch)

         {

             case '\'':

             case '\"':

             case '\\':

             {

                 if (i > last)

                 {

                     EscapedMsg.append(a_Message, last, i - last);

                 }

                 EscapedMsg.push_back('\\');

                 EscapedMsg.push_back(ch);

                 last = i + 1;

                 break;

             }

         }  // switch (ch)

     }  // for i - a_Message[]

     if (len > last)

     {

         EscapedMsg.append(a_Message, last, len - last);

     }

     return EscapedMsg;

 }


 AString StripColorCodes(const AString & a_Message)

 {

     AString res(a_Message);

     size_t idx = 0;

     for (;;)

     {

         idx = res.find("\xc2\xa7", idx);

         if (idx == AString::npos)

         {

             return res;

         }

         res.erase(idx, 3);

     }

 }


 std::pair<bool, AString> URLDecode(const AString & a_Text)

 {

     AString res;

     auto len = a_Text.size();

     res.reserve(len);

     for (size_t i = 0; i < len; i++)

     {

         if (a_Text[i] == '+')

         {

             res.push_back(' ');

             continue;

         }

         if (a_Text[i] != '%')

         {

             res.push_back(a_Text[i]);

             continue;

         }

         if (i + 1 >= len)

         {

             // String too short for an encoded value

             return std::make_pair(false, AString());

         }

         if ((a_Text[i + 1] == 'u') || (a_Text[i + 1] == 'U'))

         {

             // Unicode char "%u0xxxx"

             if (i + 6 >= len)

             {

                 return std::make_pair(false, AString());

             }

             if (a_Text[i + 2] != '0')

             {

                 return std::make_pair(false, AString());

             }

             unsigned v1 = HexToDec(a_Text[i + 3]);

             unsigned v2 = HexToDec(a_Text[i + 4]);

             unsigned v3 = HexToDec(a_Text[i + 5]);

             unsigned v4 = HexToDec(a_Text[i + 6]);

             if ((v1 == 0xff) || (v2 == 0xff) || (v4 == 0xff) || (v3 == 0xff))

             {

                 // Invalid hex numbers

                 return std::make_pair(false, AString());

             }

             res.append(UnicodeCharToUtf8((v1 << 12) | (v2 << 8) | (v3 << 4) | v4));

             i = i + 6;

         }

         else

         {

             // Regular char "%xx":

             if (i + 2 >= len)

             {

                 return std::make_pair(false, AString());

             }

             auto v1 = HexToDec(a_Text[i + 1]);

             auto v2 = HexToDec(a_Text[i + 2]);

             if ((v1 == 0xff) || (v2 == 0xff))

             {

                 // Invalid hex numbers

                 return std::make_pair(false, AString());

             }

             res.push_back(static_cast<char>((v1 << 4) | v2));

             i = i + 2;

         }

     }  // for i - a_Text[i]

     return std::make_pair(true, res);

 }


 AString URLEncode(const AString & a_Text)

 {

     AString res;

     auto len = a_Text.size();

     res.reserve(len);

     static const char HEX[] = "0123456789ABCDEF";

     for (size_t i = 0; i < len; ++i)

     {

         if (isalnum(a_Text[i]))

         {

             res.push_back(a_Text[i]);

         }

         else if (a_Text[i] == ' ')

         {

             res.push_back('+');

         }

         else

         {

             res.push_back('%');

             res.push_back(HEX[static_cast<unsigned char>(a_Text[i]) >> 4]);

             res.push_back(HEX[static_cast<unsigned char>(a_Text[i]) & 0x0f]);

         }

     }

     return res;

 }


 AString ReplaceAllCharOccurrences(const AString & a_String, char a_From, char a_To)

 {

     AString res(a_String);

     std::replace(res.begin(), res.end(), a_From, a_To);

     return res;

 }


 static inline int UnBase64(char c)

 {

     if ((c >='A') && (c <= 'Z'))

     {

         return c - 'A';

     }

     if ((c >='a') && (c <= 'z'))

     {

         return c - 'a' + 26;

     }

     if ((c >= '0') && (c <= '9'))

     {

         return c - '0' + 52;

     }

     if (c == '+')

     {

         return 62;

     }

     if (c == '/')

     {

         return 63;

     }

     if (c == '=')

     {

         return -1;

     }

     return -2;

 }


 AString Base64Decode(const AString & a_Base64String)

 {

     AString res;

     size_t i, len = a_Base64String.size();

     size_t o;

     int c;

     res.resize((len * 4) / 3 + 5, 0);  // Approximate the upper bound on the result length

     for (o = 0, i = 0; i < len; i++)

     {

         c = UnBase64(a_Base64String[i]);

         if (c >= 0)

         {

             switch (o & 7)

             {

                 case 0: res[o >> 3] |= (c << 2); break;

                 case 6: res[o >> 3] |= (c >> 4); res[(o >> 3) + 1] |= (c << 4); break;

                 case 4: res[o >> 3] |= (c >> 2); res[(o >> 3) + 1] |= (c << 6); break;

                 case 2: res[o >> 3] |= c; break;

             }

             o += 6;

         }

         if (c == -1)

         {

             // Error while decoding, invalid input. Return as much as we've decoded:

             res.resize(o >> 3);

             return res;

         }

     }

     res.resize(o >> 3);

     return res;

 }


 AString Base64Encode(const AString & a_Input)

 {

     static const char BASE64[64] =

     {

         'A', 'B', 'C', 'D', 'E', 'F', 'G', 'H', 'I', 'J', 'K', 'L', 'M', 'N', 'O', 'P',

         'Q', 'R', 'S', 'T', 'U', 'V', 'W', 'X', 'Y', 'Z', 'a', 'b', 'c', 'd', 'e', 'f',

         'g', 'h', 'i', 'j', 'k', 'l', 'm', 'n', 'o', 'p', 'q', 'r', 's', 't', 'u', 'v',

         'w', 'x', 'y', 'z', '0', '1', '2', '3', '4', '5', '6', '7', '8', '9', '+', '/'

     };


     AString output;

     output.resize(((a_Input.size() + 2) / 3) * 4);


     size_t output_index = 0;

     size_t size_full24 = (a_Input.size() / 3) * 3;


     for (size_t i = 0; i < size_full24; i += 3)

     {

         output[output_index++] = BASE64[static_cast<unsigned char>(a_Input[i]) >> 2];

         output[output_index++] = BASE64[(static_cast<unsigned char>(a_Input[i]) << 4 | static_cast<unsigned char>(a_Input[i + 1]) >> 4) & 63];

         output[output_index++] = BASE64[(static_cast<unsigned char>(a_Input[i + 1]) << 2 | static_cast<unsigned char>(a_Input[i + 2]) >> 6) & 63];

         output[output_index++] = BASE64[static_cast<unsigned char>(a_Input[i + 2]) & 63];

     }


     if (size_full24 < a_Input.size())

     {

         output[output_index++] = BASE64[static_cast<unsigned char>(a_Input[size_full24]) >> 2];

         if (size_full24 + 1 == a_Input.size())

         {

             output[output_index++] = BASE64[(static_cast<unsigned char>(a_Input[size_full24]) << 4) & 63];

             output[output_index++] = '=';

         }

         else

         {

             output[output_index++] = BASE64[(static_cast<unsigned char>(a_Input[size_full24]) << 4 | static_cast<unsigned char>(a_Input[size_full24 + 1]) >> 4) & 63];

             output[output_index++] = BASE64[(static_cast<unsigned char>(a_Input[size_full24 + 1]) << 2) & 63];

         }


         output[output_index++] = '=';

     }

     ASSERT(output_index == output.size());


     return output;

 }


 short GetBEShort(const std::byte * const a_Mem)

 {

     return static_cast<short>(

         (static_cast<short>(a_Mem[0]) << 8) |

         static_cast<short>(a_Mem[1])

     );

 }


 unsigned short GetBEUShort(const char * a_Mem)

 {

     const Byte * Bytes = reinterpret_cast<const Byte *>(a_Mem);

     return static_cast<unsigned short>((Bytes[0] << 8) | Bytes[1]);

 }


 int GetBEInt(const std::byte * const a_Mem)

 {

     return

         (static_cast<int>(a_Mem[0]) << 24) |

         (static_cast<int>(a_Mem[1]) << 16) |

         (static_cast<int>(a_Mem[2]) << 8) |

         static_cast<int>(a_Mem[3])

     ;

 }


 void SetBEInt(std::byte * a_Mem, Int32 a_Value)

 {

     a_Mem[0] = std::byte(a_Value >> 24);

     a_Mem[1] = std::byte((a_Value >> 16) & 0xff);

     a_Mem[2] = std::byte((a_Value >> 8) & 0xff);

     a_Mem[3] = std::byte(a_Value & 0xff);

 }


 bool SplitZeroTerminatedStrings(const AString & a_Strings, AStringVector & a_Output)

 {

     a_Output.clear();

     size_t size = a_Strings.size();

     size_t start = 0;

     bool res = false;

     for (size_t i = 0; i < size; i++)

     {

         if (a_Strings[i] == 0)

         {

             a_Output.push_back(a_Strings.substr(start, i - start));

             start = i + 1;

             res = true;

         }

     }

     if (start < size)

     {

         a_Output.push_back(a_Strings.substr(start, size - start));

         res = true;

     }


     return res;

 }


 AStringVector MergeStringVectors(const AStringVector & a_Strings1, const AStringVector & a_Strings2)

 {

     // Initialize the resulting vector by the first vector:

     AStringVector res = a_Strings1;


     // Add each item from strings2 that is not already present:

     for (const auto & item : a_Strings2)

     {

         if (std::find(res.begin(), res.end(), item) == res.end())

         {

             res.push_back(item);

         }

     }  // for item - a_Strings2[]


     return res;

 }


 AString StringsConcat(const AStringVector & a_Strings, char a_Separator)

 {

     // If the vector is empty, return an empty string:

     if (a_Strings.empty())

     {

         return "";

     }


     // Concatenate the strings in the vector:

     AString res;

     res.append(a_Strings[0]);

     for (auto itr = a_Strings.cbegin() + 1, end = a_Strings.cend(); itr != end; ++itr)

     {

         res.push_back(a_Separator);

         res.append(*itr);

     }

     return res;

 }


 bool StringToFloat(const AString & a_String, float & a_Num)

 {

     char *err;

     a_Num = strtof(a_String.c_str(), &err);

     return (*err == 0);

 }


 bool IsOnlyWhitespace(const AString & a_String)

 {

     return std::all_of(a_String.cbegin(), a_String.cend(), isspace);

 }

Globals.h

Int32
signed int Int32
Definition: Globals.h:152

ASSERT
#define ASSERT(x)
Definition: Globals.h:276

Byte
unsigned char Byte
Definition: Globals.h:161

URLDecode
std::pair< bool, AString > URLDecode(const AString &a_Text)
URL-Decodes the given string.
Definition: StringUtils.cpp:719

GetBEShort
short GetBEShort(const std::byte *const a_Mem)
Reads two bytes from the specified memory location and interprets them as BigEndian short.
Definition: StringUtils.cpp:949

StringSplitAndTrim
AStringVector StringSplitAndTrim(const AString &str, const AString &delim)
Split the string at any of the listed delimiters and trim each value.
Definition: StringUtils.cpp:169

isLegalUTF8
static bool isLegalUTF8(const unsigned char *source, int length)
Definition: StringUtils.cpp:476

InPlaceLowercase
AString & InPlaceLowercase(AString &s)
In-place string conversion to lowercase.
Definition: StringUtils.cpp:224

TrimString
AString TrimString(const AString &str)
Trims whitespace at both ends of the string.
Definition: StringUtils.cpp:190

UNI_SUR_LOW_START
#define UNI_SUR_LOW_START
Definition: StringUtils.cpp:443

offsetsFromUTF8
static const unsigned int offsetsFromUTF8[6]
Definition: StringUtils.cpp:466

RawBEToUTF8
AString & RawBEToUTF8(const char *a_RawData, size_t a_NumShorts, AString &a_UTF8)
Converts a stream of BE shorts into UTF-8 string; returns a_UTF8.
Definition: StringUtils.cpp:342

URLEncode
AString URLEncode(const AString &a_Text)
URL-encodes the given string.
Definition: StringUtils.cpp:789

StrToLower
AString StrToLower(const AString &s)
Returns a lower-cased copy of the string.
Definition: StringUtils.cpp:244

GetBEInt
int GetBEInt(const std::byte *const a_Mem)
Reads four bytes from the specified memory location and interprets them as BigEndian int.
Definition: StringUtils.cpp:971

InPlaceUppercase
AString & InPlaceUppercase(AString &s)
In-place string conversion to uppercase.
Definition: StringUtils.cpp:234

EscapeString
AString EscapeString(const AString &a_Message)
Returns a copy of a_Message with all quotes and backslashes escaped by a backslash.
Definition: StringUtils.cpp:663

ReplaceAllCharOccurrences
AString ReplaceAllCharOccurrences(const AString &a_String, char a_From, char a_To)
Replaces all occurrences of char a_From inside a_String with char a_To.
Definition: StringUtils.cpp:819

UNI_SUR_HIGH_START
#define UNI_SUR_HIGH_START
Definition: StringUtils.cpp:442

StringSplit
AStringVector StringSplit(const AString &str, const AString &delim)
Split the string at any of the listed delimiters.
Definition: StringUtils.cpp:55

SplitZeroTerminatedStrings
bool SplitZeroTerminatedStrings(const AString &a_Strings, AStringVector &a_Output)
Splits a string that has embedded \0 characters, on those characters.
Definition: StringUtils.cpp:997

Base64Decode
AString Base64Decode(const AString &a_Base64String)
Decodes a Base64-encoded string into the raw data.
Definition: StringUtils.cpp:864

SetBEInt
void SetBEInt(std::byte *a_Mem, Int32 a_Value)
Writes four bytes to the specified memory location so that they interpret as BigEndian int.
Definition: StringUtils.cpp:985

ReplaceString
void ReplaceString(AString &iHayStack, const AString &iNeedle, const AString &iReplaceWith)
Replaces each occurence of iNeedle in iHayStack with iReplaceWith.
Definition: StringUtils.cpp:312

UNI_MAX_UTF16
#define UNI_MAX_UTF16
Definition: StringUtils.cpp:441

UnBase64
static int UnBase64(char c)
Converts one Hex character in a Base64 encoding into the data value.
Definition: StringUtils.cpp:831

StripColorCodes
AString StripColorCodes(const AString &a_Message)
Removes all control codes used by MC for colors and styles.
Definition: StringUtils.cpp:700

CreateHexDump
AString & CreateHexDump(AString &a_Out, const void *a_Data, size_t a_Size, size_t a_BytesPerLine)
format binary data this way: 00001234: 31 32 33 34 35 36 37 38 39 30 61 62 63 64 65 66 1234567890abcd...
Definition: StringUtils.cpp:616

StringSplitWithQuotes
AStringVector StringSplitWithQuotes(const AString &str, const AString &delim)
Split the string at any of the listed delimiters.
Definition: StringUtils.cpp:76

StringsConcat
AString StringsConcat(const AStringVector &a_Strings, char a_Separator)
Concatenates the specified strings into a single string, separated by the specified separator charact...
Definition: StringUtils.cpp:1046

NoCaseCompare
int NoCaseCompare(const AString &s1, const AString &s2)
Case-insensitive string comparison.
Definition: StringUtils.cpp:268

ReplaceURL
void ReplaceURL(AString &iHayStack, const AString &iNeedle, const AString &iReplaceWith)
Replaces each occurence of iNeedle in iHayStack with iReplaceWith, after URL-encoding iReplaceWith.
Definition: StringUtils.cpp:332

HexToDec
static unsigned char HexToDec(char a_HexChar)
Returns the value of the single hex digit.
Definition: StringUtils.cpp:21

MergeStringVectors
AStringVector MergeStringVectors(const AStringVector &a_Strings1, const AStringVector &a_Strings2)
Merges the two vectors of strings, removing duplicate entries from the second vector.
Definition: StringUtils.cpp:1025

StrToUpper
AString StrToUpper(const AString &s)
Returns an upper-cased copy of the string.
Definition: StringUtils.cpp:256

UnicodeCharToUtf8
AString UnicodeCharToUtf8(unsigned a_UnicodeChar)
Converts a unicode character to its UTF8 representation.
Definition: StringUtils.cpp:357

UNI_SUR_LOW_END
#define UNI_SUR_LOW_END
Definition: StringUtils.cpp:444

StringJoin
AString StringJoin(const AStringVector &a_Strings, const AString &a_Delimeter)
Join a list of strings with the given delimiter between entries.
Definition: StringUtils.cpp:133

RateCompareString
size_t RateCompareString(const AString &s1, const AString &s2)
Case-insensitive string comparison that returns a rating of equal-ness between [0 - s1....
Definition: StringUtils.cpp:281

StringToFloat
bool StringToFloat(const AString &a_String, float &a_Num)
Converts a string into a float.
Definition: StringUtils.cpp:1069

UNI_MAX_BMP
#define UNI_MAX_BMP
Definition: StringUtils.cpp:440

IsOnlyWhitespace
bool IsOnlyWhitespace(const AString &a_String)
Returns true if only whitespace characters are present in the string.
Definition: StringUtils.cpp:1080

Base64Encode
AString Base64Encode(const AString &a_Input)
Encodes a string into Base64.
Definition: StringUtils.cpp:900

UTF8ToRawBEUTF16
std::u16string UTF8ToRawBEUTF16(const AString &a_UTF8)
Converts a UTF-8 string into a UTF-16 BE string.
Definition: StringUtils.cpp:511

trailingBytesForUTF8
static const Byte trailingBytesForUTF8[256]
Definition: StringUtils.cpp:450

GetBEUShort
unsigned short GetBEUShort(const char *a_Mem)
Reads two bytes from the specified memory location and interprets them as BigEndian unsigned short.
Definition: StringUtils.cpp:961

HEX
#define HEX(x)
Definition: StringUtils.cpp:610

AStringVector
std::vector< AString > AStringVector
Definition: StringUtils.h:12

AString
std::string AString
Definition: StringUtils.h:11