1 #ifndef CONVERSION_UTILITIES_STRINGCONVERSION_H 2 #define CONVERSION_UTILITIES_STRINGCONVERSION_H 7 #include "../misc/traits.h" 11 #include <initializer_list> 31 std::free(stringData);
38 using StringData = std::pair<std::unique_ptr<char[], StringDataDeleter>, std::size_t>;
42 const char *fromCharset,
const char *toCharset,
const char *inputBuffer, std::size_t inputBufferSize,
float outputBufferSizeFactor = 1.0f);
65 template <
class Container = std::initializer_list<std::
string>>
66 typename Container::value_type
joinStrings(
const Container &strings,
67 const typename Container::value_type &delimiter =
typename Container::value_type(),
bool omitEmpty =
false,
68 const typename Container::value_type &leftClosure =
typename Container::value_type(),
69 const typename Container::value_type &rightClosure =
typename Container::value_type())
71 typename Container::value_type res;
72 if (!strings.size()) {
75 std::size_t entries = 0, size = 0;
76 for (
const auto &str : strings) {
77 if (omitEmpty && str.empty()) {
86 size += (entries * leftClosure.size()) + (entries * rightClosure.size()) + ((entries - 1) * delimiter.size());
88 for (
const auto &str : strings) {
89 if (omitEmpty && str.empty()) {
93 res.append(delimiter);
95 res.append(leftClosure);
97 res.append(rightClosure);
105 template <
class Container = std::initializer_list<std::
string>>
inline std::vector<std::string>
toMultiline(
const Container &arrayOfLines)
128 template <
class Container = std::list<std::
string>>
129 Container
splitString(
const typename Container::value_type &
string,
const typename Container::value_type &delimiter,
135 for (
typename Container::value_type::size_type
i = 0, end =
string.size(), delimPos;
i < end;
i = delimPos + delimiter.size()) {
136 delimPos =
string.find(delimiter,
i);
137 if (!merge && maxParts >= 0 && res.size() ==
static_cast<typename Container::value_type::size_type
>(maxParts)) {
144 delimPos = Container::value_type::npos;
146 if (delimPos == Container::value_type::npos) {
147 delimPos =
string.size();
151 res.back().append(delimiter);
152 res.back().append(
string.substr(
i, delimPos -
i));
155 res.emplace_back(
string.substr(
i, delimPos -
i));
175 template <
class Container = std::list<std::
string>>
176 Container
splitStringSimple(
const typename Container::value_type &
string,
const typename Container::value_type &delimiter,
int maxParts = -1)
180 for (
typename Container::value_type::size_type
i = 0, end =
string.size(), delimPos;
i < end;
i = delimPos + delimiter.size()) {
181 delimPos =
string.find(delimiter,
i);
182 if (maxParts >= 0 && res.size() ==
static_cast<typename Container::value_type::size_type
>(maxParts)) {
183 delimPos = Container::value_type::npos;
185 if (delimPos == Container::value_type::npos) {
186 delimPos =
string.size();
188 res.emplace_back(
string.substr(
i, delimPos -
i));
196 template <
class Container = std::vector<std::
string>>
inline std::vector<std::string>
toArrayOfLines(
const std::string &multilineString)
204 template <
typename StringType>
bool startsWith(
const StringType &str,
const StringType &phrase)
206 if (str.size() < phrase.size()) {
209 for (
auto stri = str.cbegin(), strend = str.cend(), phrasei = phrase.cbegin(), phraseend = phrase.cend(); stri != strend; ++stri, ++phrasei) {
210 if (phrasei == phraseend) {
212 }
else if (*stri != *phrasei) {
222 template <
typename StringType>
bool startsWith(
const StringType &str,
const typename StringType::value_type *phrase)
224 for (
auto stri = str.cbegin(), strend = str.cend(); stri != strend; ++stri, ++phrase) {
227 }
else if (*stri != *phrase) {
238 template <
typename StringType>
bool containsSubstrings(
const StringType &str, std::initializer_list<StringType> substrings)
240 typename StringType::size_type currentPos = 0;
241 for (
const auto &substr : substrings) {
242 if ((currentPos = str.find(substr, currentPos)) == StringType::npos) {
245 currentPos += substr.size();
254 template <
typename StringType>
255 bool containsSubstrings(
const StringType &str, std::initializer_list<const typename StringType::value_type *> substrings)
257 typename StringType::size_type currentPos = 0;
258 for (
const auto *substr : substrings) {
259 if ((currentPos = str.find(substr, currentPos)) == StringType::npos) {
262 currentPos += std::strlen(substr);
270 template <
typename StringType>
void findAndReplace(StringType &str,
const StringType &find,
const StringType &replace)
272 for (
typename StringType::size_type
i = 0; (
i = str.find(find,
i)) != StringType::npos;
i += replace.size()) {
273 str.replace(
i, find.size(), replace);
283 template <
typename CharType> constexpr CharType
digitToChar(CharType digit)
285 return digit <= 9 ? (digit +
'0') : (digit +
'A' - 10);
294 template <
typename IntegralType,
class StringType = std::string,
296 StringType
numberToString(IntegralType number,
typename StringType::value_type base = 10)
298 std::size_t resSize = 0;
299 for (
auto n = number; n; n /= base, ++resSize)
302 res.reserve(resSize);
304 res.insert(res.begin(), digitToChar<typename StringType::value_type>(number % base));
316 template <
typename IntegralType,
class StringType = std::string,
318 StringType
numberToString(IntegralType number,
typename StringType::value_type base = 10)
320 const bool negative = number < 0;
323 number = -number, resSize = 1;
327 for (
auto n = number; n; n /= base, ++resSize)
330 res.reserve(resSize);
332 res.insert(res.begin(), digitToChar<typename StringType::value_type>(number % base));
336 res.insert(res.begin(),
'-');
349 template <
typename FloatingType,
class StringType = std::
string, Traits::EnableIf<std::is_
floating_po
int<FloatingType>> * =
nullptr>
350 StringType
numberToString(FloatingType number,
typename StringType::value_type base = 10)
352 std::basic_stringstream<typename StringType::value_type> ss;
353 ss << std::setbase(base) << number;
362 template <
typename CharType> CharType
charToDigit(CharType character, CharType base)
365 if (character >=
'0' && character <=
'9') {
366 res = character -
'0';
367 }
else if (character >=
'a' && character <=
'z') {
368 res = character -
'a' + 10;
369 }
else if (character >=
'A' && character <=
'Z') {
370 res = character -
'A' + 10;
375 std::string errorMsg;
376 errorMsg.reserve(36);
377 errorMsg +=
"The character \"";
378 errorMsg += character;
379 errorMsg +=
"\" is no valid digit.";
391 template <
typename IntegralType,
typename StringType, Traits::EnableIf<std::is_
integral<IntegralType>, std::is_
unsigned<IntegralType>> * =
nullptr>
392 IntegralType
stringToNumber(
const StringType &
string,
typename StringType::value_type base = 10)
394 IntegralType result = 0;
395 for (
const auto &c :
string) {
400 result += charToDigit<typename StringType::value_type>(c, base);
413 template <
typename IntegralType,
class StringType, Traits::EnableIf<std::is_
integral<IntegralType>, std::is_
signed<IntegralType>> * =
nullptr>
414 IntegralType
stringToNumber(
const StringType &
string,
typename StringType::value_type base = 10)
416 auto i =
string.begin();
417 auto end =
string.end();
418 for (;
i != end && *
i ==
' '; ++
i)
423 const bool negative = (*
i ==
'-');
427 IntegralType result = 0;
428 for (;
i != end; ++
i) {
433 result += charToDigit<typename StringType::value_type>(*
i, base);
435 return negative ? -result : result;
448 template <
typename FloatingType,
class StringType, Traits::EnableIf<std::is_
floating_po
int<FloatingType>> * =
nullptr>
449 FloatingType
stringToNumber(
const StringType &
string,
typename StringType::value_type base = 10)
451 std::basic_stringstream<typename StringType::value_type> ss;
452 ss << std::setbase(base) << string;
454 if ((ss >> result) && ss.eof()) {
457 std::string errorMsg;
458 errorMsg.reserve(42 +
string.size());
459 errorMsg +=
"The string \"";
461 errorMsg +=
"\" is no valid floating number.";
473 template <
typename IntegralType,
class CharType, Traits::EnableIf<std::is_
integral<IntegralType>, std::is_
unsigned<IntegralType>> * =
nullptr>
476 IntegralType result = 0;
477 for (; *string; ++string) {
478 if (*
string ==
' ') {
482 result += charToDigit<CharType>(*string, base);
497 template <
typename FloatingType,
class CharType, Traits::EnableIf<std::is_
floating_po
int<FloatingType>> * =
nullptr>
500 std::basic_stringstream<CharType> ss;
501 ss << std::setbase(base) << string;
503 if ((ss >> result) && ss.eof()) {
506 std::string errorMsg;
507 errorMsg.reserve(42 + std::char_traits<CharType>::length(
string));
508 errorMsg +=
"The string \"";
510 errorMsg +=
"\" is no valid floating number.";
521 template <
typename IntegralType,
class CharType, Traits::EnableIf<std::is_
integral<IntegralType>, std::is_
unsigned<IntegralType>> * =
nullptr>
522 IntegralType
bufferToNumber(
const CharType *
string, std::size_t size,
unsigned char base = 10)
524 IntegralType result = 0;
525 for (
const CharType *end =
string + size;
string != end; ++string) {
526 if (*
string ==
' ') {
530 result += charToDigit<CharType>(*string, base);
542 template <
typename IntegralType,
class CharType, Traits::EnableIf<std::is_
integral<IntegralType>, std::is_
signed<IntegralType>> * =
nullptr>
543 IntegralType
stringToNumber(
const CharType *
string,
unsigned char base = 10)
548 for (; *
string && *
string ==
' '; ++string)
553 const bool negative = (*
string ==
'-');
557 IntegralType result = 0;
558 for (; *string; ++string) {
559 if (*
string ==
' ') {
563 result += charToDigit<CharType>(*string, base);
565 return negative ? -result : result;
575 template <
typename IntegralType,
class CharType, Traits::EnableIf<std::is_
integral<IntegralType>, std::is_
signed<IntegralType>> * =
nullptr>
576 IntegralType
bufferToNumber(
const CharType *
string, std::size_t size,
unsigned char base = 10)
581 const CharType *end =
string + size;
582 for (;
string != end && *
string ==
' '; ++string)
587 const bool negative = (*
string ==
'-');
591 IntegralType result = 0;
592 for (;
string != end; ++string) {
593 if (*
string ==
' ') {
597 result += charToDigit<CharType>(*string, base);
599 return negative ? -result : result;
613 char buffer[
sizeof(T)];
614 ConversionUtilities::BE::getBytes(integer, buffer);
615 return std::string(buffer + startOffset,
sizeof(T) - startOffset);
624 #endif // CONVERSION_UTILITIES_STRINGCONVERSION_H CPP_UTILITIES_EXPORT StringData convertUtf8ToUtf16LE(const char *inputBuffer, std::size_t inputBufferSize)
Converts the specified UTF-8 string to UTF-16 (little-endian).
bool startsWith(const StringType &str, const StringType &phrase)
Returns whether str starts with phrase.
void operator()(char *stringData)
Deletes the specified stringData with std::free(), because the memory has been allocated using std::m...
CPP_UTILITIES_EXPORT std::string encodeBase64(const byte *data, uint32 dataSize)
Encodes the specified data to Base64.
std::pair< std::unique_ptr< char[], StringDataDeleter >, std::size_t > StringData
Type used to return string encoding conversion result.
IntegralType stringToNumber(const StringType &string, typename StringType::value_type base=10)
Converts the given string to an unsigned number assuming string uses the specified base...
Container splitStringSimple(const typename Container::value_type &string, const typename Container::value_type &delimiter, int maxParts=-1)
Splits the given string (which might also be a string view) at the specified delimiter.
bool containsSubstrings(const StringType &str, std::initializer_list< StringType > substrings)
Returns whether str contains the specified substrings.
The ConversionException class is thrown by the various conversion functions of this library when a co...
std::vector< std::string > toArrayOfLines(const std::string &multilineString)
Converts the specified multilineString to an array of lines.
CPP_UTILITIES_EXPORT StringData convertUtf16BEToUtf8(const char *inputBuffer, std::size_t inputBufferSize)
Converts the specified UTF-16 (big-endian) string to UTF-8.
CPP_UTILITIES_EXPORT void truncateString(std::string &str, char terminationChar='\0')
Truncates all characters after the first occurrence of the specified terminationChar and the terminat...
StringType numberToString(IntegralType number, typename StringType::value_type base=10)
Converts the given number to its equivalent string representation using the specified base...
std::uint64_t uint64
unsigned 64-bit integer
The StringDataDeleter struct deletes the data of a StringData instance.
typename std::enable_if< All< Condition... >::value, Detail::Enabler >::type EnableIf
Shortcut for std::enable_if to omit ::value and ::type.
std::string interpretIntegerAsString(T integer, int startOffset=0)
Interprets the given integer at the specified position as std::string using the specified byte order...
CPP_UTILITIES_EXPORT StringData convertUtf8ToUtf16BE(const char *inputBuffer, std::size_t inputBufferSize)
Converts the specified UTF-8 string to UTF-16 (big-endian).
EmptyPartsTreat
Specifies the role of empty parts when splitting strings.
CPP_UTILITIES_EXPORT StringData convertUtf8ToLatin1(const char *inputBuffer, std::size_t inputBufferSize)
Converts the specified UTF-8 string to Latin-1.
void findAndReplace(StringType &str, const StringType &find, const StringType &replace)
Replaces all occurrences of find with replace in the specified str.
Contains several functions providing conversions between different data types.
std::uint32_t uint32
unsigned 32-bit integer
IntegralType bufferToNumber(const CharType *string, std::size_t size, unsigned char base=10)
Converts the given string of size characters to an unsigned numeric value using the specified base...
CPP_UTILITIES_EXPORT StringData convertUtf16LEToUtf8(const char *inputBuffer, std::size_t inputBufferSize)
Converts the specified UTF-16 (little-endian) string to UTF-8.
CharType charToDigit(CharType character, CharType base)
Returns the number/digit of the specified character representation using the specified base...
Container::value_type joinStrings(const Container &strings, const typename Container::value_type &delimiter=typename Container::value_type(), bool omitEmpty=false, const typename Container::value_type &leftClosure=typename Container::value_type(), const typename Container::value_type &rightClosure=typename Container::value_type())
Joins the given strings using the specified delimiter.
CPP_UTILITIES_EXPORT StringData convertString(const char *fromCharset, const char *toCharset, const char *inputBuffer, std::size_t inputBufferSize, float outputBufferSizeFactor=1.0f)
Converts the specified string from one character set to another.
std::uint8_t byte
unsigned byte
CPP_UTILITIES_EXPORT StringData convertLatin1ToUtf8(const char *inputBuffer, std::size_t inputBufferSize)
Converts the specified Latin-1 string to UTF-8.
std::vector< std::string > toMultiline(const Container &arrayOfLines)
Converts the specified arrayOfLines to a multiline string.
Container splitString(const typename Container::value_type &string, const typename Container::value_type &delimiter, EmptyPartsTreat emptyPartsRole=EmptyPartsTreat::Keep, int maxParts=-1)
Splits the given string at the specified delimiter.
CPP_UTILITIES_EXPORT std::string dataSizeToString(uint64 sizeInByte, bool includeByte=false)
Converts the specified data size in bytes to its equivalent std::string representation.
#define CPP_UTILITIES_EXPORT
Marks the symbol to be exported by the c++utilities library.
CPP_UTILITIES_EXPORT std::pair< std::unique_ptr< byte[]>, uint32 > decodeBase64(const char *encodedStr, const uint32 strSize)
Decodes the specified Base64 encoded string.
constexpr CharType digitToChar(CharType digit)
Returns the character representation of the specified digit.
CPP_UTILITIES_EXPORT std::string bitrateToString(double speedInKbitsPerSecond, bool useByteInsteadOfBits=false)
Converts the specified bitrate in kbit/s to its equivalent std::string representation.