3 #ifndef CPP_UTILITIES_NO_THREAD_LOCAL
4 #include "../feature_detection/features.h"
6 #define CPP_UTILITIES_THREAD_LOCAL
19 #ifdef PLATFORM_WINDOWS
// Call operators of four small functors, each mapping a size_t to a size_t.
// NOTE(review): presumably these are the size-hint functors (Keep, Double, Half, Factor)
// used as ConversionDescriptor template arguments; the struct headers and the first
// three bodies are not visible here, so the pairing cannot be confirmed from this span.
30 size_t operator()(
size_t value)
36 size_t operator()(
size_t value)
42 size_t operator()(
size_t value)
50 size_t operator()(
size_t value)
// Scales value by `factor` in float arithmetic; converting the product back to size_t
// drops the fractional part.
52 return static_cast<size_t>(
static_cast<float>(value) * factor);
// Couples an iconv conversion descriptor (m_ptr) with an OutputSizeHint functor that
// is called with a byte count to decide how large the output buffer should be.
// NOTE(review): the template parameter below reads "OutputSizeH" / "int" across two
// lines, while the rest of the class uses OutputSizeHint; this looks like a broken
// token - confirm and repair.
57 template <
class OutputSizeH
int>
class ConversionDescriptor {
// Opens the descriptor with a default-constructed size hint.
// iconv_open() takes the target charset first, hence (toCharset, fromCharset).
// Throws ConversionException when iconv_open() returns (iconv_t)-1.
59 ConversionDescriptor(
const char *fromCharset,
const char *toCharset)
60 : m_ptr(iconv_open(toCharset, fromCharset))
61 , m_outputSizeHint(OutputSizeHint())
63 if (m_ptr ==
reinterpret_cast<iconv_t
>(-1)) {
64 throw ConversionException(
"Unable to allocate descriptor for character set conversion.");
// Same as above, but stores the size hint supplied by the caller.
68 ConversionDescriptor(
const char *fromCharset,
const char *toCharset, OutputSizeHint outputSizeHint)
69 : m_ptr(iconv_open(toCharset, fromCharset))
70 , m_outputSizeHint(outputSizeHint)
72 if (m_ptr ==
reinterpret_cast<iconv_t
>(-1)) {
73 throw ConversionException(
"Unable to allocate descriptor for character set conversion.");
// NOTE(review): the destructor body is not visible here.
77 ~ConversionDescriptor()
// Body of the conversion routine (its signature is not visible here; it reads
// inputBuffer and inputBufferSize).
// The output buffer is allocated with malloc() using the size that the hint functor
// returns for the input size.
86 size_t inputBytesLeft = inputBufferSize;
87 size_t outputSize = m_outputSizeHint(inputBufferSize);
88 size_t outputBytesLeft = outputSize;
// NOTE(review): no null check of the malloc() result is visible here.
89 char *outputBuffer =
reinterpret_cast<char *
>(malloc(outputSize));
92 char *currentOutputOffset = outputBuffer;
// On every further pass the write position is recomputed from outputBuffer, because
// realloc() below may have moved the buffer.
93 for (;; currentOutputOffset = outputBuffer + bytesWritten) {
// const_cast is needed because iconv() takes its input as char **.
// NOTE(review): "¤tOutputOffset" below looks like a mis-decoded "&currentOutputOffset"
// (HTML entity "&curren"); confirm and repair.
94 bytesWritten = iconv(m_ptr,
const_cast<char **
>(&inputBuffer), &inputBytesLeft, ¤tOutputOffset, &outputBytesLeft);
// iconv() reports failure as (size_t)-1 and sets errno.
95 if (bytesWritten ==
static_cast<size_t>(-1)) {
// EINVAL: record how many output bytes have been produced so far.
96 if (errno == EINVAL) {
98 bytesWritten =
static_cast<size_t>(currentOutputOffset - outputBuffer);
100 }
else if (errno == E2BIG) {
// E2BIG: remember the current offset, enlarge the buffer by the hint for the
// remaining input and recompute the free space.
102 bytesWritten =
static_cast<size_t>(currentOutputOffset - outputBuffer);
103 outputBytesLeft = (outputSize += m_outputSizeHint(inputBytesLeft)) - bytesWritten;
// NOTE(review): the realloc() result is assigned straight to outputBuffer; if it
// returned null the previous allocation would no longer be reachable.
104 outputBuffer =
reinterpret_cast<char *
>(realloc(outputBuffer, outputSize));
// NOTE(review): the condition guarding this throw is not visible here.
108 throw ConversionException(
"Invalid multibyte sequence in the input.");
// Hands the buffer over to a unique_ptr using StringDataDeleter and returns it together
// with the number of bytes between the buffer start and the current write position.
115 return StringData(std::unique_ptr<
char[], StringDataDeleter>(outputBuffer), currentOutputOffset - outputBuffer);
// Functor called with a byte count to size and grow the output buffer.
120 OutputSizeHint m_outputSizeHint;
// Parameter list and body of the generic charset conversion (the return type and
// function name are not visible here).
// Builds a temporary ConversionDescriptor<Factor> from the two charsets and
// outputBufferSizeFactor, then converts inputBufferSize bytes of inputBuffer with it.
135 const char *fromCharset,
const char *toCharset,
const char *inputBuffer, std::size_t inputBufferSize,
float outputBufferSizeFactor)
137 return ConversionDescriptor<Factor>(fromCharset, toCharset, outputBufferSizeFactor).convertString(inputBuffer, inputBufferSize);
// Body of the UTF-8 -> UTF-16LE conversion (its signature is not visible here).
// The descriptor is built as (from, to) = ("UTF-8", "UTF-16LE") with the Double size hint.
// NOTE(review): CPP_UTILITIES_THREAD_LOCAL presumably expands to thread_local where
// supported, so that the descriptor is reused per thread - confirm.
145 CPP_UTILITIES_THREAD_LOCAL ConversionDescriptor<Double> descriptor(
"UTF-8",
"UTF-16LE");
146 return descriptor.convertString(inputBuffer, inputBufferSize);
// Body of the UTF-16LE -> UTF-8 conversion (its signature is not visible here).
// The descriptor is built as (from, to) = ("UTF-16LE", "UTF-8") with the Half size hint.
// NOTE(review): CPP_UTILITIES_THREAD_LOCAL presumably expands to thread_local where
// supported, so that the descriptor is reused per thread - confirm.
154 CPP_UTILITIES_THREAD_LOCAL ConversionDescriptor<Half> descriptor(
"UTF-16LE",
"UTF-8");
155 return descriptor.convertString(inputBuffer, inputBufferSize);
// Body of the UTF-8 -> UTF-16BE conversion (its signature is not visible here).
// The descriptor is built as (from, to) = ("UTF-8", "UTF-16BE") with the Double size hint.
// NOTE(review): CPP_UTILITIES_THREAD_LOCAL presumably expands to thread_local where
// supported, so that the descriptor is reused per thread - confirm.
163 CPP_UTILITIES_THREAD_LOCAL ConversionDescriptor<Double> descriptor(
"UTF-8",
"UTF-16BE");
164 return descriptor.convertString(inputBuffer, inputBufferSize);
// Body of the UTF-16BE -> UTF-8 conversion (its signature is not visible here).
// The descriptor is built as (from, to) = ("UTF-16BE", "UTF-8") with the Half size hint.
// NOTE(review): CPP_UTILITIES_THREAD_LOCAL presumably expands to thread_local where
// supported, so that the descriptor is reused per thread - confirm.
172 CPP_UTILITIES_THREAD_LOCAL ConversionDescriptor<Half> descriptor(
"UTF-16BE",
"UTF-8");
173 return descriptor.convertString(inputBuffer, inputBufferSize);
// Body of the Latin-1 -> UTF-8 conversion (its signature is not visible here).
// The descriptor is built as (from, to) = ("ISO-8859-1", "UTF-8") with the Keep size hint.
// NOTE(review): CPP_UTILITIES_THREAD_LOCAL presumably expands to thread_local where
// supported, so that the descriptor is reused per thread - confirm.
181 CPP_UTILITIES_THREAD_LOCAL ConversionDescriptor<Keep> descriptor(
"ISO-8859-1",
"UTF-8");
182 return descriptor.convertString(inputBuffer, inputBufferSize);
// Body of the UTF-8 -> Latin-1 conversion (its signature is not visible here).
// The descriptor is built as (from, to) = ("UTF-8", "ISO-8859-1") with the Keep size hint.
// NOTE(review): CPP_UTILITIES_THREAD_LOCAL presumably expands to thread_local where
// supported, so that the descriptor is reused per thread - confirm.
190 CPP_UTILITIES_THREAD_LOCAL ConversionDescriptor<Keep> descriptor(
"UTF-8",
"ISO-8859-1");
191 return descriptor.convertString(inputBuffer, inputBufferSize);
194 #ifdef PLATFORM_WINDOWS
// Converts a UTF-8 (CP_UTF8) byte sequence to a wide string via MultiByteToWideChar().
// ec receives the GetLastError() code (system category) when either API call fails.
// inputBufferSize is passed straight through to MultiByteToWideChar().
// NOTE(review): the return statements are not visible here.
201 WideStringData convertMultiByteToWide(std::error_code &ec,
const char *inputBuffer,
int inputBufferSize)
204 WideStringData widePath;
// First call with no output buffer: asks only for the required number of wide characters.
205 widePath.second = MultiByteToWideChar(CP_UTF8, 0, inputBuffer, inputBufferSize,
nullptr, 0);
206 if (widePath.second <= 0) {
207 ec = std::error_code(GetLastError(), std::system_category());
// Allocate exactly the reported number of wide characters, then convert for real.
211 widePath.first = make_unique<wchar_t[]>(
static_cast<size_t>(widePath.second));
212 widePath.second = MultiByteToWideChar(CP_UTF8, 0, inputBuffer, inputBufferSize, widePath.first.get(), widePath.second);
// On failure of the second call the allocated buffer is released again.
213 if (widePath.second <= 0) {
214 ec = std::error_code(GetLastError(), std::system_category());
215 widePath.first.reset();
// std::string overload: forwards to the (ec, pointer, size) overload.
// The size passed on is size() + 1 as long as size() is below INT_MAX - 1, which makes
// the count include the terminating null of data(); otherwise -1 is passed, which
// MultiByteToWideChar() interprets as "input is null-terminated".
224 WideStringData convertMultiByteToWide(std::error_code &ec,
const std::string &inputBuffer)
226 return convertMultiByteToWide(
227 ec, inputBuffer.data(), inputBuffer.size() < (
numeric_limits<int>::max() - 1) ?
static_cast<int>(inputBuffer.size() + 1) : -1);
// Overload without an error_code parameter: forwards to the (ec, pointer, size) overload.
// NOTE(review): `ec` is declared on a line not visible here; presumably a local
// std::error_code whose value is not reported to the caller - confirm.
236 WideStringData convertMultiByteToWide(
const char *inputBuffer,
int inputBufferSize)
239 return convertMultiByteToWide(ec, inputBuffer, inputBufferSize);
// Overload without an error_code parameter: forwards to the (ec, std::string) overload.
// NOTE(review): `ec` is declared on a line not visible here; presumably a local
// std::error_code whose value is not reported to the caller - confirm.
246 WideStringData convertMultiByteToWide(
const std::string &inputBuffer)
249 return convertMultiByteToWide(ec, inputBuffer);
// Body of the truncation helper (its signature is not visible here; it uses str and
// terminationChar).
// Cuts str at the first occurrence of terminationChar, so that character and everything
// after it are removed; str is left untouched when the character does not occur.
259 string::size_type firstNullByte = str.find(terminationChar);
260 if (firstNullByte != string::npos) {
261 str.resize(firstNullByte);
// Body of the data-size formatter (its signature is not visible here; it uses sizeInByte
// and includeByte).
// Floating-point values are written in fixed notation with two decimals; the plain
// integer insertions of sizeInByte are not affected by that setting.
272 stringstream res(stringstream::in | stringstream::out);
273 res.setf(ios::fixed, ios::floatfield);
274 res << setprecision(2);
// The unit is chosen by powers of 1024: bytes, KiB (2^10), MiB (2^20), GiB (2^30), TiB (2^40).
275 if (sizeInByte < 1024LL) {
276 res << sizeInByte <<
" bytes";
277 }
else if (sizeInByte < 1048576LL) {
278 res << (static_cast<double>(sizeInByte) / 1024.0) <<
" KiB";
279 }
else if (sizeInByte < 1073741824LL) {
280 res << (static_cast<double>(sizeInByte) / 1048576.0) <<
" MiB";
281 }
else if (sizeInByte < 1099511627776LL) {
282 res << (static_cast<double>(sizeInByte) / 1073741824.0) <<
" GiB";
284 res << (static_cast<double>(sizeInByte) / 1099511627776.0) <<
" TiB";
// Optionally appends the exact byte count in parentheses.
// NOTE(review): the comparison is strict, so a size of exactly 1024 is printed as KiB
// but does not get the byte suffix - confirm whether that is intended.
286 if (includeByte && sizeInByte > 1024LL) {
287 res <<
' ' <<
'(' << sizeInByte <<
" byte)";
// Body of the bitrate formatter (its signature is not visible here; it uses
// bitrateInKbitsPerSecond and useIecBinaryPrefixes).
// Numbers are written with a precision of 3 in the stream's default float notation.
304 stringstream res(stringstream::in | stringstream::out);
305 res << setprecision(3);
// NaN input is reported as text instead of a number.
306 if (std::isnan(bitrateInKbitsPerSecond)) {
307 res <<
"indeterminable";
308 }
else if (useIecBinaryPrefixes) {
// Byte-based output: 1 kbit/s = 1000 bit/s = 125 byte/s.
// NOTE(review): the factors and thresholds below are powers of 1000 although the
// labels are IEC binary prefixes (KiB/MiB/GiB) - confirm whether this is intended.
309 if (bitrateInKbitsPerSecond < 8.0) {
310 res << (bitrateInKbitsPerSecond * 125.0) <<
" byte/s";
311 }
else if (bitrateInKbitsPerSecond < 8000.0) {
312 res << (bitrateInKbitsPerSecond * 0.125) <<
" KiB/s";
313 }
else if (bitrateInKbitsPerSecond < 8000000.0) {
314 res << (bitrateInKbitsPerSecond * 0.000125) <<
" MiB/s";
316 res << (bitrateInKbitsPerSecond * 0.000000125) <<
" GiB/s";
// Bit-based output with decimal prefixes: bit/s, kbit/s, Mbit/s, Gbit/s.
319 if (bitrateInKbitsPerSecond < 1.0) {
320 res << (bitrateInKbitsPerSecond * 1000.0) <<
" bit/s";
321 }
else if (bitrateInKbitsPerSecond < 1000.0) {
322 res << (bitrateInKbitsPerSecond) <<
" kbit/s";
323 }
else if (bitrateInKbitsPerSecond < 1000000.0) {
324 res << (bitrateInKbitsPerSecond * 0.001) <<
" Mbit/s";
326 res << (bitrateInKbitsPerSecond * 0.000001) <<
" Gbit/s";
// Base64 alphabet: the character at index i encodes the 6-bit value i
// ('A'-'Z' = 0-25, 'a'-'z' = 26-51, '0'-'9' = 52-61, '+' = 62, '/' = 63).
333 const char *
const base64Chars =
"ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+/";
// Character used to pad the encoded text.
334 const char base64Pad =
'=';
// Body of the Base64 encoder (its signature is not visible here; it uses data and dataSize).
343 auto encoded = std::string();
// mod is the number of input bytes left over after the last complete 3-byte group.
344 auto mod =
static_cast<std::uint8_t
>(dataSize % 3);
345 auto temp = std::uint32_t();
// Four output characters per 3-byte group, plus one more group when there is a remainder.
346 encoded.reserve(((dataSize / 3) + (mod > 0)) * 4);
// data is moved one byte back so that every read below can use pre-increment; end
// therefore points at the last byte of the last complete group.
347 for (
const std::uint8_t *end = --data + dataSize - mod; data != end;) {
// Pack the bytes of the group into temp, most significant byte first.
// NOTE(review): only the statements for the first two bytes are visible here.
348 temp =
static_cast<std::uint32_t
>(*++data << 16);
349 temp |=
static_cast<std::uint32_t
>(*++data << 8);
// Emit the four 6-bit slices of the 24-bit group, highest slice first.
351 encoded.push_back(base64Chars[(temp & 0x00FC0000) >> 18]);
352 encoded.push_back(base64Chars[(temp & 0x0003F000) >> 12]);
353 encoded.push_back(base64Chars[(temp & 0x00000FC0) >> 6]);
354 encoded.push_back(base64Chars[(temp & 0x0000003F)]);
// Tail that reads one byte: two data characters followed by two padding characters.
// NOTE(review): the statement selecting between the two tails is not visible here.
358 temp =
static_cast<std::uint32_t
>(*++data << 16);
359 encoded.push_back(base64Chars[(temp & 0x00FC0000) >> 18]);
360 encoded.push_back(base64Chars[(temp & 0x0003F000) >> 12]);
361 encoded.push_back(base64Pad);
362 encoded.push_back(base64Pad);
// Tail that reads two bytes: three data characters followed by one padding character.
365 temp =
static_cast<std::uint32_t
>(*++data << 16);
366 temp |=
static_cast<std::uint32_t
>(*++data << 8);
367 encoded.push_back(base64Chars[(temp & 0x00FC0000) >> 18]);
368 encoded.push_back(base64Chars[(temp & 0x0003F000) >> 12]);
369 encoded.push_back(base64Chars[(temp & 0x00000FC0) >> 6]);
370 encoded.push_back(base64Pad);
// Decodes strSize characters of Base64 text starting at encodedStr.
// Returns the decoded bytes together with their count (decodedSize).
// NOTE(review): several statements of this function are not visible here (among them
// whatever precedes the size computation and the bodies of some branches), so the
// comments below describe only what is shown.
381 pair<unique_ptr<std::uint8_t[]>, std::uint32_t>
decodeBase64(
const char *encodedStr,
const std::uint32_t strSize)
// Every group of four characters yields up to three bytes.
386 std::uint32_t decodedSize = (strSize / 4) * 3;
387 const char *
const end = encodedStr + strSize;
// The last two characters are inspected for padding.
// NOTE(review): these reads assume strSize >= 2; a guard, if any, is not visible here.
389 if (*(end - 1) == base64Pad) {
392 if (*(end - 2) == base64Pad) {
396 auto buffer = make_unique<std::uint8_t[]>(decodedSize);
// iter starts one element before the buffer so that every write can use pre-increment.
397 auto *iter = buffer.get() - 1;
398 while (encodedStr < end) {
// temp collects the 6-bit values of one 4-character quantum.
399 std::int32_t temp = 0;
400 for (std::uint8_t quantumPos = 0; quantumPos < 4; ++quantumPos, ++encodedStr) {
// Map the character to its 6-bit value: 'A'-'Z' -> 0-25.
402 if (*encodedStr >=
'A' && *encodedStr <=
'Z') {
403 temp |= *encodedStr -
'A';
404 }
else if (*encodedStr >=
'a' && *encodedStr <=
'z') {
// 'a'-'z' -> 26-51.
405 temp |= *encodedStr -
'a' + 26;
406 }
else if (*encodedStr >=
'0' && *encodedStr <=
'9') {
// '0'-'9' -> 52-61.
407 temp |= *encodedStr -
'0' + 2 * 26;
408 }
else if (*encodedStr ==
'+') {
// NOTE(review): the statement for '+' is not visible here.
410 }
else if (*encodedStr ==
'/') {
// '/' -> 63.
411 temp |= 2 * 26 + 10 + 1;
412 }
else if (*encodedStr == base64Pad) {
// Padding ends the data; the number of characters left decides how many bytes of the
// current quantum are written before returning.
// NOTE(review): the case labels are not visible here.
413 switch (end - encodedStr) {
// Two bytes are written, then the result is returned.
415 *++iter =
static_cast<std::uint8_t
>((temp >> 16) & 0xFF);
416 *++iter =
static_cast<std::uint8_t
>((temp >> 8) & 0xFF);
417 return make_pair(move(buffer), decodedSize);
// One byte is written, then the result is returned.
419 *++iter =
static_cast<std::uint8_t
>((temp >> 10) & 0xFF);
420 return make_pair(move(buffer), decodedSize);
// Three bytes are written from temp, most significant byte first.
428 *++iter =
static_cast<std::uint8_t
>((temp >> 16) & 0xFF);
429 *++iter =
static_cast<std::uint8_t
>((temp >> 8) & 0xFF);
430 *++iter =
static_cast<std::uint8_t
>(temp & 0xFF);
432 return make_pair(move(buffer), decodedSize);
The ConversionException class is thrown by the various conversion functions of this library when a co...
Contains all utilities provided by the c++utilities library.
CPP_UTILITIES_EXPORT StringData convertUtf8ToUtf16BE(const char *inputBuffer, std::size_t inputBufferSize)
Converts the specified UTF-8 string to UTF-16 (big-endian).
CPP_UTILITIES_EXPORT StringData convertString(const char *fromCharset, const char *toCharset, const char *inputBuffer, std::size_t inputBufferSize, float outputBufferSizeFactor=1.0f)
Converts the specified string from one character set to another.
CPP_UTILITIES_EXPORT StringData convertLatin1ToUtf8(const char *inputBuffer, std::size_t inputBufferSize)
Converts the specified Latin-1 string to UTF-8.
CPP_UTILITIES_EXPORT StringData convertUtf16LEToUtf8(const char *inputBuffer, std::size_t inputBufferSize)
Converts the specified UTF-16 (little-endian) string to UTF-8.
CPP_UTILITIES_EXPORT std::pair< std::unique_ptr< std::uint8_t[]>, std::uint32_t > decodeBase64(const char *encodedStr, const std::uint32_t strSize)
Decodes the specified Base64 encoded string.
CPP_UTILITIES_EXPORT void truncateString(std::string &str, char terminationChar='\0')
Truncates all characters after the first occurrence of the specified terminationChar and the terminat...
std::pair< std::unique_ptr< char[], StringDataDeleter >, std::size_t > StringData
Type used to return string encoding conversion result.
CPP_UTILITIES_EXPORT StringData convertUtf16BEToUtf8(const char *inputBuffer, std::size_t inputBufferSize)
Converts the specified UTF-16 (big-endian) string to UTF-8.
constexpr T max(T first, T second)
Returns the greatest of the given items.
CPP_UTILITIES_EXPORT StringData convertUtf8ToLatin1(const char *inputBuffer, std::size_t inputBufferSize)
Converts the specified UTF-8 string to Latin-1.
CPP_UTILITIES_EXPORT StringData convertUtf8ToUtf16LE(const char *inputBuffer, std::size_t inputBufferSize)
Converts the specified UTF-8 string to UTF-16 (little-endian).
CPP_UTILITIES_EXPORT std::string bitrateToString(double speedInKbitsPerSecond, bool useByteInsteadOfBits=false)
Converts the specified bitrate in kbit/s to its equivalent std::string representation.
CPP_UTILITIES_EXPORT std::string encodeBase64(const std::uint8_t *data, std::uint32_t dataSize)
Encodes the specified data to Base64.
CPP_UTILITIES_EXPORT std::string dataSizeToString(std::uint64_t sizeInByte, bool includeByte=false)
Converts the specified data size in bytes to its equivalent std::string representation.