| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | // Copyright 2013 Dolphin Emulator Project
 | 
					
						
							|  |  |  | // Licensed under GPLv2
 | 
					
						
							|  |  |  | // Refer to the license.txt file included.
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #include <algorithm>
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-04-08 20:15:08 -04:00
										 |  |  | #include "common/common.h"
 | 
					
						
							|  |  |  | #include "common/string_util.h"
 | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | 
 | 
					
						
							|  |  |  | #ifdef _WIN32
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     #include <Windows.h>
 | 
					
						
							| 
									
										
										
										
											2014-11-10 14:36:32 -08:00
										 |  |  |     #include <codecvt>
 | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | #else
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     #include <iconv.h>
 | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | #endif
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-09-07 11:50:43 -07:00
										 |  |  | namespace Common { | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-04-14 21:25:46 -04:00
										 |  |  | /// Make a string lowercase
 | 
					
						
							| 
									
										
										
										
											2014-09-07 11:50:43 -07:00
										 |  |  | std::string ToLower(std::string str) { | 
					
						
							| 
									
										
										
										
											2014-09-07 00:49:52 -07:00
										 |  |  |     std::transform(str.begin(), str.end(), str.begin(), ::tolower); | 
					
						
							|  |  |  |     return str; | 
					
						
							| 
									
										
										
										
											2014-04-14 21:25:46 -04:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | /// Make a string uppercase
 | 
					
						
							| 
									
										
										
										
											2014-09-07 11:50:43 -07:00
										 |  |  | std::string ToUpper(std::string str) { | 
					
						
							| 
									
										
										
										
											2014-09-07 00:49:52 -07:00
										 |  |  |     std::transform(str.begin(), str.end(), str.begin(), ::toupper); | 
					
						
							|  |  |  |     return str; | 
					
						
							| 
									
										
										
										
											2014-04-14 21:25:46 -04:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | // faster than sscanf
 | 
					
						
							|  |  |  | bool AsciiToHex(const char* _szValue, u32& result) | 
					
						
							|  |  |  | { | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     char *endptr = NULL; | 
					
						
							|  |  |  |     const u32 value = strtoul(_szValue, &endptr, 16); | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     if (!endptr || *endptr) | 
					
						
							|  |  |  |         return false; | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     result = value; | 
					
						
							|  |  |  |     return true; | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | bool CharArrayFromFormatV(char* out, int outsize, const char* format, va_list args) | 
					
						
							|  |  |  | { | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     int writtenCount; | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | 
 | 
					
						
							|  |  |  | #ifdef _WIN32
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     // You would think *printf are simple, right? Iterate on each character,
 | 
					
						
							|  |  |  |     // if it's a format specifier handle it properly, etc.
 | 
					
						
							|  |  |  |     //
 | 
					
						
							|  |  |  |     // Nooooo. Not according to the C standard.
 | 
					
						
							|  |  |  |     //
 | 
					
						
							|  |  |  |     // According to the C99 standard (7.19.6.1 "The fprintf function")
 | 
					
						
							|  |  |  |     //     The format shall be a multibyte character sequence
 | 
					
						
							|  |  |  |     //
 | 
					
						
							|  |  |  |     // Because some character encodings might have '%' signs in the middle of
 | 
					
						
							|  |  |  |     // a multibyte sequence (SJIS for example only specifies that the first
 | 
					
						
							|  |  |  |     // byte of a 2 byte sequence is "high", the second byte can be anything),
 | 
					
						
							|  |  |  |     // printf functions have to decode the multibyte sequences and try their
 | 
					
						
							|  |  |  |     // best to not screw up.
 | 
					
						
							|  |  |  |     //
 | 
					
						
							|  |  |  |     // Unfortunately, on Windows, the locale for most languages is not UTF-8
 | 
					
						
							|  |  |  |     // as we would need. Notably, for zh_TW, Windows chooses EUC-CN as the
 | 
					
						
							|  |  |  |     // locale, and completely fails when trying to decode UTF-8 as EUC-CN.
 | 
					
						
							|  |  |  |     //
 | 
					
						
							|  |  |  |     // On the other hand, the fix is simple: because we use UTF-8, no such
 | 
					
						
							|  |  |  |     // multibyte handling is required as we can simply assume that no '%' char
 | 
					
						
							|  |  |  |     // will be present in the middle of a multibyte sequence.
 | 
					
						
							|  |  |  |     //
 | 
					
						
							|  |  |  |     // This is why we lookup an ANSI (cp1252) locale here and use _vsnprintf_l.
 | 
					
						
							|  |  |  |     static locale_t c_locale = NULL; | 
					
						
							|  |  |  |     if (!c_locale) | 
					
						
							|  |  |  |         c_locale = _create_locale(LC_ALL, ".1252"); | 
					
						
							|  |  |  |     writtenCount = _vsnprintf_l(out, outsize, format, c_locale, args); | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | #else
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     writtenCount = vsnprintf(out, outsize, format, args); | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | #endif
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     if (writtenCount > 0 && writtenCount < outsize) | 
					
						
							|  |  |  |     { | 
					
						
							|  |  |  |         out[writtenCount] = '\0'; | 
					
						
							|  |  |  |         return true; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  |     else | 
					
						
							|  |  |  |     { | 
					
						
							|  |  |  |         out[outsize - 1] = '\0'; | 
					
						
							|  |  |  |         return false; | 
					
						
							|  |  |  |     } | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | std::string StringFromFormat(const char* format, ...) | 
					
						
							|  |  |  | { | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     va_list args; | 
					
						
							|  |  |  |     char *buf = NULL; | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | #ifdef _WIN32
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     int required = 0; | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     va_start(args, format); | 
					
						
							|  |  |  |     required = _vscprintf(format, args); | 
					
						
							|  |  |  |     buf = new char[required + 1]; | 
					
						
							|  |  |  |     CharArrayFromFormatV(buf, required + 1, format, args); | 
					
						
							|  |  |  |     va_end(args); | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     std::string temp = buf; | 
					
						
							|  |  |  |     delete[] buf; | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | #else
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     va_start(args, format); | 
					
						
							|  |  |  |     if (vasprintf(&buf, format, args) < 0) | 
					
						
							|  |  |  |         ERROR_LOG(COMMON, "Unable to allocate memory for string"); | 
					
						
							|  |  |  |     va_end(args); | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     std::string temp = buf; | 
					
						
							|  |  |  |     free(buf); | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | #endif
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     return temp; | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | // For Debugging. Read out an u8 array.
 | 
					
						
							|  |  |  | std::string ArrayToString(const u8 *data, u32 size, int line_len, bool spaces) | 
					
						
							|  |  |  | { | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     std::ostringstream oss; | 
					
						
							|  |  |  |     oss << std::setfill('0') << std::hex; | 
					
						
							| 
									
										
										
										
											2014-11-19 08:49:13 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     for (int line = 0; size; ++data, --size) | 
					
						
							|  |  |  |     { | 
					
						
							|  |  |  |         oss << std::setw(2) << (int)*data; | 
					
						
							| 
									
										
										
										
											2014-11-19 08:49:13 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |         if (line_len == ++line) | 
					
						
							|  |  |  |         { | 
					
						
							|  |  |  |             oss << '\n'; | 
					
						
							|  |  |  |             line = 0; | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  |         else if (spaces) | 
					
						
							|  |  |  |             oss << ' '; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     return oss.str(); | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | // Turns "  hej " into "hej". Also handles tabs.
 | 
					
						
							|  |  |  | std::string StripSpaces(const std::string &str) | 
					
						
							|  |  |  | { | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     const size_t s = str.find_first_not_of(" \t\r\n"); | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     if (str.npos != s) | 
					
						
							|  |  |  |         return str.substr(s, str.find_last_not_of(" \t\r\n") - s + 1); | 
					
						
							|  |  |  |     else | 
					
						
							|  |  |  |         return ""; | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | // "\"hello\"" is turned to "hello"
 | 
					
						
							|  |  |  | // This one assumes that the string has already been space stripped in both
 | 
					
						
							|  |  |  | // ends, as done by StripSpaces above, for example.
 | 
					
						
							|  |  |  | std::string StripQuotes(const std::string& s) | 
					
						
							|  |  |  | { | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     if (s.size() && '\"' == s[0] && '\"' == *s.rbegin()) | 
					
						
							|  |  |  |         return s.substr(1, s.size() - 2); | 
					
						
							|  |  |  |     else | 
					
						
							|  |  |  |         return s; | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | bool TryParse(const std::string &str, u32 *const output) | 
					
						
							|  |  |  | { | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     char *endptr = NULL; | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     // Reset errno to a value other than ERANGE
 | 
					
						
							|  |  |  |     errno = 0; | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     unsigned long value = strtoul(str.c_str(), &endptr, 0); | 
					
						
							| 
									
										
										
										
											2014-11-19 08:49:13 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     if (!endptr || *endptr) | 
					
						
							|  |  |  |         return false; | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     if (errno == ERANGE) | 
					
						
							|  |  |  |         return false; | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | 
 | 
					
						
							|  |  |  | #if ULONG_MAX > UINT_MAX
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     if (value >= 0x100000000ull | 
					
						
							|  |  |  |         && value <= 0xFFFFFFFF00000000ull) | 
					
						
							|  |  |  |         return false; | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | #endif
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     *output = static_cast<u32>(value); | 
					
						
							|  |  |  |     return true; | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | bool TryParse(const std::string &str, bool *const output) | 
					
						
							|  |  |  | { | 
					
						
							| 
									
										
										
										
											2014-10-23 21:17:01 -07:00
										 |  |  |     if ("1" == str || "true" == ToLower(str)) | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |         *output = true; | 
					
						
							| 
									
										
										
										
											2014-10-23 21:17:01 -07:00
										 |  |  |     else if ("0" == str || "false" == ToLower(str)) | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |         *output = false; | 
					
						
							|  |  |  |     else | 
					
						
							|  |  |  |         return false; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     return true; | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | std::string StringFromBool(bool value) | 
					
						
							|  |  |  | { | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     return value ? "True" : "False"; | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | bool SplitPath(const std::string& full_path, std::string* _pPath, std::string* _pFilename, std::string* _pExtension) | 
					
						
							|  |  |  | { | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     if (full_path.empty()) | 
					
						
							|  |  |  |         return false; | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     size_t dir_end = full_path.find_last_of("/" | 
					
						
							|  |  |  |     // windows needs the : included for something like just "C:" to be considered a directory
 | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | #ifdef _WIN32
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |         ":" | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | #endif
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     ); | 
					
						
							|  |  |  |     if (std::string::npos == dir_end) | 
					
						
							|  |  |  |         dir_end = 0; | 
					
						
							|  |  |  |     else | 
					
						
							|  |  |  |         dir_end += 1; | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     size_t fname_end = full_path.rfind('.'); | 
					
						
							|  |  |  |     if (fname_end < dir_end || std::string::npos == fname_end) | 
					
						
							|  |  |  |         fname_end = full_path.size(); | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     if (_pPath) | 
					
						
							|  |  |  |         *_pPath = full_path.substr(0, dir_end); | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     if (_pFilename) | 
					
						
							|  |  |  |         *_pFilename = full_path.substr(dir_end, fname_end - dir_end); | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     if (_pExtension) | 
					
						
							|  |  |  |         *_pExtension = full_path.substr(fname_end); | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     return true; | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | void BuildCompleteFilename(std::string& _CompleteFilename, const std::string& _Path, const std::string& _Filename) | 
					
						
							|  |  |  | { | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     _CompleteFilename = _Path; | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     // check for seperator
 | 
					
						
							|  |  |  |     if (DIR_SEP_CHR != *_CompleteFilename.rbegin()) | 
					
						
							|  |  |  |         _CompleteFilename += DIR_SEP_CHR; | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     // add the filename
 | 
					
						
							|  |  |  |     _CompleteFilename += _Filename; | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | void SplitString(const std::string& str, const char delim, std::vector<std::string>& output) | 
					
						
							|  |  |  | { | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     std::istringstream iss(str); | 
					
						
							|  |  |  |     output.resize(1); | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     while (std::getline(iss, *output.rbegin(), delim)) | 
					
						
							|  |  |  |         output.push_back(""); | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     output.pop_back(); | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | std::string TabsToSpaces(int tab_size, const std::string &in) | 
					
						
							|  |  |  | { | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     const std::string spaces(tab_size, ' '); | 
					
						
							|  |  |  |     std::string out(in); | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     size_t i = 0; | 
					
						
							|  |  |  |     while (out.npos != (i = out.find('\t'))) | 
					
						
							|  |  |  |         out.replace(i, 1, spaces); | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     return out; | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | std::string ReplaceAll(std::string result, const std::string& src, const std::string& dest) | 
					
						
							|  |  |  | { | 
					
						
							| 
									
										
										
										
											2014-09-08 14:48:59 -04:00
										 |  |  |     size_t pos = 0; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     if (src == dest) | 
					
						
							|  |  |  |         return result; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     while ((pos = result.find(src, pos)) != std::string::npos) | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     { | 
					
						
							|  |  |  |         result.replace(pos, src.size(), dest); | 
					
						
							| 
									
										
										
										
											2014-09-08 14:48:59 -04:00
										 |  |  |         pos += dest.length(); | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     } | 
					
						
							| 
									
										
										
										
											2014-09-08 14:48:59 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     return result; | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | // UriDecode and UriEncode are from http://www.codeguru.com/cpp/cpp/string/conversions/print.php/c12759
 | 
					
						
							|  |  |  | // by jinq0123 (November 2, 2006)
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | // Uri encode and decode.
 | 
					
						
							|  |  |  | // RFC1630, RFC1738, RFC2396
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | //#include <string>
 | 
					
						
							|  |  |  | //#include <assert.h>
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-11-19 08:49:13 +00:00
										 |  |  | const char HEX2DEC[256] = | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | { | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     /*       0  1  2  3   4  5  6  7   8  9  A  B   C  D  E  F */ | 
					
						
							|  |  |  |     /* 0 */ 16,16,16,16, 16,16,16,16, 16,16,16,16, 16,16,16,16, | 
					
						
							|  |  |  |     /* 1 */ 16,16,16,16, 16,16,16,16, 16,16,16,16, 16,16,16,16, | 
					
						
							|  |  |  |     /* 2 */ 16,16,16,16, 16,16,16,16, 16,16,16,16, 16,16,16,16, | 
					
						
							|  |  |  |     /* 3 */  0, 1, 2, 3,  4, 5, 6, 7,  8, 9,16,16, 16,16,16,16, | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     /* 4 */ 16,10,11,12, 13,14,15,16, 16,16,16,16, 16,16,16,16, | 
					
						
							|  |  |  |     /* 5 */ 16,16,16,16, 16,16,16,16, 16,16,16,16, 16,16,16,16, | 
					
						
							|  |  |  |     /* 6 */ 16,10,11,12, 13,14,15,16, 16,16,16,16, 16,16,16,16, | 
					
						
							|  |  |  |     /* 7 */ 16,16,16,16, 16,16,16,16, 16,16,16,16, 16,16,16,16, | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     /* 8 */ 16,16,16,16, 16,16,16,16, 16,16,16,16, 16,16,16,16, | 
					
						
							|  |  |  |     /* 9 */ 16,16,16,16, 16,16,16,16, 16,16,16,16, 16,16,16,16, | 
					
						
							|  |  |  |     /* A */ 16,16,16,16, 16,16,16,16, 16,16,16,16, 16,16,16,16, | 
					
						
							|  |  |  |     /* B */ 16,16,16,16, 16,16,16,16, 16,16,16,16, 16,16,16,16, | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     /* C */ 16,16,16,16, 16,16,16,16, 16,16,16,16, 16,16,16,16, | 
					
						
							|  |  |  |     /* D */ 16,16,16,16, 16,16,16,16, 16,16,16,16, 16,16,16,16, | 
					
						
							|  |  |  |     /* E */ 16,16,16,16, 16,16,16,16, 16,16,16,16, 16,16,16,16, | 
					
						
							|  |  |  |     /* F */ 16,16,16,16, 16,16,16,16, 16,16,16,16, 16,16,16,16 | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | }; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | std::string UriDecode(const std::string & sSrc) | 
					
						
							|  |  |  | { | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     // Note from RFC1630:  "Sequences which start with a percent sign
 | 
					
						
							|  |  |  |     // but are not followed by two hexadecimal characters (0-9, A-F) are reserved
 | 
					
						
							|  |  |  |     // for future extension"
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     const unsigned char * pSrc = (const unsigned char *)sSrc.c_str(); | 
					
						
							|  |  |  |     const size_t SRC_LEN = sSrc.length(); | 
					
						
							|  |  |  |     const unsigned char * const SRC_END = pSrc + SRC_LEN; | 
					
						
							| 
									
										
										
										
											2014-11-19 08:49:13 +00:00
										 |  |  |     const unsigned char * const SRC_LAST_DEC = SRC_END - 2;   // last decodable '%'
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  | 
 | 
					
						
							|  |  |  |     char * const pStart = new char[SRC_LEN]; | 
					
						
							|  |  |  |     char * pEnd = pStart; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     while (pSrc < SRC_LAST_DEC) | 
					
						
							|  |  |  |     { | 
					
						
							|  |  |  |         if (*pSrc == '%') | 
					
						
							|  |  |  |         { | 
					
						
							|  |  |  |             char dec1, dec2; | 
					
						
							|  |  |  |             if (16 != (dec1 = HEX2DEC[*(pSrc + 1)]) | 
					
						
							|  |  |  |                 && 16 != (dec2 = HEX2DEC[*(pSrc + 2)])) | 
					
						
							|  |  |  |             { | 
					
						
							|  |  |  |                 *pEnd++ = (dec1 << 4) + dec2; | 
					
						
							|  |  |  |                 pSrc += 3; | 
					
						
							|  |  |  |                 continue; | 
					
						
							|  |  |  |             } | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         *pEnd++ = *pSrc++; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     // the last 2- chars
 | 
					
						
							|  |  |  |     while (pSrc < SRC_END) | 
					
						
							|  |  |  |         *pEnd++ = *pSrc++; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     std::string sResult(pStart, pEnd); | 
					
						
							|  |  |  |     delete [] pStart; | 
					
						
							|  |  |  |     return sResult; | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							// Lookup table indexed by byte value: a non-zero entry marks a character that
							// UriEncode copies through unescaped. Only ASCII alphanumerics are safe.
							const char SAFE[256] =
							{
							    /*      0 1 2 3  4 5 6 7  8 9 A B  C D E F */
							    /* 0 */ 0,0,0,0, 0,0,0,0, 0,0,0,0, 0,0,0,0,
							    /* 1 */ 0,0,0,0, 0,0,0,0, 0,0,0,0, 0,0,0,0,
							    /* 2 */ 0,0,0,0, 0,0,0,0, 0,0,0,0, 0,0,0,0,
							    /* 3 */ 1,1,1,1, 1,1,1,1, 1,1,0,0, 0,0,0,0,

							    /* 4 */ 0,1,1,1, 1,1,1,1, 1,1,1,1, 1,1,1,1,
							    /* 5 */ 1,1,1,1, 1,1,1,1, 1,1,1,0, 0,0,0,0,
							    /* 6 */ 0,1,1,1, 1,1,1,1, 1,1,1,1, 1,1,1,1,
							    /* 7 */ 1,1,1,1, 1,1,1,1, 1,1,1,0, 0,0,0,0,

							    /* 8 */ 0,0,0,0, 0,0,0,0, 0,0,0,0, 0,0,0,0,
							    /* 9 */ 0,0,0,0, 0,0,0,0, 0,0,0,0, 0,0,0,0,
							    /* A */ 0,0,0,0, 0,0,0,0, 0,0,0,0, 0,0,0,0,
							    /* B */ 0,0,0,0, 0,0,0,0, 0,0,0,0, 0,0,0,0,

							    /* C */ 0,0,0,0, 0,0,0,0, 0,0,0,0, 0,0,0,0,
							    /* D */ 0,0,0,0, 0,0,0,0, 0,0,0,0, 0,0,0,0,
							    /* E */ 0,0,0,0, 0,0,0,0, 0,0,0,0, 0,0,0,0,
							    /* F */ 0,0,0,0, 0,0,0,0, 0,0,0,0, 0,0,0,0
							};

							/// Percent-encodes a string for use in a URI.
							///
							/// Bytes flagged in SAFE (ASCII letters and digits) are copied unchanged; every
							/// other byte becomes '%' followed by its value as two uppercase hex digits.
							///
							/// @param sSrc  String to encode.
							/// @return The encoded string (at most three times the length of sSrc).
							std::string UriEncode(const std::string & sSrc)
							{
							    static const char DEC2HEX[16 + 1] = "0123456789ABCDEF";

							    // Accumulate into a std::string so the buffer is released automatically,
							    // even if an allocation throws part-way through.
							    std::string result;
							    result.reserve(sSrc.length());

							    for (const char ch : sSrc)
							    {
							        // Index the tables with the unsigned byte value so that characters
							        // above 0x7F never produce a negative index.
							        const unsigned char byte = static_cast<unsigned char>(ch);
							        if (SAFE[byte])
							        {
							            result.push_back(ch);
							        }
							        else
							        {
							            // escape this char
							            result.push_back('%');
							            result.push_back(DEC2HEX[byte >> 4]);
							            result.push_back(DEC2HEX[byte & 0x0F]);
							        }
							    }

							    return result;
							}
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #ifdef _WIN32
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-11-10 14:36:32 -08:00
										 /// Converts a UTF-16 string to UTF-8 with the standard library's
										 /// std::codecvt_utf8_utf16 facet.
										 ///
										 /// @param input  UTF-16 encoded text.
										 /// @return The same text encoded as UTF-8.
										 std::string UTF16ToUTF8(const std::u16string& input)
										 {
										     using Utf8Utf16Facet = std::codecvt_utf8_utf16<char16_t>;

										     std::wstring_convert<Utf8Utf16Facet, char16_t> converter;
										     std::string utf8 = converter.to_bytes(input);
										     return utf8;
										 }
					
						
							|  |  |  | 
 | 
					
						
							/// Converts a UTF-8 string to UTF-16 with the standard library's
							/// std::codecvt_utf8_utf16 facet.
							///
							/// @param input  UTF-8 encoded text.
							/// @return The same text encoded as UTF-16.
							std::u16string UTF8ToUTF16(const std::string& input)
							{
							    using Utf8Utf16Facet = std::codecvt_utf8_utf16<char16_t>;

							    std::wstring_convert<Utf8Utf16Facet, char16_t> converter;
							    std::u16string utf16 = converter.from_bytes(input);
							    return utf16;
							}
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | static std::string UTF16ToUTF8(const std::wstring& input) | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | { | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     auto const size = WideCharToMultiByte(CP_UTF8, 0, input.data(), input.size(), nullptr, 0, nullptr, nullptr); | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     std::string output; | 
					
						
							|  |  |  |     output.resize(size); | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     if (size == 0 || size != WideCharToMultiByte(CP_UTF8, 0, input.data(), input.size(), &output[0], output.size(), nullptr, nullptr)) | 
					
						
							|  |  |  |         output.clear(); | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     return output; | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-11-10 14:36:32 -08:00
										 |  |  | static std::wstring CPToUTF16(u32 code_page, const std::string& input) | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | { | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     auto const size = MultiByteToWideChar(code_page, 0, input.data(), input.size(), nullptr, 0); | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     std::wstring output; | 
					
						
							|  |  |  |     output.resize(size); | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     if (size == 0 || size != MultiByteToWideChar(code_page, 0, input.data(), input.size(), &output[0], output.size())) | 
					
						
							|  |  |  |         output.clear(); | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     return output; | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-11-10 14:36:32 -08:00
										 |  |  | std::wstring UTF8ToUTF16W(const std::string &input) | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | { | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     return CPToUTF16(CP_UTF8, input); | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | std::string SHIFTJISToUTF8(const std::string& input) | 
					
						
							|  |  |  | { | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     return UTF16ToUTF8(CPToUTF16(932, input)); | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | std::string CP1252ToUTF8(const std::string& input) | 
					
						
							|  |  |  | { | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     return UTF16ToUTF8(CPToUTF16(1252, input)); | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #else
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | template <typename T> | 
					
						
							| 
									
										
										
										
											2014-11-10 14:36:32 -08:00
										 |  |  | static std::string CodeToUTF8(const char* fromcode, const std::basic_string<T>& input) | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | { | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     std::string result; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     iconv_t const conv_desc = iconv_open("UTF-8", fromcode); | 
					
						
							| 
									
										
										
										
											2014-11-10 14:36:32 -08:00
										 |  |  |     if ((iconv_t)(-1) == conv_desc) | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     { | 
					
						
							|  |  |  |         ERROR_LOG(COMMON, "Iconv initialization failure [%s]: %s", fromcode, strerror(errno)); | 
					
						
							| 
									
										
										
										
											2014-11-10 14:36:32 -08:00
										 |  |  |         iconv_close(conv_desc); | 
					
						
							|  |  |  |         return {}; | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-11-10 14:36:32 -08:00
										 |  |  |     const size_t in_bytes = sizeof(T) * input.size(); | 
					
						
							|  |  |  |     // Multiply by 4, which is the max number of bytes to encode a codepoint
 | 
					
						
							|  |  |  |     const size_t out_buffer_size = 4 * in_bytes; | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-11-10 14:36:32 -08:00
										 |  |  |     std::string out_buffer; | 
					
						
							|  |  |  |     out_buffer.resize(out_buffer_size); | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-11-10 14:36:32 -08:00
										 |  |  |     auto src_buffer = &input[0]; | 
					
						
							|  |  |  |     size_t src_bytes = in_bytes; | 
					
						
							|  |  |  |     auto dst_buffer = &out_buffer[0]; | 
					
						
							|  |  |  |     size_t dst_bytes = out_buffer.size(); | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-11-10 14:36:32 -08:00
										 |  |  |     while (0 != src_bytes) | 
					
						
							|  |  |  |     { | 
					
						
							|  |  |  |         size_t const iconv_result = iconv(conv_desc, (char**)(&src_buffer), &src_bytes, | 
					
						
							|  |  |  |             &dst_buffer, &dst_bytes); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         if (static_cast<size_t>(-1) == iconv_result) | 
					
						
							|  |  |  |         { | 
					
						
							|  |  |  |             if (EILSEQ == errno || EINVAL == errno) | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |             { | 
					
						
							| 
									
										
										
										
											2014-11-10 14:36:32 -08:00
										 |  |  |                 // Try to skip the bad character
 | 
					
						
							|  |  |  |                 if (0 != src_bytes) | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |                 { | 
					
						
							| 
									
										
										
										
											2014-11-10 14:36:32 -08:00
										 |  |  |                     --src_bytes; | 
					
						
							|  |  |  |                     ++src_buffer; | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |                 } | 
					
						
							|  |  |  |             } | 
					
						
							| 
									
										
										
										
											2014-11-10 14:36:32 -08:00
										 |  |  |             else | 
					
						
							|  |  |  |             { | 
					
						
							|  |  |  |                 ERROR_LOG(COMMON, "iconv failure [%s]: %s", fromcode, strerror(errno)); | 
					
						
							|  |  |  |                 break; | 
					
						
							|  |  |  |             } | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |         } | 
					
						
							| 
									
										
										
										
											2014-11-10 14:36:32 -08:00
										 |  |  |     } | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-11-10 14:36:32 -08:00
										 |  |  |     out_buffer.resize(out_buffer_size - dst_bytes); | 
					
						
							|  |  |  |     out_buffer.swap(result); | 
					
						
							| 
									
										
										
										
											2014-11-19 08:49:13 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-11-10 14:36:32 -08:00
										 |  |  |     iconv_close(conv_desc); | 
					
						
							| 
									
										
										
										
											2014-11-19 08:49:13 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-11-10 14:36:32 -08:00
										 |  |  |     return result; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | std::u16string UTF8ToUTF16(const std::string& input) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  |     std::u16string result; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     iconv_t const conv_desc = iconv_open("UTF-16", "UTF-8"); | 
					
						
							|  |  |  |     if ((iconv_t)(-1) == conv_desc) | 
					
						
							|  |  |  |     { | 
					
						
							|  |  |  |         ERROR_LOG(COMMON, "Iconv initialization failure [UTF-8]: %s", strerror(errno)); | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |         iconv_close(conv_desc); | 
					
						
							| 
									
										
										
										
											2014-11-10 14:36:32 -08:00
										 |  |  |         return {}; | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     } | 
					
						
							| 
									
										
										
										
											2014-11-10 14:36:32 -08:00
										 |  |  | 
 | 
					
						
							|  |  |  |     const size_t in_bytes = sizeof(char) * input.size(); | 
					
						
							|  |  |  |     // Multiply by 4, which is the max number of bytes to encode a codepoint
 | 
					
						
							|  |  |  |     const size_t out_buffer_size = 4 * sizeof(char16_t) * in_bytes; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     std::u16string out_buffer; | 
					
						
							|  |  |  |     out_buffer.resize(out_buffer_size); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     char* src_buffer = const_cast<char*>(&input[0]); | 
					
						
							|  |  |  |     size_t src_bytes = in_bytes; | 
					
						
							|  |  |  |     char* dst_buffer = (char*)(&out_buffer[0]); | 
					
						
							|  |  |  |     size_t dst_bytes = out_buffer.size(); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     while (0 != src_bytes) | 
					
						
							|  |  |  |     { | 
					
						
							|  |  |  |         size_t const iconv_result = iconv(conv_desc, &src_buffer, &src_bytes, | 
					
						
							|  |  |  |                                           &dst_buffer, &dst_bytes); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         if (static_cast<size_t>(-1) == iconv_result) | 
					
						
							|  |  |  |         { | 
					
						
							|  |  |  |             if (EILSEQ == errno || EINVAL == errno) | 
					
						
							|  |  |  |             { | 
					
						
							|  |  |  |                 // Try to skip the bad character
 | 
					
						
							|  |  |  |                 if (0 != src_bytes) | 
					
						
							|  |  |  |                 { | 
					
						
							|  |  |  |                     --src_bytes; | 
					
						
							|  |  |  |                     ++src_buffer; | 
					
						
							|  |  |  |                 } | 
					
						
							|  |  |  |             } | 
					
						
							|  |  |  |             else | 
					
						
							|  |  |  |             { | 
					
						
							|  |  |  |                 ERROR_LOG(COMMON, "iconv failure [UTF-8]: %s", strerror(errno)); | 
					
						
							|  |  |  |                 break; | 
					
						
							|  |  |  |             } | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     out_buffer.resize(out_buffer_size - dst_bytes); | 
					
						
							|  |  |  |     out_buffer.swap(result); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     iconv_close(conv_desc); | 
					
						
							| 
									
										
										
										
											2014-11-19 08:49:13 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     return result; | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-11-10 14:36:32 -08:00
										 |  |  | std::string UTF16ToUTF8(const std::u16string& input) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  |     return CodeToUTF8("UTF-16", input); | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | std::string CP1252ToUTF8(const std::string& input) | 
					
						
							|  |  |  | { | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     //return CodeToUTF8("CP1252//TRANSLIT", input);
 | 
					
						
							|  |  |  |     //return CodeToUTF8("CP1252//IGNORE", input);
 | 
					
						
							|  |  |  |     return CodeToUTF8("CP1252", input); | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | std::string SHIFTJISToUTF8(const std::string& input) | 
					
						
							|  |  |  | { | 
					
						
							| 
									
										
										
										
											2014-04-01 18:20:08 -04:00
										 |  |  |     //return CodeToUTF8("CP932", input);
 | 
					
						
							|  |  |  |     return CodeToUTF8("SJIS", input); | 
					
						
							| 
									
										
										
										
											2013-09-04 20:17:46 -04:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #endif
 | 
					
						
							| 
									
										
										
										
											2014-09-07 11:50:43 -07:00
										 |  |  | 
 | 
					
						
							|  |  |  | } |