/* * Copyright (c) 2010-2017 OTClient * * Permission is hereby granted, free of charge, to any person obtaining a copy * of this software and associated documentation files (the "Software"), to deal * in the Software without restriction, including without limitation the rights * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell * copies of the Software, and to permit persons to whom the Software is * furnished to do so, subject to the following conditions: * * The above copyright notice and this permission notice shall be included in * all copies or substantial portions of the Software. * * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN * THE SOFTWARE. */ #include "string.h" #include "format.h" #include #include #include #ifdef _MSC_VER #pragma warning(disable:4267) // '?' : conversion from 'A' to 'B', possible loss of data #endif namespace stdext { std::string resolve_path(const std::string& filePath, std::string sourcePath) { if(stdext::starts_with(filePath, "/")) return filePath; if(!stdext::ends_with(sourcePath, "/")) { std::size_t slashPos = sourcePath.find_last_of("/"); if(slashPos == std::string::npos) throw_exception(format("invalid source path '%s', for file '%s'", sourcePath, filePath)); sourcePath = sourcePath.substr(0, slashPos + 1); } return sourcePath + filePath; } std::string date_time_string() { char date[32]; std::time_t tnow; std::time(&tnow); std::tm *ts = std::localtime(&tnow); std::strftime(date, 32, "%b %d %Y %H:%M:%S", ts); return std::string(date); } std::string dec_to_hex(uint64_t num) { std::string str; std::ostringstream o; o << std::hex << num; str = o.str(); return str; } uint64_t hex_to_dec(const std::string& str) { uint64_t num; std::istringstream i(str); i >> std::hex >> num; return num; } bool is_valid_utf8(const std::string& src) { const unsigned char *bytes = (const unsigned char *)src.c_str(); while(*bytes) { if( (// ASCII // use bytes[0] <= 0x7F to allow ASCII control characters bytes[0] == 0x09 || bytes[0] == 0x0A || bytes[0] == 0x0D || (0x20 <= bytes[0] && bytes[0] <= 0x7E) ) ) { bytes += 1; continue; } if( (// non-overlong 2-byte (0xC2 <= bytes[0] && bytes[0] <= 0xDF) && (0x80 <= bytes[1] && bytes[1] <= 0xBF) ) ) { bytes += 2; continue; } if( (// excluding overlongs bytes[0] == 0xE0 && (0xA0 <= bytes[1] && bytes[1] <= 0xBF) && (0x80 <= bytes[2] && bytes[2] <= 0xBF) ) || (// straight 3-byte ((0xE1 <= bytes[0] && bytes[0] <= 0xEC) || bytes[0] == 0xEE || bytes[0] == 0xEF) && (0x80 <= bytes[1] && bytes[1] <= 0xBF) && (0x80 <= bytes[2] && bytes[2] <= 0xBF) ) || (// excluding surrogates bytes[0] == 0xED && (0x80 <= bytes[1] && bytes[1] <= 0x9F) && (0x80 <= bytes[2] && bytes[2] <= 0xBF) ) ) { bytes += 3; continue; } if( (// planes 1-3 bytes[0] == 0xF0 && (0x90 <= bytes[1] && bytes[1] <= 0xBF) && (0x80 <= bytes[2] && bytes[2] <= 0xBF) && (0x80 <= bytes[3] && bytes[3] <= 0xBF) ) || (// planes 4-15 (0xF1 <= bytes[0] && bytes[0] <= 0xF3) && (0x80 <= bytes[1] && bytes[1] <= 0xBF) && (0x80 <= bytes[2] && bytes[2] <= 0xBF) && (0x80 <= bytes[3] && bytes[3] <= 0xBF) ) || (// plane 16 bytes[0] == 0xF4 && (0x80 <= bytes[1] && bytes[1] <= 0x8F) && (0x80 <= bytes[2] && bytes[2] <= 0xBF) && (0x80 <= bytes[3] && bytes[3] <= 0xBF) ) ) { bytes += 4; continue; } return false; } return true; } std::string utf8_to_latin1(const std::string& src) { std::string out; for(uint i=0;i= 32 && c < 128) || c == 0x0d || c == 0x0a || c == 0x09) out += c; else if(c == 0xc2 || c == 0xc3) { uchar c2 = src[i++]; if(c == 0xc2) { if(c2 > 0xa1 && c2 < 0xbb) out += c2; } else if(c == 0xc3) out += 64 + c2; } else if(c >= 0xc4 && c <= 0xdf) i += 1; else if(c >= 0xe0 && c <= 0xed) i += 2; else if(c >= 0xf0 && c <= 0xf4) i += 3; } return out; } std::string latin1_to_utf8(const std::string& src) { std::string out; for(uchar c : src) { if((c >= 32 && c < 128) || c == 0x0d || c == 0x0a || c == 0x09) out += c; else { out += 0xc2 + (c > 0xbf); out += 0x80 + (c & 0x3f); } } return out; } #ifdef WIN32 #include #include std::wstring utf8_to_utf16(const std::string& src) { std::wstring res; wchar_t out[4096]; if(MultiByteToWideChar(CP_UTF8, 0, src.c_str(), -1, out, 4096)) res = out; return res; } std::string utf16_to_utf8(const std::wstring& src) { std::string res; char out[4096]; if(WideCharToMultiByte(CP_UTF8, 0, src.c_str(), -1, out, 4096, NULL, NULL)) res = out; return res; } std::wstring latin1_to_utf16(const std::string& src) { return utf8_to_utf16(latin1_to_utf8(src)); } std::string utf16_to_latin1(const std::wstring& src) { return utf8_to_latin1(utf16_to_utf8(src)); } #endif void tolower(std::string& str) { std::transform(str.begin(), str.end(), str.begin(), lochar); } void toupper(std::string& str) { std::transform(str.begin(), str.end(), str.begin(), upchar); } void trim(std::string& str) { boost::trim(str); } char upchar(char c) { if((c >= 97 && c <= 122) || (uchar)c >= 224) c -= 32; return c; } char lochar(char c) { if((c >= 65 && c <= 90) || ((uchar)c >= 192 && (uchar)c <= 223)) c += 32; return c; } void ucwords(std::string& str) { uint32 strLen = str.length(); if(strLen == 0) return; str[0] = upchar(str[0]); for(uint32 i = 1; i < strLen; ++i) { if(str[i - 1] == ' ') str[i] = upchar(str[i]); } } bool ends_with(const std::string& str, const std::string& test) { return boost::ends_with(str, test); } bool starts_with(const std::string& str, const std::string& test) { return boost::starts_with(str, test); } void replace_all(std::string& str, const std::string& search, const std::string& replacement) { return boost::replace_all(str, search, replacement); } std::vector split(const std::string& str, const std::string& separators) { std::vector splitted; boost::split(splitted, str, boost::is_any_of(std::string(separators))); return splitted; } }