// String utilities.
//
-// Written by Bernie Bright, 1998
+// Written by Bernie Bright, started 1998
//
-// Copyright (C) 1998 Bernie Bright - bbright@c031.aone.net.au
+// Copyright (C) 1998 Bernie Bright - bbright@bigpond.net.au
//
// This library is free software; you can redistribute it and/or
// modify it under the terms of the GNU Library General Public
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
// Library General Public License for more details.
//
-// You should have received a copy of the GNU Library General Public
-// License along with this library; if not, write to the
-// Free Software Foundation, Inc., 59 Temple Place - Suite 330,
-// Boston, MA 02111-1307, USA.
+// You should have received a copy of the GNU General Public License
+// along with this program; if not, write to the Free Software
+// Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
//
// $Id$
-#ifdef HAVE_CONFIG_H
-# include <config.h>
-#endif
+#include <ctype.h>
+#include <cstring>
+#include <sstream>
#include "strutils.hxx"
-const string whitespace = " \n\r\t";
+#include <simgear/debug/logstream.hxx>
-//
-string
-trimleft( const string& s, const string& trimmings )
-{
- string result;
- string::size_type pos = s.find_first_not_of( trimmings );
- if ( pos != string::npos )
+using std::string;
+using std::vector;
+using std::stringstream;
+
+namespace simgear {
+ namespace strutils {
+
+ /**
+ *
+ */
+ static vector<string>
+ split_whitespace( const string& str, int maxsplit )
+ {
+ vector<string> result;
+ string::size_type len = str.length();
+ string::size_type i = 0;
+ string::size_type j;
+ int countsplit = 0;
+
+ while (i < len)
+ {
+ while (i < len && isspace((unsigned char)str[i]))
+ {
+ ++i;
+ }
+
+ j = i;
+
+ while (i < len && !isspace((unsigned char)str[i]))
+ {
+ ++i;
+ }
+
+ if (j < i)
+ {
+ result.push_back( str.substr(j, i-j) );
+ ++countsplit;
+ while (i < len && isspace((unsigned char)str[i]))
+ {
+ ++i;
+ }
+
+ if (maxsplit && (countsplit >= maxsplit) && i < len)
+ {
+ result.push_back( str.substr( i, len-i ) );
+ i = len;
+ }
+ }
+ }
+
+ return result;
+ }
+
+ /**
+ *
+ */
+ vector<string>
+ split( const string& str, const char* sep, int maxsplit )
+ {
+ if (sep == 0)
+ return split_whitespace( str, maxsplit );
+
+ vector<string> result;
+ int n = std::strlen( sep );
+ if (n == 0)
+ {
+ // Error: empty separator string
+ return result;
+ }
+ const char* s = str.c_str();
+ string::size_type len = str.length();
+ string::size_type i = 0;
+ string::size_type j = 0;
+ int splitcount = 0;
+
+ while (i+n <= len)
+ {
+ if (s[i] == sep[0] && (n == 1 || std::memcmp(s+i, sep, n) == 0))
+ {
+ result.push_back( str.substr(j,i-j) );
+ i = j = i + n;
+ ++splitcount;
+ if (maxsplit && (splitcount >= maxsplit))
+ break;
+ }
+ else
+ {
+ ++i;
+ }
+ }
+
+ result.push_back( str.substr(j,len-j) );
+ return result;
+ }
+
+ /**
+ * The lstrip(), rstrip() and strip() functions are implemented
+ * in do_strip() which uses an additional parameter to indicate what
+ * type of strip should occur.
+ */
+ const int LEFTSTRIP = 0;
+ const int RIGHTSTRIP = 1;
+ const int BOTHSTRIP = 2;
+
+ static string
+ do_strip( const string& s, int striptype )
+ {
+ string::size_type len = s.length();
+ if( len == 0 ) // empty string is trivial
+ return s;
+ string::size_type i = 0;
+ if (striptype != RIGHTSTRIP)
+ {
+ while (i < len && isspace(s[i]))
+ {
+ ++i;
+ }
+ }
+
+ string::size_type j = len;
+ if (striptype != LEFTSTRIP)
+ {
+ do
+ {
+ --j;
+ }
+ while (j >= 1 && isspace(s[j]));
+ ++j;
+ }
+
+ if (i == 0 && j == len)
+ {
+ return s;
+ }
+ else
+ {
+ return s.substr( i, j - i );
+ }
+ }
+
+ string
+ lstrip( const string& s )
+ {
+ return do_strip( s, LEFTSTRIP );
+ }
+
+ string
+ rstrip( const string& s )
+ {
+ return do_strip( s, RIGHTSTRIP );
+ }
+
+ string
+ strip( const string& s )
+ {
+ return do_strip( s, BOTHSTRIP );
+ }
+
+ string
+ rpad( const string & s, string::size_type length, char c )
+ {
+ string::size_type l = s.length();
+ if( l >= length ) return s;
+ string reply = s;
+ return reply.append( length-l, c );
+ }
+
+ string
+ lpad( const string & s, size_t length, char c )
+ {
+ string::size_type l = s.length();
+ if( l >= length ) return s;
+ string reply = s;
+ return reply.insert( 0, length-l, c );
+ }
+
+ bool
+ starts_with( const string & s, const string & substr )
+ {
+ return s.compare(0, substr.length(), substr) == 0;
+ }
+
+ bool
+ ends_with( const string & s, const string & substr )
+ {
+ if( substr.length() > s.length() )
+ return false;
+ return s.compare( s.length() - substr.length(),
+ substr.length(),
+ substr ) == 0;
+ }
+
+ string simplify(const string& s)
+ {
+ string result; // reserve size of 's'?
+ string::const_iterator it = s.begin(),
+ end = s.end();
+
+ // advance to first non-space char - simplifes logic in main loop,
+ // since we can always prepend a single space when we see a
+ // space -> non-space transition
+ for (; (it != end) && isspace(*it); ++it) { /* nothing */ }
+
+ bool lastWasSpace = false;
+ for (; it != end; ++it) {
+ char c = *it;
+ if (isspace(c)) {
+ lastWasSpace = true;
+ continue;
+ }
+
+ if (lastWasSpace) {
+ result.push_back(' ');
+ }
+
+ lastWasSpace = false;
+ result.push_back(c);
+ }
+
+ return result;
+ }
+
+ int to_int(const std::string& s, int base)
+ {
+ stringstream ss(s);
+ switch (base) {
+ case 8: ss >> std::oct; break;
+ case 16: ss >> std::hex; break;
+ default: break;
+ }
+
+ int result;
+ ss >> result;
+ return result;
+ }
+
+ int compare_versions(const string& v1, const string& v2)
+ {
+ vector<string> v1parts(split(v1, "."));
+ vector<string> v2parts(split(v2, "."));
+
+ int lastPart = std::min(v1parts.size(), v2parts.size());
+ for (int part=0; part < lastPart; ++part) {
+ int part1 = to_int(v1parts[part]);
+ int part2 = to_int(v2parts[part]);
+
+ if (part1 != part2) {
+ return part1 - part2;
+ }
+ } // of parts iteration
+
+ // reached end - longer wins
+ return v1parts.size() - v2parts.size();
+ }
+
+ string join(const string_list& l, const string& joinWith)
{
- result.assign( s.substr( pos ) );
+ string result;
+ unsigned int count = l.size();
+ for (unsigned int i=0; i < count; ++i) {
+ result += l[i];
+ if (i < (count - 1)) {
+ result += joinWith;
+ }
+ }
+
+ return result;
}
+
+ string uppercase(const string &s) {
+ string rslt(s);
+ for(string::iterator p = rslt.begin(); p != rslt.end(); p++){
+ *p = toupper(*p);
+ }
+ return rslt;
+ }
+
- return result;
+#ifdef SG_WINDOWS
+ #include <windows.h>
+#endif
+
+std::string convertWindowsLocal8BitToUtf8(const std::string& a)
+{
+#ifdef SG_WINDOWS
+ DWORD flags = 0;
+ std::vector<wchar_t> wideString;
+
+ // call to query transform size
+ int requiredWideChars = MultiByteToWideChar(CP_ACP, flags, a.c_str(), a.size(),
+ NULL, 0);
+ // allocate storage and call for real
+ wideString.resize(requiredWideChars);
+ MultiByteToWideChar(CP_ACP, flags, a.c_str(), a.size(),
+ wideString.data(), wideString.size());
+
+ // now convert back down to UTF-8
+ std::vector<char> result;
+ int requiredUTF8Chars = WideCharToMultiByte(CP_UTF8, flags,
+ wideString.data(), wideString.size(),
+ NULL, 0, NULL, NULL);
+ result.resize(requiredUTF8Chars);
+ WideCharToMultiByte(CP_UTF8, flags,
+ wideString.data(), wideString.size(),
+ result.data(), result.size(), NULL, NULL);
+ return std::string(result.data(), result.size());
+#else
+ return a;
+#endif
}
-//
-string
-trimright( const string& s, const string& trimmings )
+static const std::string base64_chars =
+"ABCDEFGHIJKLMNOPQRSTUVWXYZ"
+"abcdefghijklmnopqrstuvwxyz"
+"0123456789+/";
+
+static const unsigned char base64_decode_map[128] =
{
- string result;
+ 127, 127, 127, 127, 127, 127, 127, 127, 127, 127,
+ 127, 127, 127, 127, 127, 127, 127, 127, 127, 127,
+ 127, 127, 127, 127, 127, 127, 127, 127, 127, 127,
+ 127, 127, 127, 127, 127, 127, 127, 127, 127, 127,
+ 127, 127, 127, 62, 127, 127, 127, 63, 52, 53,
+ 54, 55, 56, 57, 58, 59, 60, 61, 127, 127,
+ 127, 64, 127, 127, 127, 0, 1, 2, 3, 4,
+ 5, 6, 7, 8, 9, 10, 11, 12, 13, 14,
+ 15, 16, 17, 18, 19, 20, 21, 22, 23, 24,
+ 25, 127, 127, 127, 127, 127, 127, 26, 27, 28,
+ 29, 30, 31, 32, 33, 34, 35, 36, 37, 38,
+ 39, 40, 41, 42, 43, 44, 45, 46, 47, 48,
+ 49, 50, 51, 127, 127, 127, 127, 127
+};
+
+
+static inline bool is_base64(unsigned char c) {
+ return (isalnum(c) || (c == '+') || (c == '/'));
+}
- string::size_type pos = s.find_last_not_of( trimmings );
- if ( pos == string::npos )
- {
- // Not found, return the original string.
- result = s;
+static bool is_whitespace(unsigned char c) {
+ return ((c == ' ') || (c == '\r') || (c == '\n'));
+}
+
+void decodeBase64(const std::string& encoded_string, std::vector<unsigned char>& ret)
+{
+ int in_len = encoded_string.size();
+ int i = 0;
+ int j = 0;
+ int in_ = 0;
+ unsigned char char_array_4[4], char_array_3[3];
+
+ while (in_len-- && ( encoded_string[in_] != '=')) {
+ if (is_whitespace( encoded_string[in_])) {
+ in_++;
+ continue;
+ }
+
+ if (!is_base64(encoded_string[in_])) {
+ break;
}
- else
+
+ char_array_4[i++] = encoded_string[in_]; in_++;
+ if (i ==4) {
+ for (i = 0; i <4; i++)
+ char_array_4[i] = base64_decode_map[char_array_4[i]];
+
+ char_array_3[0] = (char_array_4[0] << 2) + ((char_array_4[1] & 0x30) >> 4);
+ char_array_3[1] = ((char_array_4[1] & 0xf) << 4) + ((char_array_4[2] & 0x3c) >> 2);
+ char_array_3[2] = ((char_array_4[2] & 0x3) << 6) + char_array_4[3];
+
+ for (i = 0; (i < 3); i++)
+ ret.push_back(char_array_3[i]);
+ i = 0;
+ }
+ }
+
+ if (i) {
+ for (j = i; j <4; j++)
+ char_array_4[j] = 0;
+
+ for (j = 0; j <4; j++)
+ char_array_4[j] = base64_decode_map[char_array_4[j]];
+
+ char_array_3[0] = (char_array_4[0] << 2) + ((char_array_4[1] & 0x30) >> 4);
+ char_array_3[1] = ((char_array_4[1] & 0xf) << 4) + ((char_array_4[2] & 0x3c) >> 2);
+ char_array_3[2] = ((char_array_4[2] & 0x3) << 6) + char_array_4[3];
+
+ for (j = 0; (j < i - 1); j++) ret.push_back(char_array_3[j]);
+ }
+}
+
+const char hexChar[] = {'0', '1', '2', '3', '4', '5', '6', '7', '8', '9', 'a', 'b', 'c', 'd', 'e', 'f'};
+
+std::string encodeHex(const std::string& bytes)
+{
+ std::string hex;
+ size_t count = bytes.size();
+ for (unsigned int i=0; i<count;++i) {
+ unsigned char c = bytes[i];
+ hex.push_back(hexChar[c >> 4]);
+ hex.push_back(hexChar[c & 0x0f]);
+ }
+
+ return hex;
+}
+
+std::string encodeHex(const unsigned char* rawBytes, unsigned int length)
+{
+ std::string hex;
+ for (unsigned int i=0; i<length;++i) {
+ unsigned char c = *rawBytes++;
+ hex.push_back(hexChar[c >> 4]);
+ hex.push_back(hexChar[c & 0x0f]);
+ }
+
+ return hex;
+}
+
+//------------------------------------------------------------------------------
+std::string unescape(const char* s)
+{
+ std::string r;
+ while( *s )
+ {
+ if( *s != '\\' )
{
- result.assign( s.substr( 0, pos+1 ) );
+ r += *s++;
+ continue;
}
- return result;
+ if( !*++s )
+ break;
+
+ if (*s == '\\') {
+ r += '\\';
+ } else if (*s == 'n') {
+ r += '\n';
+ } else if (*s == 'r') {
+ r += '\r';
+ } else if (*s == 't') {
+ r += '\t';
+ } else if (*s == 'v') {
+ r += '\v';
+ } else if (*s == 'f') {
+ r += '\f';
+ } else if (*s == 'a') {
+ r += '\a';
+ } else if (*s == 'b') {
+ r += '\b';
+ } else if (*s == 'x') {
+ if (!*++s)
+ break;
+ int v = 0;
+ for (int i = 0; i < 2 && isxdigit(*s); i++, s++)
+ v = v * 16 + (isdigit(*s) ? *s - '0' : 10 + tolower(*s) - 'a');
+ r += v;
+ continue;
+
+ } else if (*s >= '0' && *s <= '7') {
+ int v = *s++ - '0';
+ for (int i = 0; i < 3 && *s >= '0' && *s <= '7'; i++, s++)
+ v = v * 8 + *s - '0';
+ r += v;
+ continue;
+
+ } else {
+ r += *s;
+ }
+ s++;
+ }
+ return r;
}
-//
-string
-trim( const string& s, const string& trimmings )
+string sanitizePrintfFormat(const string& input)
{
- return trimright( trimleft( s, trimmings ), trimmings );
+ string::size_type i = input.find("%n");
+ if (i != string::npos) {
+ SG_LOG(SG_IO, SG_WARN, "sanitizePrintfFormat: bad format string:" << input);
+ return string();
+ }
+
+ return input;
}
+} // end namespace strutils
+
+} // end namespace simgear