/[winpt]/trunk/Src/wptUTF8.cpp

Diff of /trunk/Src/wptUTF8.cpp

Parent Directory | Revision Log | View Patch Patch

-revision 187 by twoaday,
Wed Mar 22 11:04:20 2006 UTC
+revision 464 by twoaday,
Tue Oct  9 09:27:57 2012 UTC
 Line 1
  /* wptUTF8.cpp - UTF8 conversion
-  *      Copyright (C) 2002, 2004, 2005, 2006 Timo Schulz
+  *      Copyright (C) 2002, 2004, 2005, 2006, 2009, 2012 Timo Schulz
   *
   * This file is part of WinPT.
   *
 Line 12
   * but WITHOUT ANY WARRANTY; without even the implied warranty of
   * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
   * GNU General Public License for more details.
-  *
-  * You should have received a copy of the GNU General Public License
-  * along with WinPT; if not, write to the Free Software Foundation,
-  * Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA
   */
  #ifdef HAVE_CONFIG_H
  #include <config.h>
  #endif
-Line 32
+Line 27
  #include "wptErrors.h"
+ /* Byte order mark that is usually used to indicate that the following
+    data is encoded in UTF-8. */
+ BYTE UTF8_BOM[] = {0xEF, 0xBB, 0xBF};
+ /**
+  * Convert the given input string, which is encoded with the locale
+  * setting, into UTF-8 representation.
+  */
  char*
  native_to_utf8 (const char *string)
  {
-     wchar_t *result;
+     int n = MultiByteToWideChar (GetACP (), 0, string, -1, NULL, 0);
-     char *native;
-     int n;
-     n = MultiByteToWideChar (GetACP (), 0, string, -1, NULL, 0);
      if (n < 0)
          return NULL;
-     result = (wchar_t*)malloc ((n+1) * sizeof *result);
+     wchar_t *result = new wchar_t[n+1];
      if (!result)
          BUG (0);
      n = MultiByteToWideChar (GetACP (), 0, string, -1, result, n);
      if (n < 0) {
-         free (result);
+         free_if_alloc (result);
          return NULL;
      }
 Line 57 
 native_to_utf8 (const char *string)
      if (n < 0)
          return NULL;
-     native = (char*)malloc (n+1);
+     char *native = new char[n + 1];
      if (!native)
          BUG (0);
+     memset(native, 0, n + 1);
      n = WideCharToMultiByte (CP_UTF8, 0, result, -1, native, n, NULL, NULL);
      if (n < 0) {
-         free (result);
+         free_if_alloc (result);
          return NULL;
      }
-     free (result);
+     free_if_alloc (result);
      return native;
  }
- /* Convert utf8 string @str to native CP. */
+ /**
+  * Convert a NUL-terminated UTF-8 string into a newly allocated
+  * UTF-16 string.
+  *
+  * @param string  NUL-terminated UTF-8 input.
+  * @param retlen  Optional (may be NULL). On success it receives the
+  *                count returned by MultiByteToWideChar; because the
+  *                input length is passed as -1, that count includes
+  *                the terminating NUL.
+  * @return A buffer allocated with new[] that the caller must release,
+  *         or NULL if the conversion fails. @retlen is left untouched
+  *         on failure.
+  */
+ wchar_t*
+ utf8_to_utf16(const char *string, size_t *retlen)
+ {
+     /* First pass: ask for the required size in wide characters.
+        MultiByteToWideChar reports failure by returning 0, never a
+        negative value, so the check has to be <= 0. */
+     int n = MultiByteToWideChar(CP_UTF8, 0, string, -1, NULL, 0);
+     if (n <= 0)
+         return NULL;
+     wchar_t *result = new wchar_t[n + 1];
+     if (!result)
+         BUG(0);
+     /* Second pass: perform the actual conversion into the buffer. */
+     n = MultiByteToWideChar(CP_UTF8, 0, string, -1, result, n);
+     if (n <= 0) {
+         free_if_alloc(result);
+         return NULL;
+     }
+     if (retlen)
+         *retlen = n;
+     return result;
+ }
+ /**
+  * Convert the given string, which is encoded in UTF-8,
+  * into the locale setting.
+  */
  char*
  utf8_to_native (const char *string)
  {
-     wchar_t *result;
+     int n = MultiByteToWideChar (CP_UTF8, 0, string, -1, NULL, 0);
-     char *native;
-     int n;
-     n = MultiByteToWideChar (CP_UTF8, 0, string, -1, NULL, 0);
      if (n < 0)
          return NULL;
-     result = (wchar_t*)malloc ((n+1) * sizeof *result);
+     wchar_t *result = new wchar_t[n+1];
      if (!result)
          BUG (0);
      n = MultiByteToWideChar (CP_UTF8, 0, string, -1, result, n);
      if (n < 0) {
-         free (result);
+         free_if_alloc (result);
          return NULL;
      }
-Line 98 
 utf8_to_native (const char *string)
+Line 123 
 utf8_to_native (const char *string)
      if (n < 0)
          return NULL;
-     native = (char*)malloc (n+1);
+     char *native = new char[n + 1];
      if (!native)
          BUG (0);
+     memset(native, 0, n + 1);
      n = WideCharToMultiByte (GetACP (), 0, result, -1, native, n, NULL, NULL);
      if (n < 0) {
-         free (result);
+         free_if_alloc (result);
          return NULL;
      }
-     free (result);
+     free_if_alloc (result);
      return native;
  }
+ /**
+  * Return -1 if the given string contains any 8-bit characters.
+  * This is a helper to decide when to use UTF8 encoding.
+  */
  int
- is_8bit_string (const char * str)
+ is_8bit_string (const char *str)
  {
-     size_t i;
+     for (size_t i = 0; i < strlen (str); i++) {
-     for (i = 0; i < strlen (str); i++) {
          if (str[i] & 0x80)
              return -1;
      }

 Legend:



Removed from v.187
 


changed lines


 
Added in v.464
 Legend:



Removed from v.187
 


changed lines


 
Added in v.464
-Removed from v.187
+Added in v.464

[email protected]	ViewVC Help
Powered by ViewVC 1.1.26