subuniutil.cpp 4.1 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697
  1. /** BEGIN COPYRIGHT BLOCK
  2. * This Program is free software; you can redistribute it and/or modify it under
  3. * the terms of the GNU General Public License as published by the Free Software
  4. * Foundation; version 2 of the License.
  5. *
  6. * This Program is distributed in the hope that it will be useful, but WITHOUT
  7. * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
  8. * FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details.
  9. *
  10. * You should have received a copy of the GNU General Public License along with
  11. * this Program; if not, write to the Free Software Foundation, Inc., 59 Temple
  12. * Place, Suite 330, Boston, MA 02111-1307 USA.
  13. *
  14. * In addition, as a special exception, Red Hat, Inc. gives You the additional
  15. * right to link the code of this Program with code not covered under the GNU
  16. * General Public License ("Non-GPL Code") and to distribute linked combinations
  17. * including the two, subject to the limitations in this paragraph. Non-GPL Code
  18. * permitted under this exception must only link to the code of this Program
  19. * through those well defined interfaces identified in the file named EXCEPTION
  20. * found in the source code files (the "Approved Interfaces"). The files of
  21. * Non-GPL Code may instantiate templates or use macros or inline functions from
  22. * the Approved Interfaces without causing the resulting work to be covered by
  23. * the GNU General Public License. Only Red Hat, Inc. may make changes or
  24. * additions to the list of Approved Interfaces. You must obey the GNU General
  25. * Public License in all respects for all of the Program code and other code used
  26. * in conjunction with the Program except the Non-GPL Code covered by this
  27. * exception. If you modify this file, you may extend this exception to your
  28. * version of the file, but you are not obligated to do so. If you do not wish to
  29. * provide this exception without modification, you must delete this exception
  30. * statement from your version and license this file solely under the GPL without
  31. * exception.
  32. *
  33. *
  34. * Copyright (C) 2001 Sun Microsystems, Inc. Used by permission.
  35. * Copyright (C) 2005 Red Hat, Inc.
  36. * All rights reserved.
  37. * END COPYRIGHT BLOCK **/
  38. #include "subuniutil.h"
  39. // Copied: 2-8-2005
  40. // From: secuniutil.c
  41. unsigned long
  42. utf8getcc( const char** src )
  43. {
  44. register unsigned long c;
  45. register const unsigned char* s = (const unsigned char*)*src;
  46. switch (UTF8len [(*s >> 2) & 0x3F]) {
  47. case 0: /* erroneous: s points to the middle of a character. */
  48. c = (*s++) & 0x3F; goto more5;
  49. case 1: c = (*s++); break;
  50. case 2: c = (*s++) & 0x1F; goto more1;
  51. case 3: c = (*s++) & 0x0F; goto more2;
  52. case 4: c = (*s++) & 0x07; goto more3;
  53. case 5: c = (*s++) & 0x03; goto more4;
  54. case 6: c = (*s++) & 0x01; goto more5;
  55. more5: if ((*s & 0xC0) != 0x80) break; c = (c << 6) | ((*s++) & 0x3F);
  56. more4: if ((*s & 0xC0) != 0x80) break; c = (c << 6) | ((*s++) & 0x3F);
  57. more3: if ((*s & 0xC0) != 0x80) break; c = (c << 6) | ((*s++) & 0x3F);
  58. more2: if ((*s & 0xC0) != 0x80) break; c = (c << 6) | ((*s++) & 0x3F);
  59. more1: if ((*s & 0xC0) != 0x80) break; c = (c << 6) | ((*s++) & 0x3F);
  60. break;
  61. }
  62. *src = (const char*)s;
  63. return c;
  64. }
  65. //
  66. wchar_t *
  67. ASCIIToUnicode( const char *buf, wchar_t *uni, int inUnilen )
  68. /* Convert the 0-terminated UTF-8 string 'buf' to 0-terminated UCS-2;
  69. write the result into uni, truncated (if necessary) to fit in 0..unilen-1. */
  70. /* XXX This function should be named UTF8ToUnicode */
  71. /* XXX unilen should be size_t, not int */
  72. {
  73. auto size_t unilen = (size_t)inUnilen; /* to get rid of warnings for now */
  74. auto size_t i;
  75. if (unilen > 0 && buf && uni) {
  76. for (i = 0; i < unilen; ++i) {
  77. register unsigned long c = utf8getcc( &buf );
  78. if (c >= 0xfffeUL) c = 0xfffdUL; /* REPLACEMENT CHARACTER */
  79. if (0 == (uni[i] = (wchar_t)c)) break;
  80. }
  81. if (i >= unilen && unilen > 0) {
  82. uni[unilen-1] = 0;
  83. }
  84. }
  85. return uni;
  86. }
  87. wchar_t *
  88. StrToUnicode( const char *buf )
  89. {
  90. wchar_t unibuf[1024];
  91. ASCIIToUnicode( buf, unibuf, sizeof(unibuf) );
  92. return _wcsdup( unibuf );
  93. }
  94. // End Copy