TextConvert.cpp 3.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165
  1. #include "StdAfx.h"
  2. #include "TextConvert.h"
  3. static BYTE kUtf8Limits[5] = { 0xC0, 0xE0, 0xF0, 0xF8, 0xFC };
  4. CTextConvert::CTextConvert()
  5. {
  6. }
  7. CTextConvert::~CTextConvert()
  8. {
  9. }
  10. CStringW CTextConvert::MultiByteToUnicodeString(const CStringA &srcString)
  11. {
  12. CStringW resultString;
  13. if(!srcString.IsEmpty())
  14. {
  15. int numChars = MultiByteToWideChar(CP_ACP, 0, srcString,
  16. srcString.GetLength(), resultString.GetBuffer(srcString.GetLength()),
  17. srcString.GetLength() + 1);
  18. resultString.ReleaseBuffer(numChars);
  19. }
  20. return resultString;
  21. }
  22. CStringA CTextConvert::UnicodeStringToMultiByte(const CStringW &srcString)
  23. {
  24. CStringA resultString;
  25. if(!srcString.IsEmpty())
  26. {
  27. int numRequiredBytes = srcString.GetLength() * sizeof(wchar_t);
  28. int numChars = WideCharToMultiByte(CP_ACP, 0, srcString,
  29. srcString.GetLength(), resultString.GetBuffer(numRequiredBytes),
  30. numRequiredBytes + 1, NULL, NULL);
  31. resultString.ReleaseBuffer(numChars);
  32. }
  33. return resultString;
  34. }
  35. CStringA CTextConvert::ConvertToChar(const CString &src)
  36. {
  37. #ifdef _UNICODE
  38. return UnicodeStringToMultiByte(src);
  39. #else
  40. return src;
  41. #endif
  42. }
  43. bool CTextConvert::ConvertFromUTF8(const CStringA &src, CString &dest)
  44. {
  45. #ifdef _UNICODE
  46. dest.Empty();
  47. for(int i = 0; i < src.GetLength();)
  48. {
  49. BYTE c = (BYTE)src[i++];
  50. if (c < 0x80)
  51. {
  52. dest += (wchar_t)c;
  53. continue;
  54. }
  55. if(c < 0xC0)
  56. {
  57. dest = src;
  58. return false;
  59. }
  60. int numAdds;
  61. for (numAdds = 1; numAdds < 5; numAdds++)
  62. if (c < kUtf8Limits[numAdds])
  63. break;
  64. UINT value = (c - kUtf8Limits[numAdds - 1]);
  65. do
  66. {
  67. if (i >= src.GetLength())
  68. {
  69. dest = src;
  70. return false;
  71. }
  72. BYTE c2 = (BYTE)src[i++];
  73. if (c2 < 0x80 || c2 >= 0xC0)
  74. {
  75. dest = src;
  76. return false;
  77. }
  78. value <<= 6;
  79. value |= (c2 - 0x80);
  80. numAdds--;
  81. }while(numAdds > 0);
  82. if (value < 0x10000)
  83. {
  84. dest += (wchar_t)(value);
  85. }
  86. else
  87. {
  88. value -= 0x10000;
  89. if (value >= 0x100000)
  90. {
  91. dest = src;
  92. return false;
  93. }
  94. dest += (wchar_t)(0xD800 + (value >> 10));
  95. dest += (wchar_t)(0xDC00 + (value & 0x3FF));
  96. }
  97. }
  98. #else
  99. dest = src;
  100. #endif
  101. return true;
  102. }
  103. bool CTextConvert::ConvertToUTF8(const CString &src, CStringA &dest)
  104. {
  105. #ifdef _UNICODE
  106. dest.Empty();
  107. for(int i = 0; i < src.GetLength();)
  108. {
  109. UINT value = (UINT)src[i++];
  110. if (value < 0x80)
  111. {
  112. dest += (char)value;
  113. continue;
  114. }
  115. if (value >= 0xD800 && value < 0xE000)
  116. {
  117. if (value >= 0xDC00)
  118. {
  119. dest = src;
  120. return false;
  121. }
  122. if (i >= src.GetLength())
  123. {
  124. dest = src;
  125. return false;
  126. }
  127. UINT c2 = (UINT)src[i++];
  128. if (c2 < 0xDC00 || c2 >= 0xE000)
  129. {
  130. dest = src;
  131. return false;
  132. }
  133. value = ((value - 0xD800) << 10) | (c2 - 0xDC00);
  134. }
  135. int numAdds;
  136. for (numAdds = 1; numAdds < 5; numAdds++)
  137. if (value < (((UINT)1) << (numAdds * 5 + 6)))
  138. break;
  139. dest += (char)(kUtf8Limits[numAdds - 1] + (value >> (6 * numAdds)));
  140. do
  141. {
  142. numAdds--;
  143. dest += (char)(0x80 + ((value >> (6 * numAdds)) & 0x3F));
  144. }
  145. while(numAdds > 0);
  146. }
  147. #else
  148. dest = src;
  149. #endif
  150. return true;
  151. }