-
Notifications
You must be signed in to change notification settings - Fork 32
/
Copy pathStrConv.cpp
118 lines (105 loc) · 2.64 KB
/
StrConv.cpp
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
#include "StrConv.h"
#if defined( __linux__ ) || defined(__APPLE__) || defined(__ANDROID__)
inline int is_high_surrogate(char16_t uc) { return (uc & 0xfffffc00) == 0xd800; }
inline int is_low_surrogate(char16_t uc) { return (uc & 0xfffffc00) == 0xdc00; }
inline char32_t surrogate_to_utf32(char16_t high, char16_t low) {
return (high << 10) + low - 0x35fdc00;
}
// The algorithm is based on this answer:
//https://stackoverflow.com/a/23920015/2134488
//
void convertUTF16ToUTF32(char16_t *input,
const size_t input_size,
std::basic_string<wchar_t> &output)
{
int i = 0;
const char16_t * const end = input + input_size;
while (input < end) {
const char16_t uc = *input++;
if (!((uc - 0xd800u) < 2048u)) {
output[i++] = uc;
}
else {
if (is_high_surrogate(uc) && input < end && is_low_surrogate(*input)) {
output[i++] = (wchar_t)surrogate_to_utf32(uc, *input++);
}
else {
output[i++] = 0; //ERROR
}
}
}
}
// The algorithm is based on this answer:
//https://stackoverflow.com/questions/955484/is-it-possible-to-convert-utf32-text-to-utf16-using-only-windows-api
//
unsigned int convertUTF32ToUTF16(const wchar_t *input, size_t input_size, char16_t *output)
{
char16_t *start = output;
const wchar_t * const end = input + input_size;
while (input < end) {
const wchar_t cUTF32 = *input++;
if (cUTF32 < 0x10000)
{
*output++ = cUTF32;
}
else {
unsigned int t = cUTF32 - 0x10000;
wchar_t h = (((t << 12) >> 22) + 0xD800);
wchar_t l = (((t << 22) >> 22) + 0xDC00);
*output++ = h;
*output++ = (l & 0x0000FFFF);
}
}
return (output - start) * 2; // size in bytes
}
#endif
inline void tolowerPtr(char16_t*);
// Приведение к нижнему регистру только для Кириллицы и Латиницы
//
void tolowerStr(std::u16string & s)
{
char16_t* c = const_cast<char16_t*>(s.c_str());
const size_t l = s.size();
for (char16_t* c2 = c; c2 < c + l; c2++)tolowerPtr(c2);
};
inline void tolowerPtr(char16_t *p)
{
if (((*p >= u'А') && (*p <= u'Я')) || ((*p >= u'A') && (*p <= u'Z')))
*p = *p + 32;
else if (*p == u'Ё')
*p = u'ё';
}
void strrev_u16(char16_t *str, int len)
{
int i;
int j;
char16_t a;
for (i = 0, j = len - 1; i < j; i++, j--)
{
a = str[i];
str[i] = str[j];
str[j] = a;
}
}
int itoa_u16(int num, char16_t* str, int len, int base)
{
int sum = num;
int i = 0;
int digit;
if (len == 0)
return -1;
do
{
digit = sum % base;
if (digit < 0xA)
str[i++] = u'0' + digit;
else
str[i++] = u'A' + digit - 0xA;
sum /= base;
} while (sum && (i < (len - 1)));
if (i == (len - 1) && sum)
return -1;
str[i] = '\0';
strrev_u16(str, i);
return i;
}