// utf32.cpp (forked from emscripten-core/emscripten)
// Copyright 2013 The Emscripten Authors. All rights reserved.
// Emscripten is available under two separate licenses, the MIT license and the
// University of Illinois/NCSA Open Source License. Both these licenses can be
// found in the LICENSE file.
#include <stdio.h>
#include <wchar.h>
#include <cassert>
#include <string>
#include <vector>
#include <emscripten.h>
// Element types of the buffers that the JS side writes UTF-32 / UTF-16 text
// into (see main()).
using utf32 = unsigned int;
using utf16 = unsigned short;
// Lists the JS-side helpers that the EM_ASM blocks in main() call by name
// (UTF32ToString / stringToUTF32 and their UTF-16 counterparts).
EM_JS_DEPS(deps, "$UTF32ToString,$stringToUTF32,$UTF16ToString,$stringToUTF16");
// This code tests that Unicode std::wstrings can be marshalled between C++ and JS.
int main() {
// U+2603 is snowman,
// U+20AC is the Euro sign,
// U+2007C is a Chinese Han character that looks like three raindrops.
std::wstring wstr = L"abc\u2603\u20AC\U0002007C123 --- abc\u2603\u20AC\U0002007C123";
printf("sizeof(wchar_t): %d.\n", (int)sizeof(wchar_t));
if (sizeof(wchar_t) == 4) {
utf32 *memory = new utf32[wstr.length()+1];
EM_ASM({
var str = UTF32ToString($0);
out(str);
var numBytesWritten = stringToUTF32(str, $1, Number($2));
if (numBytesWritten != 23*4) throw 'stringToUTF32 wrote an invalid length ' + numBytesWritten;
}, wstr.c_str(), memory, (wstr.length()+1)*sizeof(utf32));
// Compare memory to confirm that the string is intact after taking a route
// through JS side.
const utf32 *srcPtr = reinterpret_cast<const utf32 *>(wstr.c_str());
for (int i = 0;; ++i) {
assert(memory[i] == srcPtr[i]);
if (srcPtr[i] == 0)
break;
}
EM_ASM({
var str = UTF32ToString($0);
out(str);
var numBytesWritten = stringToUTF32(str, $1, Number($2));
if (numBytesWritten != 5*4) throw 'stringToUTF32 wrote an invalid length ' + numBytesWritten;
}, wstr.c_str(), memory, 6*sizeof(utf32));
assert(memory[5] == 0);
delete[] memory;
printf("OK (long).\n");
} else {
assert(sizeof(wchar_t) == 2);
// sizeof(wchar_t) == 2, and we're building with -fshort-wchar.
utf16 *memory = new utf16[2*wstr.length()+1];
EM_ASM({
var str = UTF16ToString($0);
out(str);
var numBytesWritten = stringToUTF16(str, $1, Number($2));
if (numBytesWritten != 25*2) throw 'stringToUTF16 wrote an invalid length ' + numBytesWritten;
}, wstr.c_str(), memory, (2*wstr.length()+1)*sizeof(utf16));
// Compare memory to confirm that the string is intact after taking a route
// through JS side.
const utf16 *srcPtr = reinterpret_cast<const utf16 *>(wstr.c_str());
for (int i = 0;; ++i) {
assert(memory[i] == srcPtr[i]);
if (srcPtr[i] == 0)
break;
}
EM_ASM({
var str = UTF16ToString($0);
out(str);
var numBytesWritten = stringToUTF16(str, $1, Number($2));
if (numBytesWritten != 5*2) throw 'stringToUTF16 wrote an invalid length ' + numBytesWritten;
}, wstr.c_str(), memory, 6*sizeof(utf16));
assert(memory[5] == 0);
delete[] memory;
printf("OK (short).\n");
}
}