decoder.js
1.38 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
/**
 * Extracts the 6 payload bits of a UTF-8 continuation byte (bit pattern 10xxxxxx).
 *
 * @param {number} b - The byte to inspect. `undefined` (as produced by reading
 *   past the end of a truncated input) is rejected like any other
 *   non-continuation value.
 * @returns {number} The low 6 bits of `b`.
 * @throws {Error} If the top two bits of `b` are not `10`.
 */
function con(b) {
  if ((b & 0xc0) !== 0x80) {
    throw new Error("invalid UTF-8 encoding");
  }
  return b & 0x3f;
}

/**
 * Validates a decoded code point.
 *
 * @param {number} min - Smallest value the sequence length is allowed to
 *   encode; anything below it is an overlong encoding.
 * @param {number} n - The decoded value.
 * @returns {number} `n`, unchanged, when it is acceptable.
 * @throws {Error} If `n` is not an integer, is below `min`, lies in the
 *   surrogate range 0xD800-0xDFFF, or is above 0x10FFFF.
 */
function code(min, n) {
  const isSurrogate = 0xd800 <= n && n < 0xe000;
  // The upper bound is 0x10FFFF (not 0xFFFF): 4-byte sequences legitimately
  // encode values in 0x10000..0x10FFFF.
  if (!Number.isInteger(n) || n < min || isSurrogate || n > 0x10ffff) {
    throw new Error("invalid UTF-8 encoding");
  }
  return n;
}

/**
 * Decodes a sequence of UTF-8 bytes into a string.
 *
 * @param {ArrayLike<number>} bytes - The bytes to decode (array or typed array).
 * @returns {string} The decoded text.
 * @throws {Error} "invalid UTF-8 encoding" if the input is malformed.
 */
export function decode(bytes) {
  // fromCodePoint (rather than fromCharCode) so that values above 0xFFFF
  // become a surrogate pair instead of being truncated to 16 bits.
  return _decode(bytes)
    .map((codePoint) => String.fromCodePoint(codePoint))
    .join("");
}

/**
 * Decodes UTF-8 bytes into an array of code points.
 *
 * Walks the input with an index instead of recursing, so the cost is linear
 * in the input length and large inputs do not exhaust the call stack.
 *
 * @param {ArrayLike<number>} bytes - The bytes to decode.
 * @returns {number[]} One validated code point per encoded character.
 * @throws {Error} "invalid UTF-8 encoding" on a bad lead byte, a missing or
 *   bad continuation byte, an overlong form, a surrogate, or a value above
 *   0x10FFFF.
 */
function _decode(bytes) {
  const codePoints = [];
  let i = 0;
  while (i < bytes.length) {
    const b1 = bytes[i];
    if (b1 < 0x80) {
      // 1 byte: 0xxxxxxx
      codePoints.push(code(0x0, b1));
      i += 1;
    } else if (b1 < 0xc0) {
      // A continuation byte cannot start a sequence.
      throw new Error("invalid UTF-8 encoding");
    } else if (b1 < 0xe0) {
      // 2 bytes: 110xxxxx 10xxxxxx
      const n = ((b1 & 0x1f) << 6) + con(bytes[i + 1]);
      codePoints.push(code(0x80, n));
      i += 2;
    } else if (b1 < 0xf0) {
      // 3 bytes: 1110xxxx 10xxxxxx 10xxxxxx
      const n =
        ((b1 & 0x0f) << 12) + (con(bytes[i + 1]) << 6) + con(bytes[i + 2]);
      codePoints.push(code(0x800, n));
      i += 3;
    } else if (b1 < 0xf8) {
      // 4 bytes: 11110xxx 10xxxxxx 10xxxxxx 10xxxxxx
      // Each group is shifted independently: 18, 12, 6 and 0 bits.
      const n =
        ((b1 & 0x07) << 18) +
        (con(bytes[i + 1]) << 12) +
        (con(bytes[i + 2]) << 6) +
        con(bytes[i + 3]);
      codePoints.push(code(0x10000, n));
      i += 4;
    } else {
      // 0xF8 and above (and non-numeric values) are never valid lead bytes.
      throw new Error("invalid UTF-8 encoding");
    }
  }
  return codePoints;
}