14constexpr uint16_t kHigh[128] = {
15 0x00C7, 0x00FC, 0x00E9, 0x00E2, 0x00E4, 0x00E0, 0x00E5, 0x00E7,
16 0x00EA, 0x00EB, 0x00E8, 0x00EF, 0x00EE, 0x00EC, 0x00C4, 0x00C5,
17 0x00C9, 0x00E6, 0x00C6, 0x00F4, 0x00F6, 0x00F2, 0x00FB, 0x00F9,
18 0x00FF, 0x00D6, 0x00DC, 0x00A2, 0x00A3, 0x00A5, 0x20A7, 0x0192,
19 0x00E1, 0x00ED, 0x00F3, 0x00FA, 0x00F1, 0x00D1, 0x00AA, 0x00BA,
20 0x00BF, 0x2310, 0x00AC, 0x00BD, 0x00BC, 0x00A1, 0x00AB, 0x00BB,
21 0x2591, 0x2592, 0x2593, 0x2502, 0x2524, 0x2561, 0x2562, 0x2556,
22 0x2555, 0x2563, 0x2551, 0x2557, 0x255D, 0x255C, 0x255B, 0x2510,
23 0x2514, 0x2534, 0x252C, 0x251C, 0x2500, 0x253C, 0x255E, 0x255F,
24 0x255A, 0x2554, 0x2569, 0x2566, 0x2560, 0x2550, 0x256C, 0x2567,
25 0x2568, 0x2564, 0x2565, 0x2559, 0x2558, 0x2552, 0x2553, 0x256B,
26 0x256A, 0x2518, 0x250C, 0x2588, 0x2584, 0x258C, 0x2590, 0x2580,
27 0x03B1, 0x00DF, 0x0393, 0x03C0, 0x03A3, 0x03C3, 0x00B5, 0x03C4,
28 0x03A6, 0x0398, 0x03A9, 0x03B4, 0x221E, 0x03C6, 0x03B5, 0x2229,
29 0x2261, 0x00B1, 0x2265, 0x2264, 0x2320, 0x2321, 0x00F7, 0x2248,
30 0x00B0, 0x2219, 0x00B7, 0x221A, 0x207F, 0x00B2, 0x25A0, 0x00A0,
37 return (b < 0x80) ? b : kHigh[b - 0x80];
42 if (cp < 0x80)
return static_cast<uint8_t
>(cp);
46 case 0x00A6:
return 0x7C;
47 case 0x00A7:
return 0x15;
48 case 0x00B6:
return 0x14;
49 case 0x00E3:
return 0x83;
52 for (
int i = 0; i < 128; ++i) {
53 if (kHigh[i] == cp)
return static_cast<uint8_t
>(0x80 + i);
62 const uint8_t* r =
reinterpret_cast<const uint8_t*
>(s);
67 if ((c & 0x80) == 0) { out.push_back(
static_cast<char>(c)); ++r;
continue; }
68 else if ((c & 0xE0) == 0xC0) { cp = c & 0x1F; cont = 1; }
69 else if ((c & 0xF0) == 0xE0) { cp = c & 0x0F; cont = 2; }
70 else if ((c & 0xF8) == 0xF0) { cp = c & 0x07; cont = 3; }
71 else { ++r;
continue; }
74 for (uint8_t i = 0; i < cont; ++i) {
75 if ((*r & 0xC0) != 0x80) { ok =
false;
break; }
76 cp = (cp << 6) | (*r & 0x3F);
81 if (mapped) out.push_back(
static_cast<char>(mapped));
90 for (
const uint8_t* r =
reinterpret_cast<const uint8_t*
>(s); *r; ++r) {
93 out.push_back(
static_cast<char>(cp));
94 }
else if (cp < 0x800) {
95 out.push_back(
static_cast<char>(0xC0 | (cp >> 6)));
96 out.push_back(
static_cast<char>(0x80 | (cp & 0x3F)));
98 out.push_back(
static_cast<char>(0xE0 | (cp >> 12)));
99 out.push_back(
static_cast<char>(0x80 | ((cp >> 6) & 0x3F)));
100 out.push_back(
static_cast<char>(0x80 | (cp & 0x3F)));
Canonical CP437 <-> Unicode/UTF-8 codec.
std::string fromUtf8(const char *s)
Convert a UTF-8 string to CP437 bytes (unmapped characters are dropped; bytes that are not a valid UTF-8 lead byte are skipped).
std::string toUtf8(const char *s)
Convert CP437 bytes to a UTF-8 string.
uint8_t fromUnicode(uint32_t cp)
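Map a Unicode codepoint to its CP437 byte, or 0 if it has none (note that U+0000 itself also maps to 0). Codepoints below 0x80 map to themselves; U+00A6, U+00A7, U+00B6 and U+00E3 are special-cased to 0x7C, 0x15, 0x14 and 0x83 respectively.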
uint32_t toUnicode(uint8_t b)
Map a CP437 byte to its Unicode codepoint. 0x00-0x7F is ASCII.