forked from monero-project/monero
Compare commits
87 Commits
master
...
release-v0
Author | SHA1 | Date |
---|---|---|
luigi1111 | 7bd1ed03dd | 4 years ago |
luigi1111 | 9006119fba | 4 years ago |
Howard Chu | 3aae649738 | 4 years ago |
moneromooo-monero | 03254742e5 | 4 years ago |
Howard Chu | e416f56f31 | 4 years ago |
Howard Chu | 2f481da900 | 4 years ago |
luigi1111 | c9aad8a38b | 4 years ago |
luigi1111 | 7f8fe816f4 | 4 years ago |
moneromooo-monero | 870a7b5201 | 4 years ago |
moneromooo-monero | 5b761d0186 | 4 years ago |
moneromooo-monero | c02d7621a4 | 4 years ago |
moneromooo-monero | 0678fc1f97 | 4 years ago |
selsta | f37009364a | 4 years ago |
luigi1111 | a498a1b4ce | 4 years ago |
luigi1111 | 4627b0f3e2 | 4 years ago |
luigi1111 | 829cbfd700 | 4 years ago |
luigi1111 | efe1bfe7a1 | 4 years ago |
luigi1111 | cd9acb3a5b | 4 years ago |
luigi1111 | b0a470d18f | 4 years ago |
luigi1111 | fcac8f5aff | 4 years ago |
Dusan Klinec | 19bb72d020 | 4 years ago |
selsta | cc19397b48 | 4 years ago |
moneromooo-monero | 8eaf0e189f | 4 years ago |
selsta | fa199f20af | 4 years ago |
moneromooo-monero | bca61e4fa6 | 4 years ago |
luigi1111 | f0ada2f22b | 4 years ago |
luigi1111 | 8a850ed742 | 4 years ago |
luigi1111 | 44e3875190 | 4 years ago |
luigi1111 | d825252b7d | 4 years ago |
luigi1111 | 1336992a5b | 4 years ago |
luigi1111 | e78387936e | 4 years ago |
luigi1111 | 8e0435876c | 4 years ago |
luigi1111 | 79f4af310e | 4 years ago |
moneromooo-monero | a67c634f89 | 4 years ago |
Lee Clagett | 3b390fba9c | 4 years ago |
moneromooo-monero | b7812d1674 | 4 years ago |
moneromooo-monero | 0a19785e99 | 4 years ago |
moneromooo-monero | 0569e635cf | 4 years ago |
moneromooo-monero | 23df29d8d6 | 4 years ago |
moneromooo-monero | e3068346ee | 4 years ago |
moneromooo-monero | 96b7697177 | 4 years ago |
moneromooo-monero | 5285ecc3d6 | 4 years ago |
François Colas | 4e6d587275 | 4 years ago |
luigi1111 | 25419b4bfb | 4 years ago |
selsta | f50a6c5aed | 4 years ago |
luigi1111 | cf4add7899 | 4 years ago |
luigi1111 | e28d291330 | 4 years ago |
luigi1111 | 4f6dbcd00e | 4 years ago |
luigi1111 | 062cf63959 | 4 years ago |
luigi1111 | 343acd3025 | 4 years ago |
moneromooo-monero | 0d92fe5234 | 4 years ago |
moneromooo-monero | ada8172b46 | 4 years ago |
rbrunner7 | c5c85925e2 | 4 years ago |
Doyle | 438b84690e | 4 years ago |
luigi1111 | eed8a4e8a6 | 4 years ago |
luigi1111 | b82af557f5 | 4 years ago |
luigi1111 | 0161cb79a1 | 4 years ago |
luigi1111 | f28026b86f | 4 years ago |
luigi1111 | cb75003642 | 4 years ago |
luigi1111 | 8fb0d7e0b4 | 4 years ago |
luigi1111 | 3578ce9fb6 | 4 years ago |
luigi1111 | f8642bf95c | 4 years ago |
luigi1111 | da04c5fb48 | 4 years ago |
luigi1111 | 278f78e877 | 4 years ago |
moneromooo-monero | 99d702e28b | 4 years ago |
moneromooo-monero | cef39dc313 | 4 years ago |
moneromooo-monero | 705c78b797 | 4 years ago |
moneromooo-monero | 4291344f80 | 4 years ago |
moneromooo-monero | bbab044c92 | 4 years ago |
moneromooo-monero | f01d529bdb | 4 years ago |
moneromooo-monero | f52697729d | 4 years ago |
moneromooo-monero | bb4d95c98f | 4 years ago |
moneromooo-monero | 44e3782b4d | 4 years ago |
selsta | 7633ba059c | 4 years ago |
selsta | 4a9c3aca03 | 4 years ago |
moneromooo-monero | 7209db839c | 4 years ago |
luigi1111 | 4987161fa6 | 4 years ago |
luigi1111 | a67a9fc9c4 | 4 years ago |
luigi1111 | 87490c541f | 4 years ago |
luigi1111 | a763ea7cf8 | 4 years ago |
selsta | f35ced6d7f | 4 years ago |
moneromooo-monero | 1b48f325b8 | 4 years ago |
Lee Clagett | cc40ce1b3f | 4 years ago |
Dusan Klinec | ab4429346d | 4 years ago |
iDunk5400 | 82afc5ff13 | 4 years ago |
luigi1111 | 309211fd6a | 4 years ago |
selsta | 08a45c51a0 | 4 years ago |
Binary file not shown.
@ -0,0 +1,114 @@
|
||||
// Copyright (c) 2019, The Monero Project
|
||||
//
|
||||
// All rights reserved.
|
||||
//
|
||||
// Redistribution and use in source and binary forms, with or without modification, are
|
||||
// permitted provided that the following conditions are met:
|
||||
//
|
||||
// 1. Redistributions of source code must retain the above copyright notice, this list of
|
||||
// conditions and the following disclaimer.
|
||||
//
|
||||
// 2. Redistributions in binary form must reproduce the above copyright notice, this list
|
||||
// of conditions and the following disclaimer in the documentation and/or other
|
||||
// materials provided with the distribution.
|
||||
//
|
||||
// 3. Neither the name of the copyright holder nor the names of its contributors may be
|
||||
// used to endorse or promote products derived from this software without specific
|
||||
// prior written permission.
|
||||
//
|
||||
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY
|
||||
// EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
|
||||
// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL
|
||||
// THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
|
||||
// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
|
||||
// PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
|
||||
// INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
|
||||
// STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF
|
||||
// THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
||||
|
||||
#pragma once
|
||||
|
||||
#include <cctype>
|
||||
#include <cwchar>
|
||||
#include <stdexcept>
|
||||
|
||||
namespace tools
{
  /**
   * @brief Re-encode a UTF-8 string code point by code point, optionally
   *        mapping every code point through a transform.
   *
   * Each code point of `s` is decoded, passed through `t`, and the value
   * returned by `t` is appended to the result in the shortest UTF-8 form
   * (1 to 4 bytes). With the default identity transform, well-formed input
   * is returned unchanged.
   *
   * @tparam T          String-like type: must be constructible from "" and
   *                    provide size(), data() and append(const char*, size_t).
   * @tparam Transform  Callable taking a wint_t and returning a value
   *                    convertible to wint_t. Defaults to a plain function
   *                    pointer so that the default argument below is usable
   *                    (a default argument alone cannot deduce Transform).
   * @param s  Input bytes, interpreted as UTF-8.
   * @param t  Per-code-point transform; identity by default.
   * @return   The transformed string, encoded as UTF-8.
   * @throws std::runtime_error("Invalid UTF-8") on an invalid lead byte, a
   *         truncated sequence, or a trailing byte that is not a
   *         continuation byte (10xxxxxx).
   * @throws std::runtime_error("Invalid code point UTF-8 transformation")
   *         if `t` returns a value above 0x10ffff.
   *
   * Overlong encodings in the input are not rejected; they are decoded and
   * re-emitted in shortest form.
   * NOTE(review): code points are carried in wint_t; on a platform where
   * wint_t is narrower than 21 bits, 4-byte sequences would be truncated -
   * confirm for the targeted platforms.
   */
  template<typename T, typename Transform = wint_t (*)(wint_t)>
  inline T utf8canonical(const T &s, Transform t = [](wint_t c)->wint_t { return c; })
  {
    T sc = "";
    size_t avail = s.size();
    const char *ptr = s.data();
    char wbuf[4];

    // Consume one continuation byte and return its 6 payload bits.
    auto continuation = [&ptr]() -> wint_t {
      const unsigned char c = static_cast<unsigned char>(*ptr++);
      if ((c & 0xc0) != 0x80)
        throw std::runtime_error("Invalid UTF-8");
      return c & 0x3f;
    };

    while (avail > 0)
    {
      // The lead byte determines the sequence length and the top payload bits.
      const unsigned char lead = static_cast<unsigned char>(*ptr++);
      --avail;

      wint_t cp;
      size_t trailing;
      if ((lead & 0x80) == 0)
      {
        cp = lead;
        trailing = 0;
      }
      else if ((lead & 0xe0) == 0xc0)
      {
        cp = lead & 0x1f;
        trailing = 1;
      }
      else if ((lead & 0xf0) == 0xe0)
      {
        cp = lead & 0x0f;
        trailing = 2;
      }
      else if ((lead & 0xf8) == 0xf0)
      {
        cp = lead & 0x07;
        trailing = 3;
      }
      else
        throw std::runtime_error("Invalid UTF-8");

      // Check the length before touching any trailing byte.
      if (avail < trailing)
        throw std::runtime_error("Invalid UTF-8");
      for (size_t i = 0; i < trailing; ++i)
        cp = (cp << 6) | continuation();
      avail -= trailing;

      cp = t(cp);

      // Encode the transformed code point in its shortest UTF-8 form.
      size_t bytes;
      if (cp <= 0x7f)
      {
        wbuf[0] = static_cast<char>(cp);
        bytes = 1;
      }
      else if (cp <= 0x7ff)
      {
        wbuf[0] = static_cast<char>(0xc0 | (cp >> 6));
        wbuf[1] = static_cast<char>(0x80 | (cp & 0x3f));
        bytes = 2;
      }
      else if (cp <= 0xffff)
      {
        wbuf[0] = static_cast<char>(0xe0 | (cp >> 12));
        wbuf[1] = static_cast<char>(0x80 | ((cp >> 6) & 0x3f));
        wbuf[2] = static_cast<char>(0x80 | (cp & 0x3f));
        bytes = 3;
      }
      else if (cp <= 0x10ffff)
      {
        wbuf[0] = static_cast<char>(0xf0 | (cp >> 18));
        wbuf[1] = static_cast<char>(0x80 | ((cp >> 12) & 0x3f));
        wbuf[2] = static_cast<char>(0x80 | ((cp >> 6) & 0x3f));
        wbuf[3] = static_cast<char>(0x80 | (cp & 0x3f));
        bytes = 4;
      }
      else
        throw std::runtime_error("Invalid code point UTF-8 transformation");

      sc.append(wbuf, bytes);
    }
    return sc;
  }
}
|
Loading…
Reference in new issue