3 files changed, 2223 insertions, 0 deletions
diff --git a/src/3rdParty/colib/LICENSE b/src/3rdParty/colib/LICENSE
new file mode 100755
index 0000000..e0eddeb
--- /dev/null
+++ b/src/3rdParty/colib/LICENSE
@@ -0,0 +1,21 @@
+MIT License
+Copyright (c) 2020 colin
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.
diff --git a/src/3rdParty/colib/ljson.c b/src/3rdParty/colib/ljson.c
new file mode 100644
index 0000000..4daba07
--- /dev/null
+++ b/src/3rdParty/colib/ljson.c
@@ -0,0 +1,925 @@
+/**
+ * JSON parser: accepts UTF-8 text only; on the Lua side numbers are limited to 64 bits
+ */
+#define LUA_LIB
+#include <stdlib.h>
+#include <string.h>
+#include <stdint.h>
+#include <stdio.h>
+#include <ctype.h>
+#include <assert.h>
+#include <errno.h>
+#include <setjmp.h>
+#include <ctype.h>
+#include <limits.h>
+#include <float.h>
+#include <math.h>
+#include "lua.h"
+#include "lauxlib.h"
+#if LUA_VERSION_NUM > 501
+#ifndef LUA_COMPAT_5_1
+#ifndef lua_objlen
+#define lua_objlen lua_rawlen
+#endif // lua_objlen
+#endif // LUA_COMPAT_5_1
+#endif // LUA_VERSION_NUM
+// Allocator entry points, aliased here so a different allocator can be swapped in at one place
+#define co_malloc malloc
+#define co_free free
+#define co_realloc realloc
+#define co_calloc calloc
+#if !defined(likely)
+#if defined(__GNUC__) // branch-prediction hints when __builtin_expect is available
+#define likely(x)       (__builtin_expect(((x) != 0), 1))
+#define unlikely(x)     (__builtin_expect(((x) != 0), 0))
+#else // otherwise the hints reduce to the bare condition
+#define likely(x)       (x)
+#define unlikely(x)     (x)
+#endif
+#endif
+//-----------------------------------------------------------------------------
+// membuffer
+#define STACK_BUFF_SIZE 512
+typedef struct membuffer {
+        char *b;                // active storage: points at s until the buffer grows, then at a heap block
+        size_t sz;              // number of bytes currently in use
+        size_t cap;             // total capacity of the storage b points to
+        char s[STACK_BUFF_SIZE]; // inline storage used before any heap allocation
+} membuffer_t;
+// Put the buffer into its empty state, backed by the inline array
+static inline void membuffer_init(membuffer_t *buff) {
+        buff->sz = 0;
+        buff->cap = STACK_BUFF_SIZE;
+        buff->b = buff->s;
+}
+static inline void membuffer_add_size(membuffer_t *buff, size_t sz) {
+        // Account for sz bytes that were written directly past the current end
+        buff->sz = buff->sz + sz;
+}
+static inline void membuffer_reset(membuffer_t *buff) {
+        // Forget the contents but keep whatever storage is attached
+        buff->sz = (size_t)0;
+}
+static inline void membuffer_free(membuffer_t *buff) {
+        // Only heap storage is released; the inline array needs no cleanup
+        if (buff->b == NULL || buff->b == buff->s)
+                return;
+        co_free(buff->b);
+        buff->b = NULL;
+}
+// Grow the storage so it can hold at least needsz bytes (no-op when it already can).
+// Capacity doubles, or jumps straight to needsz when doubling is not enough.
+// Running out of memory is fatal: this function has no way to report failure, and
+// the append helpers write through buff->b without checking it.
+static inline void _membuffer_grow(membuffer_t *buff, size_t needsz) {
+        if (buff->cap >= needsz)
+                return;
+        size_t newcap = buff->cap * 2;
+        if (newcap < needsz)
+                newcap = needsz;
+        char *grown;
+        if (buff->b == buff->s) {
+                // First spill out of the inline array: copy the used bytes over
+                grown = (char*)co_malloc(newcap);
+                if (grown != NULL)
+                        memcpy(grown, buff->s, buff->sz);
+        } else {
+                // Keep the old pointer until realloc is known to have succeeded
+                grown = (char*)co_realloc(buff->b, newcap);
+        }
+        if (grown == NULL) {
+                fprintf(stderr, "membuffer: out of memory (requested %lu bytes)\n", (unsigned long)newcap);
+                abort();
+        }
+        buff->b = grown;
+        buff->cap = newcap;
+}
+// Guarantee that sz more bytes can be appended without another capacity check
+static inline void membuffer_ensure_space(membuffer_t *buff, size_t sz) {
+        size_t required = buff->sz + sz;
+        if (required > buff->cap)
+                _membuffer_grow(buff, required);
+}
+// Append one character, growing the buffer first when it is full
+static inline void membuffer_putc(membuffer_t *buff, char c) {
+        membuffer_ensure_space(buff, 1);
+        buff->b[buff->sz] = c;
+        buff->sz += 1;
+}
+// Append sz bytes starting at b, growing the buffer first when needed
+static inline void membuffer_putb(membuffer_t *buff, const void *b, size_t sz) {
+        membuffer_ensure_space(buff, sz);
+        char *dst = buff->b + buff->sz;
+        memcpy(dst, b, sz);
+        buff->sz = buff->sz + sz;
+}
+// Append one character without any capacity check; the caller must have reserved room
+static inline void membuffer_putc_unsafe(membuffer_t *buff, char c) {
+        char *slot = buff->b + buff->sz;
+        *slot = c;
+        buff->sz++;
+}
+#if LUA_VERSION_NUM > 501
+// Append sz bytes without any capacity check; the caller must have reserved room
+static inline void membuffer_putb_unsafe(membuffer_t *buff, const void *b, size_t sz) {
+        char *dst = buff->b + buff->sz;
+        memcpy(dst, b, sz);
+        buff->sz = buff->sz + sz;
+}
+#endif
+// Address of the first unused byte (one past the current contents)
+static inline char* membuffer_getp(membuffer_t *buff) {
+        return &buff->b[buff->sz];
+}
+//-----------------------------------------------------------------------------
+// parser
+//-------------------------------------
+// Lua-facing callbacks: each one applies a single parse event to the Lua stack
+static inline void l_add_object(lua_State *L) { // start an object: push a new table
+        luaL_checkstack(L, 6, NULL);
+        lua_createtable(L, 0, 4);
+}
+static inline void l_begin_pair(lua_State *L, const char *k, size_t sz) { // push the member key
+        lua_pushlstring(L, k, sz);
+}
+static inline void l_end_pair(lua_State *L) { // stack is table, key, value: store the pair in the table
+        lua_rawset(L, -3);
+}
+static inline void l_add_array(lua_State *L) { // start an array: push a new table
+        luaL_checkstack(L, 6, NULL);
+        lua_createtable(L, 4, 0);
+}
+static inline void l_add_index(lua_State *L, int i) { // store the top value at index i+1 (i is 0-based)
+        lua_rawseti(L, -2, i+1);
+}
+static inline void l_add_string(lua_State *L, const char *s, size_t sz) { // push a string value
+        lua_pushlstring(L, s, sz);
+}
+static inline void l_add_float(lua_State *L, double f) { // push a floating-point value
+        lua_pushnumber(L, (lua_Number)f);
+}
+static inline void l_add_integer(lua_State *L, int64_t i) { // push an integer value
+        lua_pushinteger(L, (lua_Integer)i);
+}
+static inline void l_add_boolean(lua_State *L, int b) { // push a boolean value
+        lua_pushboolean(L, b);
+}
+static inline void l_add_null(lua_State *L) { // JSON null is pushed as a NULL light userdata
+        lua_pushlightuserdata(L, NULL);
+}
+static inline void l_error(lua_State *L, const char *msg) {
+        luaL_error(L, msg);
+}
+// Parse events: each macro forwards to its Lua callback, with ud cast to the lua_State
+#define ON_ADD_OBJECT(ud) l_add_object((lua_State*)(ud))
+#define ON_BEGIN_PAIR(ud, k, sz) l_begin_pair((lua_State*)(ud), k, sz)
+#define ON_END_PAIR(ud) l_end_pair((lua_State*)(ud))
+#define ON_ADD_ARRAY(ud) l_add_array((lua_State*)(ud))
+#define ON_ADD_INDEX(ud, i) l_add_index((lua_State*)(ud), i)
+#define ON_ADD_STRING(ud, s, sz) l_add_string((lua_State*)(ud), s, sz)
+#define ON_ADD_FLOAT(ud, f) l_add_float((lua_State*)(ud), f)
+#define ON_ADD_INTEGER(ud, i) l_add_integer((lua_State*)(ud), i)
+#define ON_ADD_BOOLEAN(ud, b) l_add_boolean((lua_State*)(ud), b)
+#define ON_ADD_NULL(ud) l_add_null((lua_State*)(ud))
+#define ON_ERROR(ud, msg) l_error((lua_State*)(ud), msg)
+//-------------------------------------
+// JSON parsing. This part does not depend on Lua and is a generic parser; to port it elsewhere, uncomment the lines that start with //>>>
+// Size of the error-message buffer
+#define ERRMSG_SIZE 256
+// JSON parser state
+typedef struct {
+        const char *str;        // start of the JSON text
+        const char *ptr;        // parse cursor into the JSON text
+        void *ud;                       // user data handed to the parse-event callbacks
+        membuffer_t buff;       // scratch buffer
+        int curdepth;   // current nesting depth
+        int maxdepth;   // nesting depth limit
+        int allowcomment; // whether comments are allowed
+        char errmsg[ERRMSG_SIZE];       // holds the formatted error message
+        //>>>jmp_buf jb;                        // lets a parse error jump straight out of the parser
+} json_parser_t;
+// Prepare a parser for the JSON text str of length size.
+// The scratch buffer is grown to size bytes up front; the string decoder appends
+// to it without capacity checks.
+static inline void parser_init(json_parser_t *parser, const char *str, size_t size, void *ud,
+        int maxdepth, int allowcomment) {
+        parser->str = str;
+        parser->ptr = parser->str;
+        parser->ud = ud;
+        parser->curdepth = 0;
+        parser->maxdepth = maxdepth;
+        parser->allowcomment = allowcomment;
+        membuffer_init(&parser->buff);
+        membuffer_ensure_space(&parser->buff, size);
+}
+static inline void parser_free(json_parser_t *parser) { // release the scratch buffer's heap storage, if any
+        membuffer_free(&parser->buff);
+}
+// 抛出错误
+static void parser_throw_error(json_parser_t *parser, const char *fmt, ...) {
+        membuffer_free(&parser->buff);
+        va_list arg;
+        va_start(arg, fmt);
+        vsnprintf(parser->errmsg, ERRMSG_SIZE, fmt, arg);
+        va_end(arg);
+        ON_ERROR(parser->ud, parser->errmsg);
+        // 直接跳出解析代码，由于Lua的lua_error也是用longjmp，所以下面的代码没有机会执行到。但其他语言就不一定。
+        //>>>longjmp(parser->jb, 1);
+}
+// Cursor helper macros (p is a json_parser_t*)
+#define peekchar(p) (*(p)->ptr) // character at the cursor, cursor unchanged
+#define skipchar(p) (++(p)->ptr) // advance the cursor by one
+#define get_and_next(p) (*(p)->ptr++) // character at the cursor, then advance
+#define next_and_get(p) (*(++(p)->ptr)) // advance, then character at the new position
+#define savechar(p, c) membuffer_putc_unsafe(&(p)->buff, (c)) // append to the scratch buffer without a capacity check
+#define currpos(p) (size_t)((p)->ptr - (p)->str) // byte offset of the cursor; NOTE(review): callers print it with %lu, which assumes size_t is unsigned long
+// 取解析到的错误内容
+static const char* parser_error_content(json_parser_t *p) {
+        size_t n = currpos(p);
+        if (n > 50) n = 50;     // 调整这个数获得更长的内容
+        membuffer_reset(&p->buff);
+        membuffer_putb(&p->buff, p->ptr - n, n);
+        membuffer_putc(&p->buff, '\0');
+        return p->buff.b;
+}
+// 增加深度
+static inline void parser_add_depth(json_parser_t *p) {
+        p->curdepth++;
+        if (p->curdepth >= p->maxdepth)
+                parser_throw_error(p, "Too many nested data, max depth is %d, at: %s[:%lu]", p->maxdepth,
+                        parser_error_content(p), currpos(p));
+}
+static inline void parser_skip_whitespaces(json_parser_t *p) { // advance the cursor past spaces, tabs, LF and CR
+        // colin: to support comments, uncomment the commented-out code below
+        // if (likely(!p->allowcomment)) {
+                char ch = peekchar(p);
+                while (ch == ' ' || ch == '\t' || ch == '\n' || ch == '\r')
+                        ch = next_and_get(p);
+        // } else {
+        //      char ch = peekchar(p);
+        //      for (;;) {
+        //              while (ch == ' ' || ch == '\t' || ch == '\n' || ch == '\r')
+        //                      ch = next_and_get(p);
+        //              if (ch == '/') {
+        //                      ch = next_and_get(p);
+        //                      if (ch == '/') {
+        //                              ch = next_and_get(p);
+        //                              while (ch != '\n' && ch != '\r' && ch != '\0')
+        //                                      ch = next_and_get(p);
+        //                              continue;
+        //                      } else {
+        //                              parser_throw_error(p, "Invalid comment, at: %s[:%lu]", parser_error_content(p), currpos(p));
+        //                      }
+        //              }
+        //              break;
+        //      }
+        // }
+}
+static inline void parser_expect_char(json_parser_t *p, char c) {
+        if (likely(peekchar(p) == c))
+                skipchar(p);
+        else
+                parser_throw_error(p, "Expect '%c' at: %s[:%lu]", c, parser_error_content(p), currpos(p));
+}
+// Finish parsing the literal false; the leading 'f' has already been consumed
+static inline void parser_process_false(json_parser_t *p) {
+        if (unlikely(strncmp(p->ptr, "alse", 4) != 0)) {
+                parser_throw_error(p, "Invalid boolean, at: %s[:%lu]", parser_error_content(p), currpos(p));
+                return;
+        }
+        p->ptr += 4;
+        ON_ADD_BOOLEAN(p->ud, 0);
+}
+// Finish parsing the literal true; the leading 't' has already been consumed
+static inline void parser_process_true(json_parser_t *p) {
+        if (unlikely(strncmp(p->ptr, "rue", 3) != 0)) {
+                parser_throw_error(p, "Invalid boolean, at: %s[:%lu]", parser_error_content(p), currpos(p));
+                return;
+        }
+        p->ptr += 3;
+        ON_ADD_BOOLEAN(p->ud, 1);
+}
+// Finish parsing the literal null; the leading 'n' has already been consumed
+static inline void parser_process_null(json_parser_t *p) {
+        if (unlikely(strncmp(p->ptr, "ull", 3) != 0)) {
+                parser_throw_error(p, "Invalid null, at: %s[:%lu]", parser_error_content(p), currpos(p));
+                return;
+        }
+        p->ptr += 3;
+        ON_ADD_NULL(p->ud);
+}
+// Read exactly four hexadecimal digits at the cursor and return their value.
+// A non-hex character raises an error; the digits accumulated so far are returned
+// in case the error handler comes back.
+static inline uint32_t parser_read_hex(json_parser_t *p) {
+        uint32_t value = 0;
+        int remaining;
+        for (remaining = 4; remaining > 0; --remaining) {
+                unsigned char c = (unsigned char)get_and_next(p);
+                unsigned char digit;
+                if (c >= '0' && c <= '9') {
+                        digit = (unsigned char)(c - '0');
+                } else if (c >= 'a' && c <= 'f') {
+                        digit = (unsigned char)(c - 'a' + 10);
+                } else if (c >= 'A' && c <= 'F') {
+                        digit = (unsigned char)(c - 'A' + 10);
+                } else {
+                        parser_throw_error(p, "Invalid utf8 escape sequence, at: %s[:%lu]", parser_error_content(p), currpos(p));
+                        return value;
+                }
+                value = (value << 4) + digit;
+        }
+        return value;
+}
+// Decode a four-hex-digit unicode escape (its backslash and 'u' are already consumed)
+// and append the UTF-8 encoding to the scratch buffer. A high surrogate must be followed
+// by a second escape holding the low surrogate; the pair is combined into one code point.
+static inline void parser_process_utf8esc(json_parser_t *p) {
+        uint32_t cp = parser_read_hex(p);
+        // UTF-16 surrogate pairs, see https://unicodebook.readthedocs.io/unicode_encodings.html#utf-16-surrogate-pairs
+        if (cp >= 0xD800 && cp <= 0xDBFF) {
+                if (!(p->ptr[0] == '\\' && p->ptr[1] == 'u'))
+                        parser_throw_error(p, "Invalid utf8 escape sequence, at: %s[:%lu]", parser_error_content(p), currpos(p));
+                p->ptr += 2;
+                uint32_t low = parser_read_hex(p);
+                if (!(low >= 0xDC00 && low <= 0xDFFF))
+                        parser_throw_error(p, "Invalid utf8 escape sequence, at: %s[:%lu]", parser_error_content(p), currpos(p));
+                cp = 0x10000 + (((cp & 0x03FF) << 10) | (low & 0x03FF));
+        }
+        // Emit 1 to 4 bytes depending on the size of the code point
+        if (cp < 0x80) {
+                savechar(p, (char)cp);
+        } else if (cp < 0x800) {
+                savechar(p, (char)(0xC0 | (cp >> 6)));
+                savechar(p, (char)(0x80 | (cp & 0x3F)));
+        } else if (cp < 0x10000) {
+                savechar(p, (char)(0xE0 | (cp >> 12)));
+                savechar(p, (char)(0x80 | ((cp >> 6) & 0x3F)));
+                savechar(p, (char)(0x80 | (cp & 0x3F)));
+        } else {
+                savechar(p, (char)(0xF0 | (cp >> 18)));
+                savechar(p, (char)(0x80 | ((cp >> 12) & 0x3F)));
+                savechar(p, (char)(0x80 | ((cp >> 6) & 0x3F)));
+                savechar(p, (char)(0x80 | (cp & 0x3F)));
+        }
+}
+static const char escape2char[256] = { // indexed by the character after a backslash: the character it stands for, or 0 when it is not a simple escape
+        0,  0,  0,  0,  0,  0,  0,  0,  0,  0,   0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  // 0~19
+        0,  0,  0,  0,  0,  0,  0,  0,  0,  0,   0,  0,  0,  0, '\"',0,  0,  0,  0,  0,  // 20~39
+        0,  0,  0,  0,  0,  0,  0, '/', 0,  0,   0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  // 40~59
+        0,  0,  0,  0,  0,  0,  0,  0,  0,  0,   0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  // 60~79
+        0,  0,  0,  0,  0,  0,  0,  0,  0,  0,   0,  0, '\\',0,  0,  0,  0,  0, '\b',0,  // 80~99
+        0,  0, '\f',0,  0,  0,  0,  0,  0,  0,  '\n',0,  0,  0, '\r',0, '\t',0,  0,  0,  // 100~119
+        0,  0,  0,  0,  0,  0,  0,  0,  0,  0,   0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  // 120~139
+        0,  0,  0,  0,  0,  0,  0,  0,  0,  0,   0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  // 140~159
+        0,  0,  0,  0,  0,  0,  0,  0,  0,  0,   0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  // 160~179
+        0,  0,  0,  0,  0,  0,  0,  0,  0,  0,   0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  // 180~199
+        0,  0,  0,  0,  0,  0,  0,  0,  0,  0,   0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  // 200~219
+        0,  0,  0,  0,  0,  0,  0,  0,  0,  0,   0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  // 220~239
+        0,  0,  0,  0,  0,  0,  0,  0,  0,  0,   0,  0,  0,  0,  0,  0,                  // 240~255
+};
+// Decode a JSON string body into the scratch buffer. The opening quote is already
+// consumed; on return the cursor sits just past the closing quote.
+static inline void parser_process_string(json_parser_t *p) {
+        membuffer_reset(&p->buff);
+        char ch;
+        while ((ch = get_and_next(p)) != '"') {
+                if (ch == '\\') {
+                        unsigned char esc = (unsigned char)peekchar(p);
+                        char mapped = escape2char[esc];
+                        if (likely(mapped)) {
+                                // Simple one-letter escape
+                                savechar(p, mapped);
+                                skipchar(p);
+                        } else if (esc == 'u') {
+                                skipchar(p);
+                                parser_process_utf8esc(p);
+                        } else {
+                                parser_throw_error(p, "Invalid escape sequence, at: %s[:%lu]", parser_error_content(p), currpos(p));
+                        }
+                } else if ((unsigned char)ch < 0x20) {
+                        // Raw control characters, including the terminating NUL, are not allowed
+                        parser_throw_error(p, "Invalid string, at: %s[:%lu]", parser_error_content(p), currpos(p));
+                } else {
+                        savechar(p, ch);
+                }
+        }
+}
+#define invalid_number(p) parser_throw_error(p, "Invalid value, at: %s[:%lu]", parser_error_content(p), currpos(p)) // raise the generic bad-value error
+#define MAXBY10         (int64_t)(922337203685477580) // INT64_MAX / 10
+#define MAXLASTD        (int)(7) // last decimal digit of INT64_MAX
+static double powersOf10[] = {10., 100., 1.0e4, 1.0e8, 1.0e16, 1.0e32, 1.0e64, 1.0e128, 1.0e256}; // 10^(2^k) for k = 0..8
+// Parse a JSON number whose first character ch has already been consumed, and emit it
+// through ON_ADD_INTEGER or ON_ADD_FLOAT.
+// The value stays an integer while it fits in int64_t and has neither a fraction nor an
+// exponent; otherwise it is accumulated as a double and scaled by a power of ten.
+// The integer magnitude is accumulated unsigned so that the most negative int64_t value
+// can be parsed without signed overflow.
+static inline void parser_process_number(json_parser_t *p, char ch) {
+        enum { EXP_CAP = 100000 };      // exponent digits saturate here; far beyond what a double can hold
+        double db = 0.0;                // floating-point value (meaningful once isdouble is set)
+        uint64_t in = 0;                // magnitude of the integer value
+        int isdouble = 0;               // non-zero once the value has to be a double
+        int neg = 0;                    // non-zero for a leading '-'
+        int exponent = 0;               // decimal exponent still to be applied to db
+        if (ch == '-') {        // negative value
+                neg = 1;
+                ch = get_and_next(p);
+        }
+        if (unlikely(ch == '0')) {      // a leading 0 may only be followed by '.', 'e'/'E' or the end of the number
+                ch = peekchar(p);
+        } else if (likely(ch >= '1' && ch <= '9')) {
+                in = (uint64_t)(ch - '0');
+                ch = peekchar(p);
+                while (ch >= '0' && ch <= '9') {
+                        // One more digit would not fit in int64_t: carry on in floating point
+                        if (unlikely(in >= (uint64_t)MAXBY10 && (in > (uint64_t)MAXBY10 || (ch - '0') > MAXLASTD + neg))) {
+                                isdouble = 1;
+                                db = (double)in;
+                                do {
+                                        db = db * 10.0 + (ch - '0');
+                                        ch = next_and_get(p);
+                                } while (ch >= '0' && ch <= '9');
+                                break;
+                        }
+                        in = in * 10 + (uint64_t)(ch - '0');
+                        ch = next_and_get(p);
+                }
+        } else {
+                invalid_number(p);
+        }
+        if (ch == '.') {        // fractional part
+                if (likely(!isdouble)) {
+                        isdouble = 1;
+                        db = (double)in;
+                }
+                ch = next_and_get(p);
+                if (unlikely(!(ch >= '0' && ch <= '9')))
+                        invalid_number(p);  // a digit must follow the '.'
+                do {
+                        db = db * 10. + (ch - '0');
+                        exponent--;
+                        ch = next_and_get(p);
+                } while (ch >= '0' && ch <= '9');
+        }
+        if (ch == 'e' || ch == 'E') {   // exponent part
+                if (!isdouble) {                // an exponent always makes the value a double
+                        isdouble = 1;
+                        db = (double)in;
+                }
+                ch = next_and_get(p);
+                int eneg = 0;
+                if (ch == '-') {
+                        eneg = 1;
+                        ch = next_and_get(p);
+                } else if (ch == '+') {
+                        ch = next_and_get(p);
+                }
+                if (unlikely(!(ch >= '0' && ch <= '9')))
+                        invalid_number(p);  // a digit must follow
+                int exp = 0;
+                do {
+                        // Saturate instead of overflowing: an unbounded digit run would
+                        // otherwise push the accumulator outside the range of int.
+                        if (exp < EXP_CAP)
+                                exp = exp * 10 + (ch - '0');
+                        ch = next_and_get(p);
+                } while (ch >= '0' && ch <= '9');
+                exponent += eneg ? (-exp) : (exp);
+        }
+        if (isdouble) {
+                int n = exponent < 0 ? -exponent : exponent;
+                if (unlikely(n>511))
+                        n = 511;        // inf
+                // Build 10^n by multiplying the table entries selected by the bits of n
+                double p10 = 1.0;
+                double *d;
+                for (d = powersOf10; n != 0; n >>= 1, d += 1) {
+                        if (n & 1) p10 *= *d;
+                }
+                if (exponent < 0)
+                        db /= p10;
+                else
+                        db *= p10;
+                if (neg) db = -db;
+                ON_ADD_FLOAT(p->ud, db);
+        } else {
+                int64_t value;
+                if (neg && in != 0)
+                        value = -(int64_t)(in - 1) - 1; // negate without ever leaving the int64_t range
+                else
+                        value = (int64_t)in;
+                ON_ADD_INTEGER(p->ud, value);
+        }
+}
+static void parser_process_value(json_parser_t *p);
+// Parse an object whose opening brace is already consumed: a possibly empty,
+// comma-separated list of "key" : value members, closed by '}'.
+static inline void parser_process_object(json_parser_t *p) {
+        parser_add_depth(p);
+        ON_ADD_OBJECT(p->ud);
+        parser_skip_whitespaces(p);
+        if (peekchar(p) != '}') {
+                for (;;) {
+                        // key
+                        parser_expect_char(p, '"');
+                        parser_process_string(p);
+                        ON_BEGIN_PAIR(p->ud, p->buff.b, p->buff.sz);
+                        parser_skip_whitespaces(p);
+                        parser_expect_char(p, ':');
+                        // value
+                        parser_process_value(p);
+                        ON_END_PAIR(p->ud);
+                        parser_skip_whitespaces(p);
+                        if (peekchar(p) == '}')
+                                break;
+                        parser_expect_char(p, ',');
+                        parser_skip_whitespaces(p);
+                }
+        }
+        // The cursor is on the closing brace here
+        skipchar(p);
+        p->curdepth--;
+}
+// Parse an array whose opening bracket is already consumed: a possibly empty,
+// comma-separated list of values, closed by ']'.
+static inline void parser_process_array(json_parser_t *p) {
+        parser_add_depth(p);
+        ON_ADD_ARRAY(p->ud);
+        parser_skip_whitespaces(p);
+        if (peekchar(p) != ']') {
+                int index = 0;
+                for (;;) {
+                        parser_process_value(p);
+                        ON_ADD_INDEX(p->ud, index);
+                        index++;
+                        parser_skip_whitespaces(p);
+                        if (peekchar(p) == ']')
+                                break;
+                        parser_expect_char(p, ',');
+                }
+        }
+        // The cursor is on the closing bracket here
+        skipchar(p);
+        p->curdepth--;
+}
+// Parse one JSON value: skip leading whitespace, consume the first character and
+// dispatch on it. Anything that is not a literal, string, object or array is
+// handed to the number parser.
+static void parser_process_value(json_parser_t *p) {
+        parser_skip_whitespaces(p);
+        char first = get_and_next(p);
+        if (first == '{') {
+                parser_process_object(p);
+        } else if (first == '[') {
+                parser_process_array(p);
+        } else if (first == '"') {
+                parser_process_string(p);
+                ON_ADD_STRING(p->ud, p->buff.b, p->buff.sz);
+        } else if (first == 't') {
+                parser_process_true(p);
+        } else if (first == 'f') {
+                parser_process_false(p);
+        } else if (first == 'n') {
+                parser_process_null(p);
+        } else {
+                parser_process_number(p, first);
+        }
+}
+// Parse the JSON text str (size bytes), reporting events to ud; anything but whitespace after the value is an error
+static void parser_do_parse(const char *str, size_t size, void *ud, int maxdepth, int allowcomment) {
+        json_parser_t p;
+        parser_init(&p, str, size, ud, maxdepth, allowcomment);
+        //>>>if (setjmp(p.jb) == 0) {
+                parser_process_value(&p);
+                parser_skip_whitespaces(&p);
+                if (peekchar(&p) != '\0') {
+                        parser_throw_error(&p, "Expect '<eof>' but got '%c', at: %s[:%lu]", peekchar(&p),
+                                parser_error_content(&p), currpos(&p));
+                }
+                parser_free(&p);
+        //>>>}
+}
+//-----------------------------------------------------------------------------
+// dumpper
+typedef struct {
+        membuffer_t buff;       // buffer the JSON output is built in
+        int maxdepth;   // nesting depth limit
+        int format;                     // non-zero to pretty-print (newlines and tab indentation)
+        int empty_as_array; // non-zero to write an empty table as an array
+        int num_as_str;         // non-zero to write number keys as strings
+        char errmsg[ERRMSG_SIZE];       // holds the formatted error message
+} json_dumpper_t;
+// Space reserved in the output buffer before a number is formatted
+#define NUMBER_BUFF_SZ 44
+#define INTEGER_BUFF_SZ 24
+// 抛出错误
+static void dumpper_throw_error(json_dumpper_t *d, lua_State *L, const char *fmt, ...) {
+        membuffer_free(&d->buff);
+        va_list arg;
+        va_start(arg, fmt);
+        vsnprintf(d->errmsg, ERRMSG_SIZE, fmt, arg);
+        va_end(arg);
+        luaL_error(L, d->errmsg);
+}
+#if LUA_VERSION_NUM > 501
+// Append the integer at stack index idx to the output buffer in decimal
+static void dumpper_process_integer(json_dumpper_t *d, lua_State *L, int idx) {
+        char digits[INTEGER_BUFF_SZ];
+        char *cursor = digits + INTEGER_BUFF_SZ;        // digits are produced right to left
+        membuffer_ensure_space(&d->buff, INTEGER_BUFF_SZ);
+        int64_t value = (int64_t)lua_tointeger(L, idx);
+        uint64_t magnitude = (uint64_t)value;
+        if (value < 0) {
+                membuffer_putc_unsafe(&d->buff, '-');
+                magnitude = 0 - magnitude;      // unsigned negate, also correct for the minimum value
+        }
+        do {
+                *--cursor = (char)('0' + (magnitude % 10));
+                magnitude /= 10;
+        } while (magnitude != 0);
+        membuffer_putb_unsafe(&d->buff, cursor, (size_t)(digits + INTEGER_BUFF_SZ - cursor));
+}
+#endif
+// Append the number at stack index idx, formatted with LUA_NUMBER_FMT; NaN and infinities are rejected
+static void dumpper_process_number(json_dumpper_t *d, lua_State *L, int idx) {
+        lua_Number value = lua_tonumber(L, idx);
+        if (isnan(value) || isinf(value))
+                dumpper_throw_error(d, L, "The number is NaN or Infinity");
+        membuffer_ensure_space(&d->buff, NUMBER_BUFF_SZ);
+        int written = sprintf(membuffer_getp(&d->buff), LUA_NUMBER_FMT, value);
+        membuffer_add_size(&d->buff, written);
+}
+// Output escape table, indexed by byte: 0 = write the byte as is, 'u' = write a unicode escape, any other value = the letter written after a backslash
+static const char char2escape[256] = {
+        'u', 'u', 'u', 'u', 'u', 'u', 'u', 'u', 'b', 't',  'n', 'u', 'f', 'r', 'u', 'u', 'u', 'u', 'u', 'u', // 0~19
+        'u', 'u', 'u', 'u', 'u', 'u', 'u', 'u', 'u', 'u',  'u', 'u',  0,   0,  '"',   0,   0,   0,   0,   0, // 20~39
+         0,   0,   0,   0,   0,   0,   0,   0,   0,   0,    0,   0,   0,   0,   0,   0,   0,   0,   0,   0,  // 40~59
+         0,   0,   0,   0,   0,   0,   0,   0,   0,   0,    0,   0,   0,   0,   0,   0,   0,   0,   0,   0,  // 60~79
+         0,   0,   0,   0,   0,   0,   0,   0,   0,   0,    0,   0,  '\\', 0,   0,   0,   0,   0,   0,   0,  // 80~99
+         0,   0,   0,   0,   0,   0,   0,   0,   0,   0,    0,   0,   0,   0,   0,   0,   0,   0,   0,   0,  // 100~119
+         0,   0,   0,   0,   0,   0,   0,  'u',  0,   0,    0,   0,   0,   0,   0,   0,   0,   0,   0,   0,  // 120~139
+         0,   0,   0,   0,   0,   0,   0,   0,   0,   0,    0,   0,   0,   0,   0,   0,   0,   0,   0,   0,  // 140~159
+         0,   0,   0,   0,   0,   0,   0,   0,   0,   0,    0,   0,   0,   0,   0,   0,   0,   0,   0,   0,  // 160~179
+         0,   0,   0,   0,   0,   0,   0,   0,   0,   0,    0,   0,   0,   0,   0,   0,   0,   0,   0,   0,  // 180~199
+         0,   0,   0,   0,   0,   0,   0,   0,   0,   0,    0,   0,   0,   0,   0,   0,   0,   0,   0,   0,  // 200~219
+         0,   0,   0,   0,   0,   0,   0,   0,   0,   0,    0,   0,   0,   0,   0,   0,   0,   0,   0,   0,  // 220~239
+         0,   0,   0,   0,   0,   0,   0,   0,   0,   0,    0,   0,   0,   0,   0,   0,                      // 240~255
+};
+static const char hex_digits[16] = { '0', '1', '2', '3', '4', '5', '6', '7', '8', '9', 'A', 'B', 'C', 'D', 'E', 'F' }; // upper-case hex digit for each 4-bit value
+// Append the Lua string at stack index idx to the output buffer as a quoted JSON string.
+// Bytes flagged in char2escape are written either as a two-character escape or as a
+// six-character unicode escape whose last two hex digits are the value of the byte itself.
+static void dumpper_process_string(json_dumpper_t *d, lua_State *L, int idx) {
+        membuffer_t *buff = &d->buff;
+        size_t len, i;
+        const char *str = lua_tolstring(L, idx, &len);
+        // Worst case: every byte becomes a six-character escape, plus the two quotes
+        membuffer_ensure_space(buff, len * 6 + 2);
+        membuffer_putc_unsafe(buff, '\"');
+        char esc;
+        unsigned char ch;
+        for (i = 0; i < len; ++i) {
+                ch = (unsigned char)str[i];
+                esc = char2escape[ch];
+                if (likely(!esc))
+                        membuffer_putc_unsafe(buff, (char)ch);
+                else {
+                        membuffer_putc_unsafe(buff, '\\');
+                        membuffer_putc_unsafe(buff, esc);
+                        if (esc == 'u') {
+                                // Encode the escaped byte ch, not the marker letter held in esc
+                                membuffer_putc_unsafe(buff, '0');
+                                membuffer_putc_unsafe(buff, '0');
+                                membuffer_putc_unsafe(buff, hex_digits[ch >> 4]);
+                                membuffer_putc_unsafe(buff, hex_digits[ch & 0xF]);
+                        }
+                }
+        }
+        membuffer_putc_unsafe(buff, '\"');
+}
+static void dumpper_process_value(json_dumpper_t *d, lua_State *L, int depth);
+// Decide whether the table on top of the stack is written as an array.
+// lua_next is probed once, starting from the table's length as key (or from nil when
+// the length is 0). If no key follows, *len receives the length and the result is 1
+// for a non-empty table or d->empty_as_array for an empty one. If a key does follow,
+// the result is 0 and *len is left untouched. The stack is left as it was found.
+static int dumpper_check_array(json_dumpper_t *d, lua_State *L, int *len) {
+        int asize = lua_objlen(L, -1);
+        if (asize > 0)
+                lua_pushinteger(L, asize);
+        else
+                lua_pushnil(L);
+        if (lua_next(L, -2) != 0) {
+                lua_pop(L, 2);  // drop the key and value lua_next pushed
+                return 0;
+        }
+        *len = asize;
+        return asize > 0 ? 1 : d->empty_as_array;
+}
+// Append count tab characters to the output buffer
+static inline void dumpper_add_indent(json_dumpper_t *d, int count) {
+        membuffer_t *out = &d->buff;
+        membuffer_ensure_space(out, count);
+        int left;
+        for (left = count; left > 0; --left)
+                membuffer_putc_unsafe(out, '\t');
+}
+// Write the table on top of the stack as a JSON array of its elements 1..len.
+// In format mode every element goes on its own line, indented by depth tabs.
+static void dumpper_process_array(json_dumpper_t *d, lua_State *L, int len, int depth) {
+        membuffer_t *out = &d->buff;
+        int pos = 1;
+        membuffer_putc(out, '[');
+        while (pos <= len) {
+                if (unlikely(d->format)) {
+                        if (pos == 1)
+                                membuffer_putc(out, '\n');
+                }
+                lua_rawgeti(L, -1, pos);
+                if (unlikely(d->format))
+                        dumpper_add_indent(d, depth);
+                dumpper_process_value(d, L, depth);
+                lua_pop(L, 1);
+                if (pos != len)
+                        membuffer_putc(out, ',');
+                if (unlikely(d->format))
+                        membuffer_putc(out, '\n');
+                pos++;
+        }
+        // Indent the closing bracket only when at least one element was written
+        if (unlikely(d->format) && pos > 1)
+                dumpper_add_indent(d, depth-1);
+        membuffer_putc(out, ']');
+}
+// Write the table on top of the stack as a JSON object.
+// String keys are always accepted; number keys only when num_as_str is set, in which
+// case they are written quoted. Any other key raises an error.
+static void dumpper_process_object(json_dumpper_t *d, lua_State *L, int depth) {
+        membuffer_t *out = &d->buff;
+        int first = 1;
+        membuffer_putc(out, '{');
+        lua_pushnil(L);                         // t nil
+        while (lua_next(L, -2) != 0) {          // t k v
+                if (first)
+                        first = 0;
+                else
+                        membuffer_putc(out, ',');
+                if (unlikely(d->format))
+                        membuffer_putc(out, '\n');
+                // key
+                int keytype = lua_type(L, -2);
+                if (keytype == LUA_TSTRING) {
+                        if (unlikely(d->format))
+                                dumpper_add_indent(d, depth);
+                        dumpper_process_string(d, L, -2);
+                        if (unlikely(d->format))
+                                membuffer_putb(out, " : ", 3);
+                        else
+                                membuffer_putc(out, ':');
+                } else if (keytype == LUA_TNUMBER && d->num_as_str) {
+                        if (unlikely(d->format))
+                                dumpper_add_indent(d, depth);
+                        membuffer_putc(out, '\"');
+#if LUA_VERSION_NUM > 501
+                        if (lua_isinteger(L, -2))
+                                dumpper_process_integer(d, L, -2);
+                        else
+#endif
+                                dumpper_process_number(d, L, -2);
+                        if (unlikely(d->format))
+                                membuffer_putb(out, "\" : ", 4);
+                        else
+                                membuffer_putb(out, "\":", 2);
+                } else {
+                        dumpper_throw_error(d, L, "Table key must be a string");
+                }
+                // value
+                dumpper_process_value(d, L, depth);
+                lua_pop(L, 1);
+        }
+        // Put the closing brace on its own indented line when any member was written
+        if (unlikely(d->format) && !first) {
+                membuffer_putc(out, '\n');
+                dumpper_add_indent(d, depth-1);
+        }
+        membuffer_putc(out, '}');
+}
+/**
+ * Write the table at the top of the Lua stack, as a JSON array when
+ * dumpper_check_array says so and as a JSON object otherwise.
+ *
+ * `depth` is the nesting level of the enclosing value; it is incremented
+ * here and the result is checked against d->maxdepth. Exceeding the limit,
+ * or failing to reserve Lua stack space, is reported through
+ * dumpper_throw_error.
+ */
+static inline void dumpper_process_table(json_dumpper_t *d, lua_State *L, int depth) {
+        depth++;
+        if (depth > d->maxdepth)
+                dumpper_throw_error(d, L, "Too many nested data, max depth is %d", d->maxdepth);
+        // Report stack exhaustion the same way as every other dumper failure.
+        // luaL_checkstack would raise the Lua error itself and bypass the
+        // dumper's error path.
+        // NOTE(review): presumably dumpper_throw_error releases d->buff - confirm.
+        if (unlikely(!lua_checkstack(L, 6)))
+                dumpper_throw_error(d, L, "stack overflow");
+        int len = 0;
+        if (dumpper_check_array(d, L, &len))
+                dumpper_process_array(d, L, len, depth);
+        else
+                dumpper_process_object(d, L, depth);
+}
+/**
+ * Write the value at the top of the Lua stack as JSON text into d->buff.
+ *
+ * Strings, numbers, booleans, tables and nil are supported. A light userdata
+ * is accepted only when it is the NULL pointer (the value stored as
+ * json.null) and is written as "null". Every other type is reported through
+ * dumpper_throw_error. `depth` is forwarded to dumpper_process_table.
+ */
+static void dumpper_process_value(json_dumpper_t *d, lua_State *L, int depth) {
+        membuffer_t *out = &d->buff;
+        const int vtype = lua_type(L, -1);
+        switch (vtype) {
+                case LUA_TNIL:
+                        membuffer_putb(out, "null", 4);
+                        return;
+                case LUA_TBOOLEAN:
+                        if (lua_toboolean(L, -1))
+                                membuffer_putb(out, "true", 4);
+                        else
+                                membuffer_putb(out, "false", 5);
+                        return;
+                case LUA_TNUMBER:
+#if LUA_VERSION_NUM > 501
+                        if (lua_isinteger(L, -1)) {
+                                dumpper_process_integer(d, L, -1);
+                                return;
+                        }
+#endif
+                        dumpper_process_number(d, L, -1);
+                        return;
+                case LUA_TSTRING:
+                        dumpper_process_string(d, L, -1);
+                        return;
+                case LUA_TTABLE:
+                        dumpper_process_table(d, L, depth);
+                        return;
+                case LUA_TLIGHTUSERDATA:
+                        // only the NULL light userdata is serializable
+                        if (lua_touserdata(L, -1) == NULL) {
+                                membuffer_putb(out, "null", 4);
+                                return;
+                        }
+                        break;
+                default:
+                        break;
+        }
+        // everything that did not return above is an unsupported type
+        dumpper_throw_error(d, L, "Unsupport type %s", lua_typename(L, vtype));
+}
+//-----------------------------------------------------------------------------
+// 接口
+#define DEF_MAX_DEPTH 128
+// Load from a string: json.decode(str [, maxdepth [, allowcomment]]) -> obj
+//   str          - JSON text (argument 1, must be a string)
+//   maxdepth     - nesting limit, defaults to DEF_MAX_DEPTH
+//   allowcomment - truthy value is forwarded to the parser as its comment flag
+// The string is required to be zero-terminated (note kept from the original comment).
+// Returns 1, i.e. one Lua result; presumably the value parser_do_parse leaves on the stack.
+int colibc_json_decode(lua_State *L) {
+        size_t text_len = 0;
+        const char *text = luaL_checklstring(L, 1, &text_len);
+        const int depth_limit = (int)luaL_optinteger(L, 2, DEF_MAX_DEPTH);
+        const int comments_ok = lua_toboolean(L, 3);
+        parser_do_parse(text, text_len, L, depth_limit, comments_ok);
+        return 1;
+}
+// Save to a string:
+//   json.encode(obj [, format [, empty_as_array [, num_as_str [, maxdepth]]]]) -> str
+//   obj            - value to serialize (argument 1, required)
+//   format         - truthy: pretty-print with newlines and indentation
+//   empty_as_array - truthy: stored in dumpper.empty_as_array (used by the array check)
+//   num_as_str     - truthy: number keys are written as quoted strings
+//   maxdepth       - nesting limit, defaults to DEF_MAX_DEPTH
+// Returns 1: the JSON text as a Lua string.
+int colibc_json_encode(lua_State *L) {
+        luaL_checkany(L, 1);
+        // Read every argument before the buffer exists: luaL_optinteger raises a
+        // Lua error on a non-integer argument, which would otherwise skip
+        // membuffer_free below.
+        const int format = lua_toboolean(L, 2);
+        const int empty_as_array = lua_toboolean(L, 3);
+        const int num_as_str = lua_toboolean(L, 4);
+        const int maxdepth = (int)luaL_optinteger(L, 5, DEF_MAX_DEPTH);
+        lua_settop(L, 1);       // keep only the value to encode
+        json_dumpper_t dumpper;
+        membuffer_init(&dumpper.buff);
+        dumpper.format = format;
+        dumpper.empty_as_array = empty_as_array;
+        dumpper.num_as_str = num_as_str;
+        dumpper.maxdepth = maxdepth;
+        dumpper_process_value(&dumpper, L, 0);
+        lua_pushlstring(L, dumpper.buff.b, dumpper.buff.sz);
+        membuffer_free(&dumpper.buff);
+        return 1;
+}
+// Functions exported by the module, registered by luaopen_colibc_json.
+static const luaL_Reg lib[] = {
+        {"decode", colibc_json_decode},
+        {"encode", colibc_json_encode},
+        {NULL, NULL},   // sentinel entry terminating the list
+};
+// Module entry point: builds the table holding decode/encode plus the
+// `null` field (a NULL light userdata) and returns it as the single result.
+LUALIB_API int luaopen_colibc_json(lua_State* L) {
+#if LUA_VERSION_NUM > 501
+        luaL_newlib(L, lib); // json
+#else
+        // Lua 5.1: create the table by hand and also store it in
+        // package.loaded under the name "cojson".
+        lua_getglobal(L, "package"); // package
+        lua_getfield(L, -1, "loaded"); // package loaded
+        lua_createtable(L, 0, 0); // package loaded json
+        lua_pushvalue(L, -1); // package loaded json json
+        lua_setfield(L, -3, "cojson"); // loaded["cojson"] = json, package loaded json
+        luaL_register(L, NULL, lib); // package loaded json
+#endif
+        // json.null
+        lua_pushlightuserdata(L, NULL);
+        lua_setfield(L, -2, "null");
+        // the module table is on top of the stack in both branches
+        return 1;
+}
diff --git a/src/3rdParty/utf8cpp.h b/src/3rdParty/utf8cpp.h
new file mode 100755
index 0000000..76f0fa1
--- /dev/null
+++ b/src/3rdParty/utf8cpp.h
@@ -0,0 +1,1277 @@
+// Copyright 2006 Nemanja Trifunovic
+/*
+Permission is hereby granted, free of charge, to any person or organization
+obtaining a copy of the software and accompanying documentation covered by
+this license (the "Software") to use, reproduce, display, distribute,
+execute, and transmit the Software, and to prepare derivative works of the
+Software, and to permit third-parties to whom the Software is furnished to
+do so, all subject to the following:
+The copyright notices in the Software and this entire statement, including
+the above license grant, this restriction and the following disclaimer,
+must be included in all copies of the Software, in whole or in part, and
+all derivative works of the Software, unless such copies or derivative
+works are solely in the form of machine-executable object code generated by
+a source language processor.
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE, TITLE AND NON-INFRINGEMENT. IN NO EVENT
+SHALL THE COPYRIGHT HOLDERS OR ANYONE DISTRIBUTING THE SOFTWARE BE LIABLE
+FOR ANY DAMAGES OR OTHER LIABILITY, WHETHER IN CONTRACT, TORT OR OTHERWISE,
+ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+DEALINGS IN THE SOFTWARE.
+*/
+#ifndef UTF8_FOR_CPP_2675DCD0_9480_4c0c_B92A_CC14C027B731
+#define UTF8_FOR_CPP_2675DCD0_9480_4c0c_B92A_CC14C027B731
+/*
+To control the C++ language version used by the library, you can define UTF_CPP_CPLUSPLUS macro
+and set it to one of the values used by the __cplusplus predefined macro.
+For instance,
+    #define UTF_CPP_CPLUSPLUS 199711L
+will cause the UTF-8 CPP library to use only types and language features available in the C++ 98 standard.
+Some library features will be disabled.
+If you leave UTF_CPP_CPLUSPLUS undefined, it will be internally assigned to __cplusplus.
+*/
+#include <iterator>
+#include <cstring>
+#include <string>
+// Determine the C++ standard version.
+// If the user defines UTF_CPP_CPLUSPLUS, use that.
+// Otherwise, trust the unreliable predefined macro __cplusplus
+#if !defined UTF_CPP_CPLUSPLUS
+    #define UTF_CPP_CPLUSPLUS __cplusplus
+#endif
+// Feature macros used throughout the header:
+//   UTF_CPP_OVERRIDE      - `override` where available, otherwise empty
+//   UTF_CPP_NOEXCEPT      - `noexcept` where available, otherwise `throw()`
+//   UTF_CPP_STATIC_ASSERT - compile-time check of a constant condition
+#if UTF_CPP_CPLUSPLUS >= 201103L // C++ 11 or later
+    #define UTF_CPP_OVERRIDE override
+    #define UTF_CPP_NOEXCEPT noexcept
+    // Note: the expansion already ends with ';'
+    #define UTF_CPP_STATIC_ASSERT(condition) static_assert(condition, "UTFCPP static assert");
+#else // C++ 98/03
+    #define UTF_CPP_OVERRIDE
+    #define UTF_CPP_NOEXCEPT throw()
+    // Simulate static_assert:
+    // only the <true> specialization is defined, so a false condition
+    // instantiates an incomplete type and fails to compile.
+    template<bool> struct UtfCppCompileTimeAssert;
+    template<> struct UtfCppCompileTimeAssert  <true> { };
+    #define UTF_CPP_STATIC_ASSERT(condition)  (UtfCppCompileTimeAssert <(condition) != 0>())
+#endif // C++ 11 or later
+namespace utf8
+{
+// The typedefs for 8-bit, 16-bit and 32-bit code units
+// Selected from UTF_CPP_CPLUSPLUS: the dedicated character types are used
+// when the language version provides them, plain unsigned integers otherwise.
+#if UTF_CPP_CPLUSPLUS >= 201103L // C++ 11 or later
+    #if UTF_CPP_CPLUSPLUS >= 202002L // C++ 20 or later
+        typedef char8_t         utfchar8_t;
+    #else // C++ 11/14/17
+        typedef unsigned char   utfchar8_t;
+    #endif
+    typedef char16_t        utfchar16_t;
+    typedef char32_t        utfchar32_t;
+#else // C++ 98/03
+    typedef unsigned char   utfchar8_t;
+    typedef unsigned short  utfchar16_t;
+    typedef unsigned int    utfchar32_t;
+#endif // C++ 11 or later
+// Helper code - not intended to be directly called by the library users. May be changed at any time
+namespace internal
+{
+    // Unicode constants
+    // Leading (high) surrogates: 0xd800 - 0xdbff
+    // Trailing (low) surrogates: 0xdc00 - 0xdfff
+    const utfchar16_t LEAD_SURROGATE_MIN  = 0xd800u;
+    const utfchar16_t LEAD_SURROGATE_MAX  = 0xdbffu;
+    const utfchar16_t TRAIL_SURROGATE_MIN = 0xdc00u;
+    const utfchar16_t TRAIL_SURROGATE_MAX = 0xdfffu;
+    // Added to (cp >> 10) to obtain the lead surrogate of a supplementary code point
+    const utfchar16_t LEAD_OFFSET         = 0xd7c0u;       // LEAD_SURROGATE_MIN - (0x10000 >> 10)
+    // Added to (lead << 10) + trail to obtain the code point of a surrogate pair
+    // (the arithmetic relies on 32-bit wrap-around)
+    const utfchar32_t SURROGATE_OFFSET    = 0xfca02400u;   // 0x10000u - (LEAD_SURROGATE_MIN << 10) - TRAIL_SURROGATE_MIN
+    // Maximum valid value for a Unicode code point
+    const utfchar32_t CODE_POINT_MAX      = 0x0010ffffu;
+    /// Keep only the low 8 bits of `oc` and return them as an 8-bit code unit.
+    template<typename octet_type>
+    inline utfchar8_t mask8(octet_type oc)
+    {
+        const utfchar8_t low_octet = static_cast<utfchar8_t>(0xff & oc);
+        return low_octet;
+    }
+    /// Keep only the low 16 bits of `oc` and return them as a 16-bit code unit.
+    template<typename u16_type>
+    inline utfchar16_t mask16(u16_type oc)
+    {
+        const utfchar16_t low_word = static_cast<utfchar16_t>(0xffff & oc);
+        return low_word;
+    }
+    /// True when the low 8 bits of `oc` have the form 10xxxxxx.
+    template<typename octet_type>
+    inline bool is_trail(octet_type oc)
+    {
+        const utfchar8_t octet = utf8::internal::mask8(oc);
+        // the two top bits must be exactly "10"
+        return (octet >> 6) == 0x2;
+    }
+    /// True when `cp` lies in [LEAD_SURROGATE_MIN, LEAD_SURROGATE_MAX].
+    inline bool is_lead_surrogate(utfchar32_t cp)
+    {
+        const utfchar32_t lowest  = static_cast<utfchar32_t>(LEAD_SURROGATE_MIN);
+        const utfchar32_t highest = static_cast<utfchar32_t>(LEAD_SURROGATE_MAX);
+        return !(cp < lowest || cp > highest);
+    }
+    /// True when `cp` lies in [TRAIL_SURROGATE_MIN, TRAIL_SURROGATE_MAX].
+    inline bool is_trail_surrogate(utfchar32_t cp)
+    {
+        const utfchar32_t lowest  = static_cast<utfchar32_t>(TRAIL_SURROGATE_MIN);
+        const utfchar32_t highest = static_cast<utfchar32_t>(TRAIL_SURROGATE_MAX);
+        return !(cp < lowest || cp > highest);
+    }
+    /// True when `cp` is any surrogate: [LEAD_SURROGATE_MIN, TRAIL_SURROGATE_MAX].
+    inline bool is_surrogate(utfchar32_t cp)
+    {
+        const utfchar32_t lowest  = static_cast<utfchar32_t>(LEAD_SURROGATE_MIN);
+        const utfchar32_t highest = static_cast<utfchar32_t>(TRAIL_SURROGATE_MAX);
+        return !(cp < lowest || cp > highest);
+    }
+    /// True when `cp` does not exceed CODE_POINT_MAX and is not a surrogate.
+    inline bool is_code_point_valid(utfchar32_t cp)
+    {
+        if (cp > CODE_POINT_MAX)
+            return false;
+        return !utf8::internal::is_surrogate(cp);
+    }
+    /// True when `cp` is below 0x10000, i.e. fits in a single 16-bit word.
+    inline bool is_in_bmp(utfchar32_t cp)
+    {
+        const utfchar32_t first_supplementary = utfchar32_t(0x10000);
+        return cp < first_supplementary;
+    }
+    /// Length in octets (1-4) of the sequence announced by the lead octet at
+    /// `lead_it`, or 0 when that octet cannot start a sequence.
+    template <typename octet_iterator>
+    int sequence_length(octet_iterator lead_it)
+    {
+        const utfchar8_t lead = utf8::internal::mask8(*lead_it);
+        if (lead < 0x80)                // 0xxxxxxx
+            return 1;
+        if ((lead & 0xe0) == 0xc0)      // 110xxxxx
+            return 2;
+        if ((lead & 0xf0) == 0xe0)      // 1110xxxx
+            return 3;
+        if ((lead & 0xf8) == 0xf0)      // 11110xxx
+            return 4;
+        return 0;
+    }
+    /// True when `cp` was decoded from `length` octets although it belongs to a
+    /// range with a different fixed length (1 below 0x80, 2 below 0x800,
+    /// 3 below 0x10000). Code points from 0x10000 up are never reported.
+    inline bool is_overlong_sequence(utfchar32_t cp, int length)
+    {
+        if (cp < 0x80)
+            return length != 1;
+        if (cp < 0x800)
+            return length != 2;
+        if (cp < 0x10000)
+            return length != 3;
+        return false;
+    }
+    // Result codes of the internal validation/decoding helpers:
+    //   UTF8_OK             - success
+    //   NOT_ENOUGH_ROOM     - the range ended before the sequence was complete
+    //   INVALID_LEAD        - the first unit cannot start a sequence
+    //   INCOMPLETE_SEQUENCE - an expected continuation unit was something else
+    //   OVERLONG_SEQUENCE   - flagged by is_overlong_sequence (length does not match the code point's range)
+    //   INVALID_CODE_POINT  - decoded value rejected by is_code_point_valid
+    enum utf_error {UTF8_OK, NOT_ENOUGH_ROOM, INVALID_LEAD, INCOMPLETE_SEQUENCE, OVERLONG_SEQUENCE, INVALID_CODE_POINT};
+    /// Helper for get_sequence_x: step `it` to the next octet and check it.
+    /// Returns NOT_ENOUGH_ROOM when the step reaches `end`,
+    /// INCOMPLETE_SEQUENCE when the new octet is not a trail octet,
+    /// UTF8_OK otherwise.
+    template <typename octet_iterator>
+    utf_error increase_safely(octet_iterator& it, const octet_iterator end)
+    {
+        ++it;
+        if (it == end)
+            return NOT_ENOUGH_ROOM;
+        return utf8::internal::is_trail(*it) ? UTF8_OK : INCOMPLETE_SEQUENCE;
+    }
+    // Advance IT with increase_safely and make the *enclosing function* return
+    // the error code when the step fails. Expands to a braced block, so no
+    // trailing semicolon is needed at the call site.
+    #define UTF8_CPP_INCREASE_AND_RETURN_ON_ERROR(IT, END) {utf_error ret = increase_safely(IT, END); if (ret != UTF8_OK) return ret;}
+    /// get_sequence_x functions decode utf-8 sequences of the length x
+    /// On success `it` is left on the last octet of the sequence.
+    /// get_sequence_1: the code point is the single octet itself.
+    template <typename octet_iterator>
+    utf_error get_sequence_1(octet_iterator& it, octet_iterator end, utfchar32_t& code_point)
+    {
+        if (it == end)
+            return NOT_ENOUGH_ROOM;
+        const utfchar8_t only_octet = utf8::internal::mask8(*it);
+        code_point = static_cast<utfchar32_t>(only_octet);
+        return UTF8_OK;
+    }
+    /// Decode a two-octet sequence starting at `it` into `code_point`.
+    /// On success `it` is left on the second octet. On failure the error of
+    /// increase_safely is returned and `code_point` holds a partial value.
+    template <typename octet_iterator>
+    utf_error get_sequence_2(octet_iterator& it, octet_iterator end, utfchar32_t& code_point)
+    {
+        if (it == end)
+            return NOT_ENOUGH_ROOM;
+        code_point = static_cast<utfchar32_t>(utf8::internal::mask8(*it));
+        // move to the trail octet
+        const utf_error status = increase_safely(it, end);
+        if (status != UTF8_OK)
+            return status;
+        code_point = ((code_point << 6) & 0x7ff) + ((*it) & 0x3f);
+        return UTF8_OK;
+    }
+    /// Decode a three-octet sequence starting at `it` into `code_point`.
+    /// On success `it` is left on the third octet. On failure the error of
+    /// increase_safely is returned and `code_point` holds a partial value.
+    template <typename octet_iterator>
+    utf_error get_sequence_3(octet_iterator& it, octet_iterator end, utfchar32_t& code_point)
+    {
+        if (it == end)
+            return NOT_ENOUGH_ROOM;
+        code_point = static_cast<utfchar32_t>(utf8::internal::mask8(*it));
+        // first trail octet
+        utf_error status = increase_safely(it, end);
+        if (status != UTF8_OK)
+            return status;
+        code_point = ((code_point << 12) & 0xffff) + ((utf8::internal::mask8(*it) << 6) & 0xfff);
+        // second trail octet
+        status = increase_safely(it, end);
+        if (status != UTF8_OK)
+            return status;
+        code_point = static_cast<utfchar32_t>(code_point + ((*it) & 0x3f));
+        return UTF8_OK;
+    }
+    /// Decode a four-octet sequence starting at `it` into `code_point`.
+    /// On success `it` is left on the fourth octet. On failure the error of
+    /// increase_safely is returned and `code_point` holds a partial value.
+    template <typename octet_iterator>
+    utf_error get_sequence_4(octet_iterator& it, octet_iterator end, utfchar32_t& code_point)
+    {
+        if (it == end)
+            return NOT_ENOUGH_ROOM;
+        code_point = static_cast<utfchar32_t>(utf8::internal::mask8(*it));
+        // first trail octet
+        utf_error status = increase_safely(it, end);
+        if (status != UTF8_OK)
+            return status;
+        code_point = ((code_point << 18) & 0x1fffff) + ((utf8::internal::mask8(*it) << 12) & 0x3ffff);
+        // second trail octet
+        status = increase_safely(it, end);
+        if (status != UTF8_OK)
+            return status;
+        code_point = static_cast<utfchar32_t>(code_point + ((utf8::internal::mask8(*it) << 6) & 0xfff));
+        // third trail octet
+        status = increase_safely(it, end);
+        if (status != UTF8_OK)
+            return status;
+        code_point = static_cast<utfchar32_t>(code_point + ((*it) & 0x3f));
+        return UTF8_OK;
+    }
+    #undef UTF8_CPP_INCREASE_AND_RETURN_ON_ERROR
+    /// Validate and decode the UTF-8 sequence that starts at `it`.
+    ///
+    /// On success returns UTF8_OK, stores the decoded value in `code_point`
+    /// and leaves `it` one past the sequence. On failure `it` is restored to
+    /// its original position and the error is returned. For
+    /// INVALID_CODE_POINT the rejected value is also stored in `code_point`
+    /// so that callers can report it; for every other error `code_point` is
+    /// left untouched.
+    template <typename octet_iterator>
+    utf_error validate_next(octet_iterator& it, octet_iterator end, utfchar32_t& code_point)
+    {
+        if (it == end)
+            return NOT_ENOUGH_ROOM;
+        // Save the original value of it so we can go back in case of failure
+        // Of course, it does not make much sense with i.e. stream iterators
+        octet_iterator original_it = it;
+        utfchar32_t cp = 0;
+        // Determine the sequence length based on the lead octet
+        const int length = utf8::internal::sequence_length(it);
+        // Get trail octets and calculate the code point
+        utf_error err = UTF8_OK;
+        switch (length) {
+            case 0:
+                return INVALID_LEAD;
+            case 1:
+                err = utf8::internal::get_sequence_1(it, end, cp);
+                break;
+            case 2:
+                err = utf8::internal::get_sequence_2(it, end, cp);
+                break;
+            case 3:
+                err = utf8::internal::get_sequence_3(it, end, cp);
+                break;
+            case 4:
+                err = utf8::internal::get_sequence_4(it, end, cp);
+                break;
+        }
+        if (err == UTF8_OK) {
+            // Decoding succeeded. Now, security checks...
+            if (!utf8::internal::is_code_point_valid(cp)) {
+                // Hand the offending value back: utf8::next() puts it into
+                // the invalid_code_point exception it throws.
+                code_point = cp;
+                err = INVALID_CODE_POINT;
+            }
+            else if (utf8::internal::is_overlong_sequence(cp, length))
+                err = OVERLONG_SEQUENCE;
+            else {
+                // Passed! Return here.
+                code_point = cp;
+                ++it;
+                return UTF8_OK;
+            }
+        }
+        // Failure branch - restore the original value of the iterator
+        it = original_it;
+        return err;
+    }
+    /// Overload for callers that only need the verdict: same as the
+    /// three-argument validate_next with the decoded value thrown away.
+    template <typename octet_iterator>
+    inline utf_error validate_next(octet_iterator& it, octet_iterator end) {
+        utfchar32_t discarded = 0;
+        const utf_error verdict = utf8::internal::validate_next(it, end, discarded);
+        return verdict;
+    }
+    /// Validate and decode the UTF-16 sequence (one word or a surrogate pair)
+    /// that starts at `it`.
+    ///
+    /// On success returns UTF8_OK, stores the code point and leaves `it` one
+    /// past the sequence. On failure `it` is restored and the result is:
+    ///   NOT_ENOUGH_ROOM     - empty range, or a lead surrogate at the very end
+    ///   INVALID_LEAD        - the first word is a trail surrogate
+    ///   INCOMPLETE_SEQUENCE - a lead surrogate is not followed by a trail one
+    template <typename word_iterator>
+    utf_error validate_next16(word_iterator& it, word_iterator end, utfchar32_t& code_point)
+    {
+        // Make sure the iterator dereferences a large enough type
+        typedef typename std::iterator_traits<word_iterator>::value_type word_type;
+        UTF_CPP_STATIC_ASSERT(sizeof(word_type) >= sizeof(utfchar16_t));
+        // Check the edge case:
+        if (it == end)
+            return NOT_ENOUGH_ROOM;
+        // Save the original value of it so we can go back in case of failure
+        // Of course, it does not make much sense with i.e. stream iterators
+        word_iterator original_it = it;
+        utf_error err = UTF8_OK;
+        const utfchar16_t first_word = *it++;
+        if (!is_surrogate(first_word)) {
+            code_point = first_word;
+            return UTF8_OK;
+        }
+        // Classify the first word before looking at what follows: a trail
+        // surrogate can never start a pair, even as the last word of the range.
+        if (!is_lead_surrogate(first_word))
+            err = INVALID_LEAD;
+        else if (it == end)
+            err = NOT_ENOUGH_ROOM;
+        else {
+            const utfchar16_t second_word = *it++;
+            if (is_trail_surrogate(static_cast<utfchar32_t>(second_word))) {
+                code_point = static_cast<utfchar32_t>(first_word << 10) +  static_cast<utfchar32_t>(second_word) + SURROGATE_OFFSET;
+                return UTF8_OK;
+            }
+            err = INCOMPLETE_SEQUENCE;
+        }
+        // error branch
+        it = original_it;
+        return err;
+    }
+    // Internal implementation of both checked and unchecked append() function
+    // This function will be invoked by the overloads below, as they will know
+    // the octet_type.
+    // Writes `cp` as 1-4 octets through `result` and returns the advanced
+    // iterator. No validity check is done here.
+    template <typename octet_iterator, typename octet_type>
+    octet_iterator append(utfchar32_t cp, octet_iterator result) {
+        if (cp < 0x80) {                      // one octet
+            *(result++) = static_cast<octet_type>(cp);
+            return result;
+        }
+        if (cp < 0x800) {                     // two octets
+            *(result++) = static_cast<octet_type>((cp >> 6)          | 0xc0);
+            *(result++) = static_cast<octet_type>((cp & 0x3f)        | 0x80);
+            return result;
+        }
+        if (cp < 0x10000) {                   // three octets
+            *(result++) = static_cast<octet_type>((cp >> 12)         | 0xe0);
+            *(result++) = static_cast<octet_type>(((cp >> 6) & 0x3f) | 0x80);
+            *(result++) = static_cast<octet_type>((cp & 0x3f)        | 0x80);
+            return result;
+        }
+        // four octets
+        *(result++) = static_cast<octet_type>((cp >> 18)         | 0xf0);
+        *(result++) = static_cast<octet_type>(((cp >> 12) & 0x3f)| 0x80);
+        *(result++) = static_cast<octet_type>(((cp >> 6) & 0x3f) | 0x80);
+        *(result++) = static_cast<octet_type>((cp & 0x3f)        | 0x80);
+        return result;
+    }
+    // One of the following overloads will be invoked from the API calls
+    // A simple (but dangerous) case: the caller appends byte(s) to a char array
+    // (nothing here checks that the array has room for the octets written)
+    inline char* append(utfchar32_t cp, char* result) {
+        char* const past_written = append<char*, char>(cp, result);
+        return past_written;
+    }
+    // Hopefully, most common case: the caller uses back_inserter
+    // i.e. append(cp, std::back_inserter(str));
+    // The octet type is taken from the container's value_type.
+    template<typename container_type>
+    std::back_insert_iterator<container_type> append
+            (utfchar32_t cp, std::back_insert_iterator<container_type> result) {
+        typedef std::back_insert_iterator<container_type> inserter_type;
+        typedef typename container_type::value_type element_type;
+        return append<inserter_type, element_type>(cp, result);
+    }
+    // The caller uses some other kind of output operator - not covered above
+    // Note that in this case we are not able to determine octet_type
+    // so we assume it's utfchar8_t; that can cause a conversion warning if we are wrong.
+    template <typename octet_iterator>
+    octet_iterator append(utfchar32_t cp, octet_iterator result) {
+        typedef utfchar8_t assumed_octet_type;
+        return append<octet_iterator, assumed_octet_type>(cp, result);
+    }
+    // Internal implementation of both checked and unchecked append16() function
+    // This function will be invoked by the overloads below, as they will know
+    // the word_type.
+    // Writes `cp` as one 16-bit word, or as a surrogate pair when it is
+    // outside the BMP, and returns the advanced iterator.
+    template <typename word_iterator, typename word_type>
+    word_iterator append16(utfchar32_t cp, word_iterator result) {
+        UTF_CPP_STATIC_ASSERT(sizeof(word_type) >= sizeof(utfchar16_t));
+        if (!is_in_bmp(cp)) {
+            // Code points from the supplementary planes are encoded via surrogate pairs
+            *(result++) = static_cast<word_type>(LEAD_OFFSET + (cp >> 10));
+            *(result++) = static_cast<word_type>(TRAIL_SURROGATE_MIN + (cp & 0x3FF));
+            return result;
+        }
+        *(result++) = static_cast<word_type>(cp);
+        return result;
+    }
+    // Hopefully, most common case: the caller uses back_inserter
+    // i.e. append16(cp, std::back_inserter(str));
+    // The word type is taken from the container's value_type.
+    template<typename container_type>
+    std::back_insert_iterator<container_type> append16
+            (utfchar32_t cp, std::back_insert_iterator<container_type> result) {
+        typedef std::back_insert_iterator<container_type> inserter_type;
+        typedef typename container_type::value_type element_type;
+        return append16<inserter_type, element_type>(cp, result);
+    }
+    // The caller uses some other kind of output operator - not covered above
+    // Note that in this case we are not able to determine word_type
+    // so we assume it's utfchar16_t; that can cause a conversion warning if we are wrong.
+    template <typename word_iterator>
+    word_iterator append16(utfchar32_t cp, word_iterator result) {
+        typedef utfchar16_t assumed_word_type;
+        return append16<word_iterator, assumed_word_type>(cp, result);
+    }
+} // namespace internal
+    /// The library API - functions intended to be called by the users
+    // Byte order mark
+    // The three octets starts_with_bom() compares the beginning of a range against.
+    const utfchar8_t bom[] = {0xef, 0xbb, 0xbf};
+    /// Return an iterator to the start of the first sequence in [start, end)
+    /// that validate_next rejects, or `end` when the whole range is accepted.
+    template <typename octet_iterator>
+    octet_iterator find_invalid(octet_iterator start, octet_iterator end)
+    {
+        octet_iterator cursor = start;
+        while (cursor != end
+               && utf8::internal::validate_next(cursor, end) == internal::UTF8_OK) {
+            // validate_next moved cursor past one well-formed sequence
+        }
+        // on failure validate_next restored cursor to the start of the bad sequence
+        return cursor;
+    }
+    /// C-string overload: scans up to the terminating '\0' (found with
+    /// std::strlen) and returns a pointer to the first invalid sequence, or to
+    /// the terminator when there is none.
+    inline const char* find_invalid(const char* str)
+    {
+        const std::size_t byte_count = std::strlen(str);
+        return find_invalid(str, str + byte_count);
+    }
+    /// std::string overload: returns the offset of the first invalid sequence
+    /// in `s`, or std::string::npos when there is none.
+    inline std::size_t find_invalid(const std::string& s)
+    {
+        const std::string::const_iterator first = s.begin();
+        const std::string::const_iterator last = s.end();
+        const std::string::const_iterator bad = find_invalid(first, last);
+        if (bad == last)
+            return std::string::npos;
+        return static_cast<std::size_t>(bad - first);
+    }
+    /// True when find_invalid reaches `end`, i.e. nothing in [start, end) is rejected.
+    template <typename octet_iterator>
+    inline bool is_valid(octet_iterator start, octet_iterator end)
+    {
+        const octet_iterator first_bad = utf8::find_invalid(start, end);
+        return first_bad == end;
+    }
+    /// C-string overload: valid when find_invalid stops on the terminating '\0'.
+    inline bool is_valid(const char* str)
+    {
+        const char* const stop = utf8::find_invalid(str);
+        return *stop == '\0';
+    }
+    /// std::string overload: checks the whole of `s`.
+    inline bool is_valid(const std::string& s)
+    {
+        const std::string::const_iterator first = s.begin();
+        const std::string::const_iterator last = s.end();
+        return is_valid(first, last);
+    }
+    /// True when [it, end) holds at least three octets and they equal `bom`.
+    template <typename octet_iterator>
+    inline bool starts_with_bom (octet_iterator it, octet_iterator end)
+    {
+        // compare octet by octet, stopping at the first mismatch or at `end`
+        if (it == end || (utf8::internal::mask8(*it++)) != bom[0])
+            return false;
+        if (it == end || (utf8::internal::mask8(*it++)) != bom[1])
+            return false;
+        return (it != end) && (utf8::internal::mask8(*it)) == bom[2];
+    }
+    /// std::string overload: checks the beginning of `s`.
+    inline bool starts_with_bom(const std::string& s)
+    {
+        const std::string::const_iterator first = s.begin();
+        const std::string::const_iterator last = s.end();
+        return starts_with_bom(first, last);
+    }
+} // namespace utf8
+#include <stdexcept>
+namespace utf8
+{
+    // Base for the exceptions that may be thrown from the library
+    // Adds nothing to std::exception; it only gives the exception classes
+    // below one common type to catch.
+    class exception : public ::std::exception {
+    };
+    // Exceptions that may be thrown from the library functions.
+    /// Thrown for a value rejected by is_code_point_valid; carries that value.
+    class invalid_code_point : public exception {
+    public:
+        invalid_code_point(utfchar32_t codepoint) : offending_cp(codepoint) {}
+        virtual const char* what() const UTF_CPP_NOEXCEPT UTF_CPP_OVERRIDE { return "Invalid code point"; }
+        /// The value passed to the constructor.
+        utfchar32_t code_point() const { return offending_cp; }
+    private:
+        utfchar32_t offending_cp;
+    };
+    /// Thrown for malformed UTF-8 input; carries one offending octet.
+    class invalid_utf8 : public exception {
+    public:
+        invalid_utf8 (utfchar8_t u) : offending_octet(u) {}
+        invalid_utf8 (char c) : offending_octet(static_cast<utfchar8_t>(c)) {}
+        virtual const char* what() const UTF_CPP_NOEXCEPT UTF_CPP_OVERRIDE { return "Invalid UTF-8"; }
+        /// The octet passed to the constructor.
+        utfchar8_t utf8_octet() const { return offending_octet; }
+    private:
+        utfchar8_t offending_octet;
+    };
+    /// Thrown for malformed UTF-16 input; carries one offending 16-bit word.
+    class invalid_utf16 : public exception {
+    public:
+        invalid_utf16 (utfchar16_t u) : offending_word(u) {}
+        virtual const char* what() const UTF_CPP_NOEXCEPT UTF_CPP_OVERRIDE { return "Invalid UTF-16"; }
+        /// The word passed to the constructor.
+        utfchar16_t utf16_word() const { return offending_word; }
+    private:
+        utfchar16_t offending_word;
+    };
+    /// Thrown when a range ends before a complete sequence could be read.
+    class not_enough_room : public exception {
+    public:
+        virtual const char* what() const UTF_CPP_NOEXCEPT UTF_CPP_OVERRIDE
+        {
+            return "Not enough space";
+        }
+    };
+    /// The library API - functions intended to be called by the users
+    /// Checked append: writes `cp` as UTF-8 through `result` and returns the
+    /// advanced iterator. Throws invalid_code_point when `cp` is not valid.
+    template <typename octet_iterator>
+    octet_iterator append(utfchar32_t cp, octet_iterator result)
+    {
+        if (utf8::internal::is_code_point_valid(cp))
+            return internal::append(cp, result);
+        throw invalid_code_point(cp);
+    }
+    /// Checked append of `cp`, encoded as UTF-8, to the end of `s`.
+    inline void append(utfchar32_t cp, std::string& s)
+    {
+        std::back_insert_iterator<std::string> tail = std::back_inserter(s);
+        append(cp, tail);
+    }
+    /// Checked append16: writes `cp` as UTF-16 through `result` and returns the
+    /// advanced iterator. Throws invalid_code_point when `cp` is not valid.
+    template <typename word_iterator>
+    word_iterator append16(utfchar32_t cp, word_iterator result)
+    {
+        if (utf8::internal::is_code_point_valid(cp))
+            return internal::append16(cp, result);
+        throw invalid_code_point(cp);
+    }
+    /// Copy [start, end) to `out`, substituting `replacement` (encoded as
+    /// UTF-8) for every sequence that validate_next rejects. Well-formed
+    /// sequences are copied octet by octet. Returns the advanced `out`.
+    template <typename octet_iterator, typename output_iterator>
+    output_iterator replace_invalid(octet_iterator start, octet_iterator end, output_iterator out, utfchar32_t replacement)
+    {
+        while (start != end) {
+            octet_iterator sequence_start = start;
+            const internal::utf_error status = utf8::internal::validate_next(start, end);
+            if (status == internal::UTF8_OK) {
+                // validate_next moved start past the sequence: copy it verbatim
+                for (octet_iterator src = sequence_start; src != start; ++src)
+                    *out++ = *src;
+                continue;
+            }
+            // every kind of failure yields exactly one replacement mark
+            out = utf8::append (replacement, out);
+            if (status == internal::NOT_ENOUGH_ROOM) {
+                // truncated sequence at the very end: nothing left to scan
+                start = end;
+                continue;
+            }
+            ++start;
+            if (status != internal::INVALID_LEAD) {
+                // just one replacement mark for the sequence
+                while (start != end && utf8::internal::is_trail(*start))
+                    ++start;
+            }
+        }
+        return out;
+    }
+    /// Same as the four-argument overload with 0xfffd as the replacement.
+    template <typename octet_iterator, typename output_iterator>
+    inline output_iterator replace_invalid(octet_iterator start, octet_iterator end, output_iterator out)
+    {
+        static const utfchar32_t default_marker = static_cast<utfchar32_t>(utf8::internal::mask16(0xfffd));
+        return utf8::replace_invalid(start, end, out, default_marker);
+    }
+    /// std::string overload: returns a copy of `s` in which every invalid
+    /// sequence is replaced by `replacement`.
+    inline std::string replace_invalid(const std::string& s, utfchar32_t replacement)
+    {
+        std::string cleaned;
+        std::back_insert_iterator<std::string> sink = std::back_inserter(cleaned);
+        replace_invalid(s.begin(), s.end(), sink, replacement);
+        return cleaned;
+    }
+    /// std::string overload using the default replacement of the
+    /// three-argument iterator overload.
+    inline std::string replace_invalid(const std::string& s)
+    {
+        std::string cleaned;
+        std::back_insert_iterator<std::string> sink = std::back_inserter(cleaned);
+        replace_invalid(s.begin(), s.end(), sink);
+        return cleaned;
+    }
+    /// Decode the UTF-8 sequence at `it`, advance `it` past it and return the
+    /// code point.
+    /// Throws not_enough_room when the range ends too early, invalid_code_point
+    /// when the decoded value is rejected, and invalid_utf8 (carrying the octet
+    /// at `it`) for any other malformed sequence.
+    template <typename octet_iterator>
+    utfchar32_t next(octet_iterator& it, octet_iterator end)
+    {
+        utfchar32_t cp = 0;
+        const internal::utf_error status = utf8::internal::validate_next(it, end, cp);
+        if (status == internal::NOT_ENOUGH_ROOM)
+            throw not_enough_room();
+        if (status == internal::INVALID_CODE_POINT)
+            throw invalid_code_point(cp);
+        if (status != internal::UTF8_OK)    // bad lead, incomplete or over-long
+            throw invalid_utf8(static_cast<utfchar8_t>(*it));
+        return cp;
+    }
+    /// Decode the UTF-16 sequence (one word or a surrogate pair) at `it`,
+    /// advance `it` past it and return the code point.
+    /// Throws not_enough_room when the range ends too early and invalid_utf16
+    /// (carrying the word at `it`) for a lone or mismatched surrogate.
+    template <typename word_iterator>
+    utfchar32_t next16(word_iterator& it, word_iterator end)
+    {
+        utfchar32_t cp = 0;
+        internal::utf_error err_code = utf8::internal::validate_next16(it, end, cp);
+        switch (err_code) {
+            case internal::UTF8_OK :
+                break;
+            case internal::NOT_ENOUGH_ROOM :
+                throw not_enough_room();
+            default :
+                // Malformed input must not be reported as code point 0.
+                // validate_next16 left `it` on the first word of the failing
+                // sequence, so a caller looping on next16 would never advance.
+                throw invalid_utf16(static_cast<utfchar16_t>(*it));
+        }
+        return cp;
+    }
+    /// Like next(), but `it` is taken by value, so the caller's iterator does
+    /// not move. Throws the same exceptions as next().
+    template <typename octet_iterator>
+    utfchar32_t peek_next(octet_iterator it, octet_iterator end)
+    {
+        const utfchar32_t cp = utf8::next(it, end);
+        return cp;
+    }
+    /// Move `it` back to the lead octet of the preceding sequence and return
+    /// the code point decoded from there up to the old position.
+    /// Throws not_enough_room when `it == start`, invalid_utf8 when only trail
+    /// octets are found back to `start`, plus whatever peek_next throws.
+    template <typename octet_iterator>
+    utfchar32_t prior(octet_iterator& it, octet_iterator start)
+    {
+        // can't do much if it == start
+        if (it == start)
+            throw not_enough_room();
+        octet_iterator end = it;
+        // Go back until we hit either a lead octet or start
+        for (;;) {
+            --it;
+            if (!utf8::internal::is_trail(*it))
+                break;
+            if (it == start)
+                throw invalid_utf8(*it); // error - no lead byte in the sequence
+        }
+        return utf8::peek_next(it, end);
+    }
+    /// Move `it` by `n` code points: forward with next() when n is positive,
+    /// backward with prior() when n is negative. `end` is the bound handed to
+    /// those functions, so for a negative n it plays the role of the start of
+    /// the range.
+    template <typename octet_iterator, typename distance_type>
+    void advance (octet_iterator& it, distance_type n, octet_iterator end)
+    {
+        const distance_type zero(0);
+        if (n < zero) {
+            // backward
+            for (distance_type remaining = n; remaining < zero; ++remaining)
+                utf8::prior(it, end);
+            return;
+        }
+        // forward
+        for (distance_type done = zero; done < n; ++done)
+            utf8::next(it, end);
+    }
+    /// Number of code points in [first, last), counted by decoding with next()
+    /// (whose exceptions propagate). The iterators are compared with `<`.
+    template <typename octet_iterator>
+    typename std::iterator_traits<octet_iterator>::difference_type
+    distance (octet_iterator first, octet_iterator last)
+    {
+        typedef typename std::iterator_traits<octet_iterator>::difference_type count_type;
+        count_type count = 0;
+        while (first < last) {
+            utf8::next(first, last);
+            ++count;
+        }
+        return count;
+    }
+    /// Convert the UTF-16 words in [start, end) to UTF-8 written through
+    /// `result`; returns the advanced output iterator.
+    /// Throws invalid_utf16 for a lead surrogate without a following trail
+    /// surrogate and for a lone trail surrogate; append() may throw
+    /// invalid_code_point.
+    template <typename u16bit_iterator, typename octet_iterator>
+    octet_iterator utf16to8 (u16bit_iterator start, u16bit_iterator end, octet_iterator result)
+    {
+        while (start != end) {
+            utfchar32_t cp = static_cast<utfchar32_t>(utf8::internal::mask16(*start++));
+            if (utf8::internal::is_lead_surrogate(cp)) {
+                // Take care of surrogate pairs first
+                if (start == end)
+                    throw invalid_utf16(static_cast<utfchar16_t>(cp));
+                const utfchar32_t second = static_cast<utfchar32_t>(utf8::internal::mask16(*start++));
+                if (!utf8::internal::is_trail_surrogate(second))
+                    throw invalid_utf16(static_cast<utfchar16_t>(second));
+                cp = (cp << 10) + second + internal::SURROGATE_OFFSET;
+            }
+            else if (utf8::internal::is_trail_surrogate(cp)) {
+                // Lone trail surrogate
+                throw invalid_utf16(static_cast<utfchar16_t>(cp));
+            }
+            result = utf8::append(cp, result);
+        }
+        return result;
+    }
+    template <typename u16bit_iterator, typename octet_iterator>
+    u16bit_iterator utf8to16 (octet_iterator start, octet_iterator end, u16bit_iterator result)
+    {
+        while (start < end) {
+            const utfchar32_t cp = utf8::next(start, end);
+            if (cp <= 0xffff) { // fits in a single 16-bit unit
+                *result++ = static_cast<utfchar16_t>(cp);
+                continue;
+            }
+            *result++ = static_cast<utfchar16_t>((cp >> 10)   + internal::LEAD_OFFSET); // otherwise: lead surrogate first
+            *result++ = static_cast<utfchar16_t>((cp & 0x3ff) + internal::TRAIL_SURROGATE_MIN); // then the trail surrogate
+        }
+        return result;
+    }
+    template <typename octet_iterator, typename u32bit_iterator>
+    octet_iterator utf32to8 (u32bit_iterator start, u32bit_iterator end, octet_iterator result)
+    {
+        for (; start != end; ++start) // encode each code point in turn
+            result = utf8::append(*start, result);
+        return result;
+    }
+    template <typename octet_iterator, typename u32bit_iterator>
+    u32bit_iterator utf8to32 (octet_iterator start, octet_iterator end, u32bit_iterator result)
+    {
+        for (; start < end; ++result) // one decoded code point per output position
+            *result = utf8::next(start, end);
+        return result;
+    }
+    // Bidirectional code point iterator over octets delimited by range_start and range_end
+    template <typename octet_iterator>
+    class iterator {
+      octet_iterator it;          // current position in the octet sequence
+      octet_iterator range_start; // limit handed to utf8::prior when moving backward
+      octet_iterator range_end;   // limit handed to utf8::next when reading or moving forward
+      public:
+      typedef utfchar32_t value_type;
+      typedef utfchar32_t* pointer;
+      typedef utfchar32_t& reference;
+      typedef std::ptrdiff_t difference_type;
+      typedef std::bidirectional_iterator_tag iterator_category;
+      iterator () {}
+      explicit iterator (const octet_iterator& octet_it,
+                         const octet_iterator& rangestart,
+                         const octet_iterator& rangeend) :
+               it(octet_it), range_start(rangestart), range_end(rangeend)
+      {
+          if (it < range_start || it > range_end) // the position must lie within the given range
+              throw std::out_of_range("Invalid utf-8 iterator position");
+      }
+      // copy construction, assignment and destruction are left to the compiler
+      octet_iterator base () const { return it; }
+      utfchar32_t operator * () const
+      {
+          octet_iterator cursor(it); // decode from a copy so the iterator itself does not move
+          return utf8::next(cursor, range_end);
+      }
+      bool operator == (const iterator& rhs) const
+      {
+          if (range_start != rhs.range_start || range_end != rhs.range_end) // only same-range iterators are comparable
+              throw std::logic_error("Comparing utf-8 iterators defined with different ranges");
+          return it == rhs.it;
+      }
+      bool operator != (const iterator& rhs) const
+      {
+          return !(*this == rhs);
+      }
+      iterator& operator ++ ()
+      {
+          utf8::next(it, range_end);
+          return *this;
+      }
+      iterator operator ++ (int)
+      {
+          iterator previous(*this);
+          ++(*this);
+          return previous;
+      }
+      iterator& operator -- ()
+      {
+          utf8::prior(it, range_start);
+          return *this;
+      }
+      iterator operator -- (int)
+      {
+          iterator previous(*this);
+          --(*this);
+          return previous;
+      }
+    }; // class iterator
+} // namespace utf8
+#if UTF_CPP_CPLUSPLUS >= 201103L // C++ 11 or later
+namespace utf8 // std::basic_string convenience overloads (compiled only when UTF_CPP_CPLUSPLUS >= 201103L)
+{
+    inline void append16(utfchar32_t cp, std::u16string& s) // appends cp to s through the iterator-based append16
+    {
+        append16(cp, std::back_inserter(s));
+    }
+    inline std::string utf16to8(const std::u16string& s) // whole-string form of the iterator-based utf16to8; returns a new string
+    {
+        std::string result;
+        utf16to8(s.begin(), s.end(), std::back_inserter(result));
+        return result;
+    }
+    inline std::u16string utf8to16(const std::string& s) // whole-string form of the iterator-based utf8to16; returns a new string
+    {
+        std::u16string result;
+        utf8to16(s.begin(), s.end(), std::back_inserter(result));
+        return result;
+    }
+    inline std::string utf32to8(const std::u32string& s) // whole-string form of the iterator-based utf32to8; returns a new string
+    {
+        std::string result;
+        utf32to8(s.begin(), s.end(), std::back_inserter(result));
+        return result;
+    }
+    inline std::u32string utf8to32(const std::string& s) // whole-string form of the iterator-based utf8to32; returns a new string
+    {
+        std::u32string result;
+        utf8to32(s.begin(), s.end(), std::back_inserter(result));
+        return result;
+    }
+} // namespace utf8
+#endif // C++ 11 or later
+#if UTF_CPP_CPLUSPLUS >= 201703L // C++ 17 or later
+namespace utf8 // string_view convenience overloads (compiled only when UTF_CPP_CPLUSPLUS >= 201703L)
+{
+    inline std::string utf16to8(std::u16string_view s) // forwards the view's range to the iterator-based utf16to8
+    {
+        std::string result;
+        utf16to8(s.begin(), s.end(), std::back_inserter(result));
+        return result;
+    }
+    inline std::u16string utf8to16(std::string_view s) // forwards the view's range to the iterator-based utf8to16
+    {
+        std::u16string result;
+        utf8to16(s.begin(), s.end(), std::back_inserter(result));
+        return result;
+    }
+    inline std::string utf32to8(std::u32string_view s) // forwards the view's range to the iterator-based utf32to8
+    {
+        std::string result;
+        utf32to8(s.begin(), s.end(), std::back_inserter(result));
+        return result;
+    }
+    inline std::u32string utf8to32(std::string_view s) // forwards the view's range to the iterator-based utf8to32
+    {
+        std::u32string result;
+        utf8to32(s.begin(), s.end(), std::back_inserter(result));
+        return result;
+    }
+    inline std::size_t find_invalid(std::string_view s) // offset reported by the iterator-based find_invalid, or npos
+    {
+        std::string_view::const_iterator invalid = find_invalid(s.begin(), s.end());
+        return (invalid == s.end()) ? std::string_view::npos : static_cast<std::size_t>(invalid - s.begin()); // end() result maps to npos
+    }
+    inline bool is_valid(std::string_view s) // forwards the view's range to the iterator-based is_valid
+    {
+        return is_valid(s.begin(), s.end());
+    }
+    inline std::string replace_invalid(std::string_view s, char32_t replacement) // returns a new string; 'replacement' is passed through to the iterator-based overload
+    {
+        std::string result;
+        replace_invalid(s.begin(), s.end(), std::back_inserter(result), replacement);
+        return result;
+    }
+    inline std::string replace_invalid(std::string_view s) // same, using the iterator-based overload that takes no replacement argument
+    {
+        std::string result;
+        replace_invalid(s.begin(), s.end(), std::back_inserter(result));
+        return result;
+    }
+    inline bool starts_with_bom(std::string_view s) // forwards the view's range to the iterator-based starts_with_bom
+    {
+        return starts_with_bom(s.begin(), s.end());
+    }
+} // namespace utf8
+#endif // C++ 17 or later
+#if UTF_CPP_CPLUSPLUS >= 202002L // C++ 20 or later
+namespace utf8 // std::u8string / std::u8string_view overloads (compiled only when UTF_CPP_CPLUSPLUS >= 202002L)
+{
+    inline std::u8string utf16tou8(const std::u16string& s) // like utf16to8, but collects the octets in a std::u8string
+    {
+        std::u8string result;
+        utf16to8(s.begin(), s.end(), std::back_inserter(result));
+        return result;
+    }
+    inline std::u8string utf16tou8(std::u16string_view s) // view form of the overload above
+    {
+        std::u8string result;
+        utf16to8(s.begin(), s.end(), std::back_inserter(result));
+        return result;
+    }
+    inline std::u16string utf8to16(const std::u8string& s) // forwards s's range to the iterator-based utf8to16
+    {
+        std::u16string result;
+        utf8to16(s.begin(), s.end(), std::back_inserter(result));
+        return result;
+    }
+    inline std::u16string utf8to16(const std::u8string_view& s) // view form of the overload above
+    {
+        std::u16string result;
+        utf8to16(s.begin(), s.end(), std::back_inserter(result));
+        return result;
+    }
+    inline std::u8string utf32tou8(const std::u32string& s) // like utf32to8, but collects the octets in a std::u8string
+    {
+        std::u8string result;
+        utf32to8(s.begin(), s.end(), std::back_inserter(result));
+        return result;
+    }
+    inline std::u8string utf32tou8(const std::u32string_view& s) // view form of the overload above
+    {
+        std::u8string result;
+        utf32to8(s.begin(), s.end(), std::back_inserter(result));
+        return result;
+    }
+    inline std::u32string utf8to32(const std::u8string& s) // forwards s's range to the iterator-based utf8to32
+    {
+        std::u32string result;
+        utf8to32(s.begin(), s.end(), std::back_inserter(result));
+        return result;
+    }
+    inline std::u32string utf8to32(const std::u8string_view& s) // view form of the overload above
+    {
+        std::u32string result;
+        utf8to32(s.begin(), s.end(), std::back_inserter(result));
+        return result;
+    }
+    inline std::size_t find_invalid(const std::u8string& s) // offset reported by the iterator-based find_invalid, or npos
+    {
+        std::u8string::const_iterator invalid = find_invalid(s.begin(), s.end());
+        return (invalid == s.end()) ? std::string_view::npos : static_cast<std::size_t>(invalid - s.begin()); // end() result maps to std::string_view::npos
+    }
+    inline bool is_valid(const std::u8string& s) // forwards s's range to the iterator-based is_valid
+    {
+        return is_valid(s.begin(), s.end());
+    }
+    inline std::u8string replace_invalid(const std::u8string& s, char32_t replacement) // returns a new string; 'replacement' is passed through to the iterator-based overload
+    {
+        std::u8string result;
+        replace_invalid(s.begin(), s.end(), std::back_inserter(result), replacement);
+        return result;
+    }
+    inline std::u8string replace_invalid(const std::u8string& s) // same, using the iterator-based overload that takes no replacement argument
+    {
+        std::u8string result;
+        replace_invalid(s.begin(), s.end(), std::back_inserter(result));
+        return result;
+    }
+    inline bool starts_with_bom(const std::u8string& s) // forwards s's range to the iterator-based starts_with_bom
+    {
+        return starts_with_bom(s.begin(), s.end());
+    }
+ 
+} // namespace utf8
+#endif // C++ 20 or later
+namespace utf8
+{
+    namespace unchecked
+    {
+        template <typename octet_iterator>
+        octet_iterator append(utfchar32_t cp, octet_iterator result) // unchecked variant: hands cp straight to internal::append
+        {
+            return internal::append(cp, result); // the returned iterator is passed back to the caller unchanged
+        }
+        template <typename word_iterator>
+        word_iterator append16(utfchar32_t cp, word_iterator result) // unchecked variant: hands cp straight to internal::append16
+        {
+            return internal::append16(cp, result); // the returned iterator is passed back to the caller unchanged
+        }
+        template <typename octet_iterator, typename output_iterator>
+        output_iterator replace_invalid(octet_iterator start, octet_iterator end, output_iterator out, utfchar32_t replacement) // copies [start, end) to out, writing 'replacement' where validate_next reports an error
+        {
+            while (start != end) {
+                octet_iterator sequence_start = start; // remembered so an accepted sequence can be copied verbatim
+                internal::utf_error err_code = utf8::internal::validate_next(start, end);
+                switch (err_code) {
+                    case internal::UTF8_OK :
+                        for (octet_iterator it = sequence_start; it != start; ++it) // copy the octets validate_next stepped over
+                            *out++ = *it;
+                        break;
+                    case internal::NOT_ENOUGH_ROOM:
+                        out = utf8::unchecked::append(replacement, out);
+                        start = end; // ends the outer loop: the remaining input is dropped after one replacement
+                        break;
+                    case internal::INVALID_LEAD:
+                        out = utf8::unchecked::append(replacement, out);
+                        ++start; // skip just the offending octet
+                        break;
+                    case internal::INCOMPLETE_SEQUENCE:
+                    case internal::OVERLONG_SEQUENCE:
+                    case internal::INVALID_CODE_POINT:
+                        out = utf8::unchecked::append(replacement, out);
+                        ++start;
+                        // just one replacement mark for the sequence
+                        while (start != end && utf8::internal::is_trail(*start)) // also skip the trail octets that follow
+                            ++start;
+                        break;
+                }
+            }
+            return out;
+        }
+        template <typename octet_iterator, typename output_iterator>
+        inline output_iterator replace_invalid(octet_iterator start, octet_iterator end, output_iterator out)
+        {
+            static const utfchar32_t default_marker = static_cast<utfchar32_t>(utf8::internal::mask16(0xfffd)); // marker used when the caller supplies none
+            return utf8::unchecked::replace_invalid(start, end, out, default_marker);
+        }
+        inline std::string replace_invalid(const std::string& s, utfchar32_t replacement)
+        {
+            std::string repaired; // receives the output of the iterator-based overload
+            replace_invalid(s.begin(), s.end(), std::back_inserter(repaired), replacement);
+            return repaired;
+        }
+        inline std::string replace_invalid(const std::string& s)
+        {
+            std::string repaired; // receives the output of the iterator-based overload (no explicit marker)
+            replace_invalid(s.begin(), s.end(), std::back_inserter(repaired));
+            return repaired;
+        }
+        template <typename octet_iterator>
+        utfchar32_t next(octet_iterator& it) // decodes the sequence at 'it' and leaves 'it' just past it; performs no bounds or validity checks itself
+        {
+            utfchar32_t cp = utf8::internal::mask8(*it); // start from the lead octet
+            switch (utf8::internal::sequence_length(it)) { // no default: for any other length cp stays the masked lead octet
+                case 1:
+                    break;
+                case 2:
+                    ++it;
+                    cp = ((cp << 6) & 0x7ff) + ((*it) & 0x3f); // lead -> bits 6..10, 2nd octet -> bits 0..5
+                    break;
+                case 3:
+                    ++it;
+                    cp = ((cp << 12) & 0xffff) + ((utf8::internal::mask8(*it) << 6) & 0xfff); // lead -> bits 12..15, 2nd octet -> bits 6..11
+                    ++it;
+                    cp = static_cast<utfchar32_t>(cp + ((*it) & 0x3f)); // 3rd octet -> bits 0..5
+                    break;
+                case 4:
+                    ++it;
+                    cp = ((cp << 18) & 0x1fffff) + ((utf8::internal::mask8(*it) << 12) & 0x3ffff); // lead -> bits 18..20, 2nd octet -> bits 12..17
+                    ++it;
+                    cp = static_cast<utfchar32_t>(cp + ((utf8::internal::mask8(*it) << 6) & 0xfff)); // 3rd octet -> bits 6..11
+                    ++it;
+                    cp = static_cast<utfchar32_t>(cp + ((*it) & 0x3f)); // 4th octet -> bits 0..5
+                    break;
+            }
+            ++it; // step past the last octet that was read
+            return cp;
+        }
+        template <typename octet_iterator>
+        utfchar32_t peek_next(octet_iterator it) // 'it' is taken by value, so the caller's iterator is not advanced
+        {
+            return utf8::unchecked::next(it); // next() advances only the local copy
+        }
+        template <typename word_iterator>
+        utfchar32_t next16(word_iterator& it) // decodes one code point from 16-bit units and advances 'it' past it; no validation
+        {
+            utfchar32_t cp = utf8::internal::mask16(*it++); // first unit: a whole code point or a lead surrogate
+            if (utf8::internal::is_lead_surrogate(cp)) // surrogate pair: the next unit is consumed as the trail
+                return (cp << 10) + utf8::internal::mask16(*it++) + utf8::internal::SURROGATE_OFFSET; // trail is masked like the lead so a signed 16-bit element cannot sign-extend into the sum
+            return cp;
+        }
+        template <typename octet_iterator>
+        utfchar32_t prior(octet_iterator& it)
+        {
+            do { --it; } while (utf8::internal::is_trail(*it)); // back up until a non-trail octet is reached
+            octet_iterator lead = it; // decode from a copy so 'it' stays on that octet
+            return utf8::unchecked::next(lead);
+        }
+        template <typename octet_iterator, typename distance_type>
+        void advance(octet_iterator& it, distance_type n)
+        {
+            const distance_type zero(0);
+            if (!(n < zero)) {
+                // forward: decode n code points
+                for (distance_type step = zero; step < n; ++step)
+                    utf8::unchecked::next(it);
+            } else {
+                // backward: step back -n code points
+                for (distance_type step = n; step < zero; ++step)
+                    utf8::unchecked::prior(it);
+            }
+        }
+        template <typename octet_iterator>
+        typename std::iterator_traits<octet_iterator>::difference_type
+        distance(octet_iterator first, octet_iterator last)
+        {
+            typename std::iterator_traits<octet_iterator>::difference_type count = 0;
+            for (; first < last; utf8::unchecked::next(first)) // one unchecked decode per counted code point
+                ++count;
+            return count;
+        }
+        template <typename u16bit_iterator, typename octet_iterator>
+        octet_iterator utf16to8(u16bit_iterator start, u16bit_iterator end, octet_iterator result)
+        {
+            while (start != end) {
+                utfchar32_t cp = utf8::internal::mask16(*start++);
+                if (utf8::internal::is_lead_surrogate(cp)) {
+                    // A lead surrogate that ends the input is dropped without output
+                    if (start == end)
+                        break;
+                    const utfchar32_t trail = utf8::internal::mask16(*start++);
+                    cp = (cp << 10) + trail + internal::SURROGATE_OFFSET;
+                }
+                result = utf8::unchecked::append(cp, result);
+            }
+            return result;
+        }
+        template <typename u16bit_iterator, typename octet_iterator>
+        u16bit_iterator utf8to16(octet_iterator start, octet_iterator end, u16bit_iterator result)
+        {
+            while (start < end) {
+                const utfchar32_t cp = utf8::unchecked::next(start);
+                if (cp <= 0xffff) { // fits in a single 16-bit unit
+                    *result++ = static_cast<utfchar16_t>(cp);
+                    continue;
+                }
+                *result++ = static_cast<utfchar16_t>((cp >> 10)   + internal::LEAD_OFFSET); // otherwise: lead surrogate first
+                *result++ = static_cast<utfchar16_t>((cp & 0x3ff) + internal::TRAIL_SURROGATE_MIN); // then the trail surrogate
+            }
+            return result;
+        }
+        template <typename octet_iterator, typename u32bit_iterator>
+        octet_iterator utf32to8(u32bit_iterator start, u32bit_iterator end, octet_iterator result)
+        {
+            for (; start != end; ++start) // encode each code point in turn
+                result = utf8::unchecked::append(*start, result);
+            return result;
+        }
+        template <typename octet_iterator, typename u32bit_iterator>
+        u32bit_iterator utf8to32(octet_iterator start, octet_iterator end, u32bit_iterator result)
+        {
+            for (; start < end; ++result) // one decoded code point per output position
+                *result = utf8::unchecked::next(start);
+            return result;
+        }
+        // Bidirectional code point iterator that wraps an octet iterator without any range checks
+        template <typename octet_iterator>
+          class iterator {
+            octet_iterator it; // current position in the octet sequence
+            public:
+            typedef utfchar32_t value_type;
+            typedef utfchar32_t* pointer;
+            typedef utfchar32_t& reference;
+            typedef std::ptrdiff_t difference_type;
+            typedef std::bidirectional_iterator_tag iterator_category;
+            iterator () {}
+            explicit iterator (const octet_iterator& octet_it): it(octet_it) {}
+            // copy construction, assignment and destruction are left to the compiler
+            octet_iterator base () const { return it; }
+            utfchar32_t operator * () const
+            {
+                octet_iterator cursor(it); // decode from a copy so the iterator itself does not move
+                return utf8::unchecked::next(cursor);
+            }
+            bool operator == (const iterator& rhs) const
+            {
+                return it == rhs.it;
+            }
+            bool operator != (const iterator& rhs) const
+            {
+                return !(*this == rhs);
+            }
+            iterator& operator ++ ()
+            {
+                ::std::advance(it, utf8::internal::sequence_length(it)); // skip the whole sequence at the current position
+                return *this;
+            }
+            iterator operator ++ (int)
+            {
+                iterator previous(*this);
+                ++(*this);
+                return previous;
+            }
+            iterator& operator -- ()
+            {
+                utf8::unchecked::prior(it);
+                return *this;
+            }
+            iterator operator -- (int)
+            {
+                iterator previous(*this);
+                --(*this);
+                return previous;
+            }
+          }; // class iterator
+    } // namespace utf8::unchecked
+} // namespace utf8
+#endif // header guard