diff options
Diffstat (limited to 'tests/unit/check-qjson.c')
-rw-r--r-- | tests/unit/check-qjson.c | 1518 |
1 files changed, 1518 insertions, 0 deletions
diff --git a/tests/unit/check-qjson.c b/tests/unit/check-qjson.c new file mode 100644 index 0000000000..c845f91d43 --- /dev/null +++ b/tests/unit/check-qjson.c @@ -0,0 +1,1518 @@ +/* + * Copyright IBM, Corp. 2009 + * Copyright (c) 2013, 2015 Red Hat Inc. + * + * Authors: + * Anthony Liguori <aliguori@us.ibm.com> + * Markus Armbruster <armbru@redhat.com> + * + * This work is licensed under the terms of the GNU LGPL, version 2.1 or later. + * See the COPYING.LIB file in the top-level directory. + * + */ + +#include "qemu/osdep.h" + +#include "qapi/error.h" +#include "qapi/qmp/qbool.h" +#include "qapi/qmp/qjson.h" +#include "qapi/qmp/qlit.h" +#include "qapi/qmp/qnull.h" +#include "qapi/qmp/qnum.h" +#include "qapi/qmp/qstring.h" +#include "qemu/unicode.h" +#include "qemu-common.h" + +static QString *from_json_str(const char *jstr, bool single, Error **errp) +{ + char quote = single ? '\'' : '"'; + char *qjstr = g_strdup_printf("%c%s%c", quote, jstr, quote); + QString *ret = qobject_to(QString, qobject_from_json(qjstr, errp)); + + g_free(qjstr); + return ret; +} + +static char *to_json_str(QString *str) +{ + GString *json = qobject_to_json(QOBJECT(str)); + + if (!json) { + return NULL; + } + /* peel off double quotes */ + g_string_truncate(json, json->len - 1); + g_string_erase(json, 0, 1); + return g_string_free(json, false); +} + +static void escaped_string(void) +{ + struct { + /* Content of JSON string to parse with qobject_from_json() */ + const char *json_in; + /* Expected parse output; to unparse with qobject_to_json() */ + const char *utf8_out; + int skip; + } test_cases[] = { + { "\\b\\f\\n\\r\\t\\\\\\\"", "\b\f\n\r\t\\\"" }, + { "\\/\\'", "/'", .skip = 1 }, + { "single byte utf-8 \\u0020", "single byte utf-8 ", .skip = 1 }, + { "double byte utf-8 \\u00A2", "double byte utf-8 \xc2\xa2" }, + { "triple byte utf-8 \\u20AC", "triple byte utf-8 \xe2\x82\xac" }, + { "quadruple byte utf-8 \\uD834\\uDD1E", /* U+1D11E */ + "quadruple byte utf-8 \xF0\x9D\x84\x9E" }, + { "\\", NULL }, + { "\\z", NULL }, + { "\\ux", NULL }, + { "\\u1x", NULL }, + { "\\u12x", NULL }, + { "\\u123x", NULL }, + { "\\u12345", "\341\210\2645" }, + { "\\u0000x", "\xC0\x80x" }, + { "unpaired leading surrogate \\uD800", NULL }, + { "unpaired leading surrogate \\uD800\\uCAFE", NULL }, + { "unpaired leading surrogate \\uD800\\uD801\\uDC02", NULL }, + { "unpaired trailing surrogate \\uDC00", NULL }, + { "backward surrogate pair \\uDC00\\uD800", NULL }, + { "noncharacter U+FDD0 \\uFDD0", NULL }, + { "noncharacter U+FDEF \\uFDEF", NULL }, + { "noncharacter U+1FFFE \\uD87F\\uDFFE", NULL }, + { "noncharacter U+10FFFF \\uDC3F\\uDFFF", NULL }, + {} + }; + int i, j; + QString *cstr; + char *jstr; + + for (i = 0; test_cases[i].json_in; i++) { + for (j = 0; j < 2; j++) { + if (test_cases[i].utf8_out) { + cstr = from_json_str(test_cases[i].json_in, j, &error_abort); + g_assert_cmpstr(qstring_get_str(cstr), + ==, test_cases[i].utf8_out); + if (!test_cases[i].skip) { + jstr = to_json_str(cstr); + g_assert_cmpstr(jstr, ==, test_cases[i].json_in); + g_free(jstr); + } + qobject_unref(cstr); + } else { + cstr = from_json_str(test_cases[i].json_in, j, NULL); + g_assert(!cstr); + } + } + } +} + +static void string_with_quotes(void) +{ + const char *test_cases[] = { + "\"the bee's knees\"", + "'double quote \"'", + NULL + }; + int i; + QString *str; + char *cstr; + + for (i = 0; test_cases[i]; i++) { + str = qobject_to(QString, + qobject_from_json(test_cases[i], &error_abort)); + g_assert(str); + cstr = g_strndup(test_cases[i] + 1, strlen(test_cases[i]) - 2); + g_assert_cmpstr(qstring_get_str(str), ==, cstr); + g_free(cstr); + qobject_unref(str); + } +} + +static void utf8_string(void) +{ + /* + * Most test cases are scraped from Markus Kuhn's UTF-8 decoder + * capability and stress test at + * http://www.cl.cam.ac.uk/~mgk25/ucs/examples/UTF-8-test.txt + */ + static const struct { + /* Content of JSON string to parse with qobject_from_json() */ + const char *json_in; + /* Expected parse output */ + const char *utf8_out; + /* Expected unparse output, defaults to @json_in */ + const char *json_out; + } test_cases[] = { + /* 0 Control characters */ + { + /* + * Note: \x00 is impossible, other representations of + * U+0000 are covered under 4.3 + */ + "\x01\x02\x03\x04\x05\x06\x07" + "\x08\x09\x0A\x0B\x0C\x0D\x0E\x0F" + "\x10\x11\x12\x13\x14\x15\x16\x17" + "\x18\x19\x1A\x1B\x1C\x1D\x1E\x1F", + NULL, + "\\u0001\\u0002\\u0003\\u0004\\u0005\\u0006\\u0007" + "\\b\\t\\n\\u000B\\f\\r\\u000E\\u000F" + "\\u0010\\u0011\\u0012\\u0013\\u0014\\u0015\\u0016\\u0017" + "\\u0018\\u0019\\u001A\\u001B\\u001C\\u001D\\u001E\\u001F", + }, + /* 1 Some correct UTF-8 text */ + { + /* a bit of German */ + "Falsches \xC3\x9C" "ben von Xylophonmusik qu\xC3\xA4lt" + " jeden gr\xC3\xB6\xC3\x9F" "eren Zwerg.", + "Falsches \xC3\x9C" "ben von Xylophonmusik qu\xC3\xA4lt" + " jeden gr\xC3\xB6\xC3\x9F" "eren Zwerg.", + "Falsches \\u00DCben von Xylophonmusik qu\\u00E4lt" + " jeden gr\\u00F6\\u00DFeren Zwerg.", + }, + { + /* a bit of Greek */ + "\xCE\xBA\xE1\xBD\xB9\xCF\x83\xCE\xBC\xCE\xB5", + "\xCE\xBA\xE1\xBD\xB9\xCF\x83\xCE\xBC\xCE\xB5", + "\\u03BA\\u1F79\\u03C3\\u03BC\\u03B5", + }, + /* '%' character when not interpolating */ + { + "100%", + "100%", + }, + /* 2 Boundary condition test cases */ + /* 2.1 First possible sequence of a certain length */ + /* + * 2.1.1 1 byte U+0020 + * Control characters are already covered by their own test + * case under 0. Test the first 1 byte non-control character + * here. + */ + { + " ", + " ", + }, + /* 2.1.2 2 bytes U+0080 */ + { + "\xC2\x80", + "\xC2\x80", + "\\u0080", + }, + /* 2.1.3 3 bytes U+0800 */ + { + "\xE0\xA0\x80", + "\xE0\xA0\x80", + "\\u0800", + }, + /* 2.1.4 4 bytes U+10000 */ + { + "\xF0\x90\x80\x80", + "\xF0\x90\x80\x80", + "\\uD800\\uDC00", + }, + /* 2.1.5 5 bytes U+200000 */ + { + "\xF8\x88\x80\x80\x80", + NULL, + "\\uFFFD", + }, + /* 2.1.6 6 bytes U+4000000 */ + { + "\xFC\x84\x80\x80\x80\x80", + NULL, + "\\uFFFD", + }, + /* 2.2 Last possible sequence of a certain length */ + /* 2.2.1 1 byte U+007F */ + { + "\x7F", + "\x7F", + "\\u007F", + }, + /* 2.2.2 2 bytes U+07FF */ + { + "\xDF\xBF", + "\xDF\xBF", + "\\u07FF", + }, + /* + * 2.2.3 3 bytes U+FFFC + * The last possible sequence is actually U+FFFF. But that's + * a noncharacter, and already covered by its own test case + * under 5.3. Same for U+FFFE. U+FFFD is the last character + * in the BMP, and covered under 2.3. Because of U+FFFD's + * special role as replacement character, it's worth testing + * U+FFFC here. + */ + { + "\xEF\xBF\xBC", + "\xEF\xBF\xBC", + "\\uFFFC", + }, + /* 2.2.4 4 bytes U+1FFFFF */ + { + "\xF7\xBF\xBF\xBF", + NULL, + "\\uFFFD", + }, + /* 2.2.5 5 bytes U+3FFFFFF */ + { + "\xFB\xBF\xBF\xBF\xBF", + NULL, + "\\uFFFD", + }, + /* 2.2.6 6 bytes U+7FFFFFFF */ + { + "\xFD\xBF\xBF\xBF\xBF\xBF", + NULL, + "\\uFFFD", + }, + /* 2.3 Other boundary conditions */ + { + /* last one before surrogate range: U+D7FF */ + "\xED\x9F\xBF", + "\xED\x9F\xBF", + "\\uD7FF", + }, + { + /* first one after surrogate range: U+E000 */ + "\xEE\x80\x80", + "\xEE\x80\x80", + "\\uE000", + }, + { + /* last one in BMP: U+FFFD */ + "\xEF\xBF\xBD", + "\xEF\xBF\xBD", + "\\uFFFD", + }, + { + /* last one in last plane: U+10FFFD */ + "\xF4\x8F\xBF\xBD", + "\xF4\x8F\xBF\xBD", + "\\uDBFF\\uDFFD" + }, + { + /* first one beyond Unicode range: U+110000 */ + "\xF4\x90\x80\x80", + NULL, + "\\uFFFD", + }, + /* 3 Malformed sequences */ + /* 3.1 Unexpected continuation bytes */ + /* 3.1.1 First continuation byte */ + { + "\x80", + NULL, + "\\uFFFD", + }, + /* 3.1.2 Last continuation byte */ + { + "\xBF", + NULL, + "\\uFFFD", + }, + /* 3.1.3 2 continuation bytes */ + { + "\x80\xBF", + NULL, + "\\uFFFD\\uFFFD", + }, + /* 3.1.4 3 continuation bytes */ + { + "\x80\xBF\x80", + NULL, + "\\uFFFD\\uFFFD\\uFFFD", + }, + /* 3.1.5 4 continuation bytes */ + { + "\x80\xBF\x80\xBF", + NULL, + "\\uFFFD\\uFFFD\\uFFFD\\uFFFD", + }, + /* 3.1.6 5 continuation bytes */ + { + "\x80\xBF\x80\xBF\x80", + NULL, + "\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD", + }, + /* 3.1.7 6 continuation bytes */ + { + "\x80\xBF\x80\xBF\x80\xBF", + NULL, + "\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD", + }, + /* 3.1.8 7 continuation bytes */ + { + "\x80\xBF\x80\xBF\x80\xBF\x80", + NULL, + "\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD", + }, + /* 3.1.9 Sequence of all 64 possible continuation bytes */ + { + "\x80\x81\x82\x83\x84\x85\x86\x87" + "\x88\x89\x8A\x8B\x8C\x8D\x8E\x8F" + "\x90\x91\x92\x93\x94\x95\x96\x97" + "\x98\x99\x9A\x9B\x9C\x9D\x9E\x9F" + "\xA0\xA1\xA2\xA3\xA4\xA5\xA6\xA7" + "\xA8\xA9\xAA\xAB\xAC\xAD\xAE\xAF" + "\xB0\xB1\xB2\xB3\xB4\xB5\xB6\xB7" + "\xB8\xB9\xBA\xBB\xBC\xBD\xBE\xBF", + NULL, + "\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD" + "\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD" + "\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD" + "\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD" + "\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD" + "\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD" + "\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD" + "\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD", + }, + /* 3.2 Lonely start characters */ + /* 3.2.1 All 32 first bytes of 2-byte sequences, followed by space */ + { + "\xC0 \xC1 \xC2 \xC3 \xC4 \xC5 \xC6 \xC7 " + "\xC8 \xC9 \xCA \xCB \xCC \xCD \xCE \xCF " + "\xD0 \xD1 \xD2 \xD3 \xD4 \xD5 \xD6 \xD7 " + "\xD8 \xD9 \xDA \xDB \xDC \xDD \xDE \xDF ", + NULL, + "\\uFFFD \\uFFFD \\uFFFD \\uFFFD \\uFFFD \\uFFFD \\uFFFD \\uFFFD " + "\\uFFFD \\uFFFD \\uFFFD \\uFFFD \\uFFFD \\uFFFD \\uFFFD \\uFFFD " + "\\uFFFD \\uFFFD \\uFFFD \\uFFFD \\uFFFD \\uFFFD \\uFFFD \\uFFFD " + "\\uFFFD \\uFFFD \\uFFFD \\uFFFD \\uFFFD \\uFFFD \\uFFFD \\uFFFD ", + }, + /* 3.2.2 All 16 first bytes of 3-byte sequences, followed by space */ + { + "\xE0 \xE1 \xE2 \xE3 \xE4 \xE5 \xE6 \xE7 " + "\xE8 \xE9 \xEA \xEB \xEC \xED \xEE \xEF ", + NULL, + "\\uFFFD \\uFFFD \\uFFFD \\uFFFD \\uFFFD \\uFFFD \\uFFFD \\uFFFD " + "\\uFFFD \\uFFFD \\uFFFD \\uFFFD \\uFFFD \\uFFFD \\uFFFD \\uFFFD ", + }, + /* 3.2.3 All 8 first bytes of 4-byte sequences, followed by space */ + { + "\xF0 \xF1 \xF2 \xF3 \xF4 \xF5 \xF6 \xF7 ", + NULL, + "\\uFFFD \\uFFFD \\uFFFD \\uFFFD \\uFFFD \\uFFFD \\uFFFD \\uFFFD ", + }, + /* 3.2.4 All 4 first bytes of 5-byte sequences, followed by space */ + { + "\xF8 \xF9 \xFA \xFB ", + NULL, + "\\uFFFD \\uFFFD \\uFFFD \\uFFFD ", + }, + /* 3.2.5 All 2 first bytes of 6-byte sequences, followed by space */ + { + "\xFC \xFD ", + NULL, + "\\uFFFD \\uFFFD ", + }, + /* 3.3 Sequences with last continuation byte missing */ + /* 3.3.1 2-byte sequence with last byte missing (U+0000) */ + { + "\xC0", + NULL, + "\\uFFFD", + }, + /* 3.3.2 3-byte sequence with last byte missing (U+0000) */ + { + "\xE0\x80", + NULL, + "\\uFFFD", + }, + /* 3.3.3 4-byte sequence with last byte missing (U+0000) */ + { + "\xF0\x80\x80", + NULL, + "\\uFFFD", + }, + /* 3.3.4 5-byte sequence with last byte missing (U+0000) */ + { + "\xF8\x80\x80\x80", + NULL, + "\\uFFFD", + }, + /* 3.3.5 6-byte sequence with last byte missing (U+0000) */ + { + "\xFC\x80\x80\x80\x80", + NULL, + "\\uFFFD", + }, + /* 3.3.6 2-byte sequence with last byte missing (U+07FF) */ + { + "\xDF", + NULL, + "\\uFFFD", + }, + /* 3.3.7 3-byte sequence with last byte missing (U+FFFF) */ + { + "\xEF\xBF", + NULL, + "\\uFFFD", + }, + /* 3.3.8 4-byte sequence with last byte missing (U+1FFFFF) */ + { + "\xF7\xBF\xBF", + NULL, + "\\uFFFD", + }, + /* 3.3.9 5-byte sequence with last byte missing (U+3FFFFFF) */ + { + "\xFB\xBF\xBF\xBF", + NULL, + "\\uFFFD", + }, + /* 3.3.10 6-byte sequence with last byte missing (U+7FFFFFFF) */ + { + "\xFD\xBF\xBF\xBF\xBF", + NULL, + "\\uFFFD", + }, + /* 3.4 Concatenation of incomplete sequences */ + { + "\xC0\xE0\x80\xF0\x80\x80\xF8\x80\x80\x80\xFC\x80\x80\x80\x80" + "\xDF\xEF\xBF\xF7\xBF\xBF\xFB\xBF\xBF\xBF\xFD\xBF\xBF\xBF\xBF", + NULL, + "\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD" + "\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD", + }, + /* 3.5 Impossible bytes */ + { + "\xFE", + NULL, + "\\uFFFD", + }, + { + "\xFF", + NULL, + "\\uFFFD", + }, + { + "\xFE\xFE\xFF\xFF", + NULL, + "\\uFFFD\\uFFFD\\uFFFD\\uFFFD", + }, + /* 4 Overlong sequences */ + /* 4.1 Overlong '/' */ + { + "\xC0\xAF", + NULL, + "\\uFFFD", + }, + { + "\xE0\x80\xAF", + NULL, + "\\uFFFD", + }, + { + "\xF0\x80\x80\xAF", + NULL, + "\\uFFFD", + }, + { + "\xF8\x80\x80\x80\xAF", + NULL, + "\\uFFFD", + }, + { + "\xFC\x80\x80\x80\x80\xAF", + NULL, + "\\uFFFD", + }, + /* + * 4.2 Maximum overlong sequences + * Highest Unicode value that is still resulting in an + * overlong sequence if represented with the given number of + * bytes. This is a boundary test for safe UTF-8 decoders. + */ + { + /* \U+007F */ + "\xC1\xBF", + NULL, + "\\uFFFD", + }, + { + /* \U+07FF */ + "\xE0\x9F\xBF", + NULL, + "\\uFFFD", + }, + { + /* + * \U+FFFC + * The actual maximum would be U+FFFF, but that's a + * noncharacter. Testing U+FFFC seems more useful. See + * also 2.2.3 + */ + "\xF0\x8F\xBF\xBC", + NULL, + "\\uFFFD", + }, + { + /* \U+1FFFFF */ + "\xF8\x87\xBF\xBF\xBF", + NULL, + "\\uFFFD", + }, + { + /* \U+3FFFFFF */ + "\xFC\x83\xBF\xBF\xBF\xBF", + NULL, + "\\uFFFD", + }, + /* 4.3 Overlong representation of the NUL character */ + { + /* \U+0000 */ + "\xC0\x80", + "\xC0\x80", + "\\u0000", + }, + { + /* \U+0000 */ + "\xE0\x80\x80", + NULL, + "\\uFFFD", + }, + { + /* \U+0000 */ + "\xF0\x80\x80\x80", + NULL, + "\\uFFFD", + }, + { + /* \U+0000 */ + "\xF8\x80\x80\x80\x80", + NULL, + "\\uFFFD", + }, + { + /* \U+0000 */ + "\xFC\x80\x80\x80\x80\x80", + NULL, + "\\uFFFD", + }, + /* 5 Illegal code positions */ + /* 5.1 Single UTF-16 surrogates */ + { + /* \U+D800 */ + "\xED\xA0\x80", + NULL, + "\\uFFFD", + }, + { + /* \U+DB7F */ + "\xED\xAD\xBF", + NULL, + "\\uFFFD", + }, + { + /* \U+DB80 */ + "\xED\xAE\x80", + NULL, + "\\uFFFD", + }, + { + /* \U+DBFF */ + "\xED\xAF\xBF", + NULL, + "\\uFFFD", + }, + { + /* \U+DC00 */ + "\xED\xB0\x80", + NULL, + "\\uFFFD", + }, + { + /* \U+DF80 */ + "\xED\xBE\x80", + NULL, + "\\uFFFD", + }, + { + /* \U+DFFF */ + "\xED\xBF\xBF", + NULL, + "\\uFFFD", + }, + /* 5.2 Paired UTF-16 surrogates */ + { + /* \U+D800\U+DC00 */ + "\xED\xA0\x80\xED\xB0\x80", + NULL, + "\\uFFFD\\uFFFD", + }, + { + /* \U+D800\U+DFFF */ + "\xED\xA0\x80\xED\xBF\xBF", + NULL, + "\\uFFFD\\uFFFD", + }, + { + /* \U+DB7F\U+DC00 */ + "\xED\xAD\xBF\xED\xB0\x80", + NULL, + "\\uFFFD\\uFFFD", + }, + { + /* \U+DB7F\U+DFFF */ + "\xED\xAD\xBF\xED\xBF\xBF", + NULL, + "\\uFFFD\\uFFFD", + }, + { + /* \U+DB80\U+DC00 */ + "\xED\xAE\x80\xED\xB0\x80", + NULL, + "\\uFFFD\\uFFFD", + }, + { + /* \U+DB80\U+DFFF */ + "\xED\xAE\x80\xED\xBF\xBF", + NULL, + "\\uFFFD\\uFFFD", + }, + { + /* \U+DBFF\U+DC00 */ + "\xED\xAF\xBF\xED\xB0\x80", + NULL, + "\\uFFFD\\uFFFD", + }, + { + /* \U+DBFF\U+DFFF */ + "\xED\xAF\xBF\xED\xBF\xBF", + NULL, + "\\uFFFD\\uFFFD", + }, + /* 5.3 Other illegal code positions */ + /* BMP noncharacters */ + { + /* \U+FFFE */ + "\xEF\xBF\xBE", + NULL, + "\\uFFFD", + }, + { + /* \U+FFFF */ + "\xEF\xBF\xBF", + NULL, + "\\uFFFD", + }, + { + /* U+FDD0 */ + "\xEF\xB7\x90", + NULL, + "\\uFFFD", + }, + { + /* U+FDEF */ + "\xEF\xB7\xAF", + NULL, + "\\uFFFD", + }, + /* Plane 1 .. 16 noncharacters */ + { + /* U+1FFFE U+1FFFF U+2FFFE U+2FFFF ... U+10FFFE U+10FFFF */ + "\xF0\x9F\xBF\xBE\xF0\x9F\xBF\xBF" + "\xF0\xAF\xBF\xBE\xF0\xAF\xBF\xBF" + "\xF0\xBF\xBF\xBE\xF0\xBF\xBF\xBF" + "\xF1\x8F\xBF\xBE\xF1\x8F\xBF\xBF" + "\xF1\x9F\xBF\xBE\xF1\x9F\xBF\xBF" + "\xF1\xAF\xBF\xBE\xF1\xAF\xBF\xBF" + "\xF1\xBF\xBF\xBE\xF1\xBF\xBF\xBF" + "\xF2\x8F\xBF\xBE\xF2\x8F\xBF\xBF" + "\xF2\x9F\xBF\xBE\xF2\x9F\xBF\xBF" + "\xF2\xAF\xBF\xBE\xF2\xAF\xBF\xBF" + "\xF2\xBF\xBF\xBE\xF2\xBF\xBF\xBF" + "\xF3\x8F\xBF\xBE\xF3\x8F\xBF\xBF" + "\xF3\x9F\xBF\xBE\xF3\x9F\xBF\xBF" + "\xF3\xAF\xBF\xBE\xF3\xAF\xBF\xBF" + "\xF3\xBF\xBF\xBE\xF3\xBF\xBF\xBF" + "\xF4\x8F\xBF\xBE\xF4\x8F\xBF\xBF", + NULL, + "\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD" + "\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD" + "\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD" + "\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD\\uFFFD", + }, + {} + }; + int i, j; + QString *str; + const char *json_in, *utf8_out, *utf8_in, *json_out, *tail; + char *end, *in, *jstr; + + for (i = 0; test_cases[i].json_in; i++) { + for (j = 0; j < 2; j++) { + json_in = test_cases[i].json_in; + utf8_out = test_cases[i].utf8_out; + utf8_in = test_cases[i].utf8_out ?: test_cases[i].json_in; + json_out = test_cases[i].json_out ?: test_cases[i].json_in; + + /* Parse @json_in, expect @utf8_out */ + if (utf8_out) { + str = from_json_str(json_in, j, &error_abort); + g_assert_cmpstr(qstring_get_str(str), ==, utf8_out); + qobject_unref(str); + } else { + str = from_json_str(json_in, j, NULL); + g_assert(!str); + /* + * Failure may be due to any sequence, but *all* sequences + * are expected to fail. Test each one in isolation. + */ + for (tail = json_in; *tail; tail = end) { + mod_utf8_codepoint(tail, 6, &end); + if (*end == ' ') { + end++; + } + in = g_strndup(tail, end - tail); + str = from_json_str(in, j, NULL); + g_assert(!str); + g_free(in); + } + } + + /* Unparse @utf8_in, expect @json_out */ + str = qstring_from_str(utf8_in); + jstr = to_json_str(str); + g_assert_cmpstr(jstr, ==, json_out); + qobject_unref(str); + g_free(jstr); + + /* Parse @json_out right back, unless it has replacements */ + if (!strstr(json_out, "\\uFFFD")) { + str = from_json_str(json_out, j, &error_abort); + g_assert_cmpstr(qstring_get_str(str), ==, utf8_in); + qobject_unref(str); + } + } + } +} + +static void int_number(void) +{ + struct { + const char *encoded; + int64_t decoded; + const char *reencoded; + } test_cases[] = { + { "0", 0 }, + { "1234", 1234 }, + { "1", 1 }, + { "-32", -32 }, + { "-0", 0, "0" }, + {}, + }; + int i; + QNum *qnum; + int64_t ival; + uint64_t uval; + GString *str; + + for (i = 0; test_cases[i].encoded; i++) { + qnum = qobject_to(QNum, + qobject_from_json(test_cases[i].encoded, + &error_abort)); + g_assert(qnum); + g_assert(qnum_get_try_int(qnum, &ival)); + g_assert_cmpint(ival, ==, test_cases[i].decoded); + if (test_cases[i].decoded >= 0) { + g_assert(qnum_get_try_uint(qnum, &uval)); + g_assert_cmpuint(uval, ==, (uint64_t)test_cases[i].decoded); + } else { + g_assert(!qnum_get_try_uint(qnum, &uval)); + } + g_assert_cmpfloat(qnum_get_double(qnum), ==, + (double)test_cases[i].decoded); + + str = qobject_to_json(QOBJECT(qnum)); + g_assert_cmpstr(str->str, ==, + test_cases[i].reencoded ?: test_cases[i].encoded); + g_string_free(str, true); + + qobject_unref(qnum); + } +} + +static void uint_number(void) +{ + struct { + const char *encoded; + uint64_t decoded; + const char *reencoded; + } test_cases[] = { + { "9223372036854775808", (uint64_t)1 << 63 }, + { "18446744073709551615", UINT64_MAX }, + {}, + }; + int i; + QNum *qnum; + int64_t ival; + uint64_t uval; + GString *str; + + for (i = 0; test_cases[i].encoded; i++) { + qnum = qobject_to(QNum, + qobject_from_json(test_cases[i].encoded, + &error_abort)); + g_assert(qnum); + g_assert(qnum_get_try_uint(qnum, &uval)); + g_assert_cmpuint(uval, ==, test_cases[i].decoded); + g_assert(!qnum_get_try_int(qnum, &ival)); + g_assert_cmpfloat(qnum_get_double(qnum), ==, + (double)test_cases[i].decoded); + + str = qobject_to_json(QOBJECT(qnum)); + g_assert_cmpstr(str->str, ==, + test_cases[i].reencoded ?: test_cases[i].encoded); + g_string_free(str, true); + + qobject_unref(qnum); + } +} + +static void float_number(void) +{ + struct { + const char *encoded; + double decoded; + const char *reencoded; + } test_cases[] = { + { "32.43", 32.43 }, + { "0.222", 0.222 }, + { "-32.12313", -32.12313, "-32.123130000000003" }, + { "-32.20e-10", -32.20e-10, "-3.22e-09" }, + { "18446744073709551616", 0x1p64, "1.8446744073709552e+19" }, + { "-9223372036854775809", -0x1p63, "-9.2233720368547758e+18" }, + {}, + }; + int i; + QNum *qnum; + int64_t ival; + uint64_t uval; + GString *str; + + for (i = 0; test_cases[i].encoded; i++) { + qnum = qobject_to(QNum, + qobject_from_json(test_cases[i].encoded, + &error_abort)); + g_assert(qnum); + g_assert_cmpfloat(qnum_get_double(qnum), ==, test_cases[i].decoded); + g_assert(!qnum_get_try_int(qnum, &ival)); + g_assert(!qnum_get_try_uint(qnum, &uval)); + + str = qobject_to_json(QOBJECT(qnum)); + g_assert_cmpstr(str->str, ==, + test_cases[i].reencoded ?: test_cases[i].encoded); + g_string_free(str, true); + + qobject_unref(qnum); + } +} + +static void keyword_literal(void) +{ + QObject *obj; + QBool *qbool; + QNull *null; + GString *str; + + obj = qobject_from_json("true", &error_abort); + qbool = qobject_to(QBool, obj); + g_assert(qbool); + g_assert(qbool_get_bool(qbool) == true); + + str = qobject_to_json(obj); + g_assert_cmpstr(str->str, ==, "true"); + g_string_free(str, true); + + qobject_unref(qbool); + + obj = qobject_from_json("false", &error_abort); + qbool = qobject_to(QBool, obj); + g_assert(qbool); + g_assert(qbool_get_bool(qbool) == false); + + str = qobject_to_json(obj); + g_assert_cmpstr(str->str, ==, "false"); + g_string_free(str, true); + + qobject_unref(qbool); + + obj = qobject_from_json("null", &error_abort); + g_assert(obj != NULL); + g_assert(qobject_type(obj) == QTYPE_QNULL); + + null = qnull(); + g_assert(QOBJECT(null) == obj); + + qobject_unref(obj); + qobject_unref(null); +} + +static void interpolation_valid(void) +{ + long long value_lld = 0x123456789abcdefLL; + int64_t value_d64 = value_lld; + long value_ld = (long)value_lld; + int value_d = (int)value_lld; + unsigned long long value_llu = 0xfedcba9876543210ULL; + uint64_t value_u64 = value_llu; + unsigned long value_lu = (unsigned long)value_llu; + unsigned value_u = (unsigned)value_llu; + double value_f = 2.323423423; + const char *value_s = "hello world"; + QObject *value_p = QOBJECT(qnull()); + QBool *qbool; + QNum *qnum; + QString *qstr; + QObject *qobj; + + /* bool */ + + qbool = qobject_to(QBool, qobject_from_jsonf_nofail("%i", false)); + g_assert(qbool); + g_assert(qbool_get_bool(qbool) == false); + qobject_unref(qbool); + + /* Test that non-zero values other than 1 get collapsed to true */ + qbool = qobject_to(QBool, qobject_from_jsonf_nofail("%i", 2)); + g_assert(qbool); + g_assert(qbool_get_bool(qbool) == true); + qobject_unref(qbool); + + /* number */ + + qnum = qobject_to(QNum, qobject_from_jsonf_nofail("%d", value_d)); + g_assert_cmpint(qnum_get_int(qnum), ==, value_d); + qobject_unref(qnum); + + qnum = qobject_to(QNum, qobject_from_jsonf_nofail("%ld", value_ld)); + g_assert_cmpint(qnum_get_int(qnum), ==, value_ld); + qobject_unref(qnum); + + qnum = qobject_to(QNum, qobject_from_jsonf_nofail("%lld", value_lld)); + g_assert_cmpint(qnum_get_int(qnum), ==, value_lld); + qobject_unref(qnum); + + qnum = qobject_to(QNum, qobject_from_jsonf_nofail("%" PRId64, value_d64)); + g_assert_cmpint(qnum_get_int(qnum), ==, value_lld); + qobject_unref(qnum); + + qnum = qobject_to(QNum, qobject_from_jsonf_nofail("%u", value_u)); + g_assert_cmpuint(qnum_get_uint(qnum), ==, value_u); + qobject_unref(qnum); + + qnum = qobject_to(QNum, qobject_from_jsonf_nofail("%lu", value_lu)); + g_assert_cmpuint(qnum_get_uint(qnum), ==, value_lu); + qobject_unref(qnum); + + qnum = qobject_to(QNum, qobject_from_jsonf_nofail("%llu", value_llu)); + g_assert_cmpuint(qnum_get_uint(qnum), ==, value_llu); + qobject_unref(qnum); + + qnum = qobject_to(QNum, qobject_from_jsonf_nofail("%" PRIu64, value_u64)); + g_assert_cmpuint(qnum_get_uint(qnum), ==, value_llu); + qobject_unref(qnum); + + qnum = qobject_to(QNum, qobject_from_jsonf_nofail("%f", value_f)); + g_assert(qnum_get_double(qnum) == value_f); + qobject_unref(qnum); + + /* string */ + + qstr = qobject_to(QString, qobject_from_jsonf_nofail("%s", value_s)); + g_assert_cmpstr(qstring_get_str(qstr), ==, value_s); + qobject_unref(qstr); + + /* object */ + + qobj = qobject_from_jsonf_nofail("%p", value_p); + g_assert(qobj == value_p); +} + +static void interpolation_unknown(void) +{ + if (g_test_subprocess()) { + qobject_from_jsonf_nofail("%x", 666); + } + g_test_trap_subprocess(NULL, 0, 0); + g_test_trap_assert_failed(); + g_test_trap_assert_stderr("*Unexpected error*" + "invalid interpolation '%x'*"); +} + +static void interpolation_string(void) +{ + if (g_test_subprocess()) { + qobject_from_jsonf_nofail("['%s', %s]", "eins", "zwei"); + } + g_test_trap_subprocess(NULL, 0, 0); + g_test_trap_assert_failed(); + g_test_trap_assert_stderr("*Unexpected error*" + "can't interpolate into string*"); +} + +static void simple_dict(void) +{ + int i; + struct { + const char *encoded; + QLitObject decoded; + } test_cases[] = { + { + .encoded = "{\"foo\": 42, \"bar\": \"hello world\"}", + .decoded = QLIT_QDICT(((QLitDictEntry[]){ + { "foo", QLIT_QNUM(42) }, + { "bar", QLIT_QSTR("hello world") }, + { } + })), + }, { + .encoded = "{}", + .decoded = QLIT_QDICT(((QLitDictEntry[]){ + { } + })), + }, { + .encoded = "{\"foo\": 43}", + .decoded = QLIT_QDICT(((QLitDictEntry[]){ + { "foo", QLIT_QNUM(43) }, + { } + })), + }, + { } + }; + + for (i = 0; test_cases[i].encoded; i++) { + QObject *obj; + GString *str; + + obj = qobject_from_json(test_cases[i].encoded, &error_abort); + g_assert(qlit_equal_qobject(&test_cases[i].decoded, obj)); + + str = qobject_to_json(obj); + qobject_unref(obj); + + obj = qobject_from_json(str->str, &error_abort); + g_assert(qlit_equal_qobject(&test_cases[i].decoded, obj)); + qobject_unref(obj); + g_string_free(str, true); + } +} + +/* + * this generates json of the form: + * a(0,m) = [0, 1, ..., m-1] + * a(n,m) = { + * 'key0': a(0,m), + * 'key1': a(1,m), + * ... + * 'key(n-1)': a(n-1,m) + * } + */ +static void gen_test_json(GString *gstr, int nest_level_max, + int elem_count) +{ + int i; + + g_assert(gstr); + if (nest_level_max == 0) { + g_string_append(gstr, "["); + for (i = 0; i < elem_count; i++) { + g_string_append_printf(gstr, "%d", i); + if (i < elem_count - 1) { + g_string_append_printf(gstr, ", "); + } + } + g_string_append(gstr, "]"); + return; + } + + g_string_append(gstr, "{"); + for (i = 0; i < nest_level_max; i++) { + g_string_append_printf(gstr, "'key%d': ", i); + gen_test_json(gstr, i, elem_count); + if (i < nest_level_max - 1) { + g_string_append(gstr, ","); + } + } + g_string_append(gstr, "}"); +} + +static void large_dict(void) +{ + GString *gstr = g_string_new(""); + QObject *obj; + + gen_test_json(gstr, 10, 100); + obj = qobject_from_json(gstr->str, &error_abort); + g_assert(obj != NULL); + + qobject_unref(obj); + g_string_free(gstr, true); +} + +static void simple_list(void) +{ + int i; + struct { + const char *encoded; + QLitObject decoded; + } test_cases[] = { + { + .encoded = "[43,42]", + .decoded = QLIT_QLIST(((QLitObject[]){ + QLIT_QNUM(43), + QLIT_QNUM(42), + { } + })), + }, + { + .encoded = "[43]", + .decoded = QLIT_QLIST(((QLitObject[]){ + QLIT_QNUM(43), + { } + })), + }, + { + .encoded = "[]", + .decoded = QLIT_QLIST(((QLitObject[]){ + { } + })), + }, + { + .encoded = "[{}]", + .decoded = QLIT_QLIST(((QLitObject[]){ + QLIT_QDICT(((QLitDictEntry[]){ + {}, + })), + {}, + })), + }, + { } + }; + + for (i = 0; test_cases[i].encoded; i++) { + QObject *obj; + GString *str; + + obj = qobject_from_json(test_cases[i].encoded, &error_abort); + g_assert(qlit_equal_qobject(&test_cases[i].decoded, obj)); + + str = qobject_to_json(obj); + qobject_unref(obj); + + obj = qobject_from_json(str->str, &error_abort); + g_assert(qlit_equal_qobject(&test_cases[i].decoded, obj)); + qobject_unref(obj); + g_string_free(str, true); + } +} + +static void simple_whitespace(void) +{ + int i; + struct { + const char *encoded; + QLitObject decoded; + } test_cases[] = { + { + .encoded = " [ 43 , 42 ]", + .decoded = QLIT_QLIST(((QLitObject[]){ + QLIT_QNUM(43), + QLIT_QNUM(42), + { } + })), + }, + { + .encoded = "\t[ 43 , { 'h' : 'b' },\r\n\t[ ], 42 ]\n", + .decoded = QLIT_QLIST(((QLitObject[]){ + QLIT_QNUM(43), + QLIT_QDICT(((QLitDictEntry[]){ + { "h", QLIT_QSTR("b") }, + { }})), + QLIT_QLIST(((QLitObject[]){ + { }})), + QLIT_QNUM(42), + { } + })), + }, + { + .encoded = " [ 43 , { 'h' : 'b' , 'a' : 32 }, [ ], 42 ]", + .decoded = QLIT_QLIST(((QLitObject[]){ + QLIT_QNUM(43), + QLIT_QDICT(((QLitDictEntry[]){ + { "h", QLIT_QSTR("b") }, + { "a", QLIT_QNUM(32) }, + { }})), + QLIT_QLIST(((QLitObject[]){ + { }})), + QLIT_QNUM(42), + { } + })), + }, + { } + }; + + for (i = 0; test_cases[i].encoded; i++) { + QObject *obj; + GString *str; + + obj = qobject_from_json(test_cases[i].encoded, &error_abort); + g_assert(qlit_equal_qobject(&test_cases[i].decoded, obj)); + + str = qobject_to_json(obj); + qobject_unref(obj); + + obj = qobject_from_json(str->str, &error_abort); + g_assert(qlit_equal_qobject(&test_cases[i].decoded, obj)); + + qobject_unref(obj); + g_string_free(str, true); + } +} + +static void simple_interpolation(void) +{ + QObject *embedded_obj; + QObject *obj; + QLitObject decoded = QLIT_QLIST(((QLitObject[]){ + QLIT_QNUM(1), + QLIT_QSTR("100%"), + QLIT_QLIST(((QLitObject[]){ + QLIT_QNUM(32), + QLIT_QNUM(42), + {}})), + {}})); + + embedded_obj = qobject_from_json("[32, 42]", &error_abort); + g_assert(embedded_obj != NULL); + + obj = qobject_from_jsonf_nofail("[%d, '100%%', %p]", 1, embedded_obj); + g_assert(qlit_equal_qobject(&decoded, obj)); + + qobject_unref(obj); +} + +static void empty_input(void) +{ + Error *err = NULL; + QObject *obj; + + obj = qobject_from_json("", &err); + error_free_or_abort(&err); + g_assert(obj == NULL); +} + +static void blank_input(void) +{ + Error *err = NULL; + QObject *obj; + + obj = qobject_from_json("\n ", &err); + error_free_or_abort(&err); + g_assert(obj == NULL); +} + +static void junk_input(void) +{ + /* Note: junk within strings is covered elsewhere */ + Error *err = NULL; + QObject *obj; + + obj = qobject_from_json("@", &err); + error_free_or_abort(&err); + g_assert(obj == NULL); + + obj = qobject_from_json("{\x01", &err); + error_free_or_abort(&err); + g_assert(obj == NULL); + + obj = qobject_from_json("[0\xFF]", &err); + error_free_or_abort(&err); + g_assert(obj == NULL); + + obj = qobject_from_json("00", &err); + error_free_or_abort(&err); + g_assert(obj == NULL); + + obj = qobject_from_json("[1e", &err); + error_free_or_abort(&err); + g_assert(obj == NULL); + + obj = qobject_from_json("truer", &err); + error_free_or_abort(&err); + g_assert(obj == NULL); +} + +static void unterminated_string(void) +{ + Error *err = NULL; + QObject *obj = qobject_from_json("\"abc", &err); + error_free_or_abort(&err); + g_assert(obj == NULL); +} + +static void unterminated_sq_string(void) +{ + Error *err = NULL; + QObject *obj = qobject_from_json("'abc", &err); + error_free_or_abort(&err); + g_assert(obj == NULL); +} + +static void unterminated_escape(void) +{ + Error *err = NULL; + QObject *obj = qobject_from_json("\"abc\\\"", &err); + error_free_or_abort(&err); + g_assert(obj == NULL); +} + +static void unterminated_array(void) +{ + Error *err = NULL; + QObject *obj = qobject_from_json("[32", &err); + error_free_or_abort(&err); + g_assert(obj == NULL); +} + +static void unterminated_array_comma(void) +{ + Error *err = NULL; + QObject *obj = qobject_from_json("[32,", &err); + error_free_or_abort(&err); + g_assert(obj == NULL); +} + +static void invalid_array_comma(void) +{ + Error *err = NULL; + QObject *obj = qobject_from_json("[32,}", &err); + error_free_or_abort(&err); + g_assert(obj == NULL); +} + +static void unterminated_dict(void) +{ + Error *err = NULL; + QObject *obj = qobject_from_json("{'abc':32", &err); + error_free_or_abort(&err); + g_assert(obj == NULL); +} + +static void unterminated_dict_comma(void) +{ + Error *err = NULL; + QObject *obj = qobject_from_json("{'abc':32,", &err); + error_free_or_abort(&err); + g_assert(obj == NULL); +} + +static void invalid_dict_comma(void) +{ + Error *err = NULL; + QObject *obj = qobject_from_json("{'abc':32,}", &err); + error_free_or_abort(&err); + g_assert(obj == NULL); +} + +static void invalid_dict_key(void) +{ + Error *err = NULL; + QObject *obj = qobject_from_json("{32:'abc'}", &err); + error_free_or_abort(&err); + g_assert(obj == NULL); +} + +static void unterminated_literal(void) +{ + Error *err = NULL; + QObject *obj = qobject_from_json("nul", &err); + error_free_or_abort(&err); + g_assert(obj == NULL); +} + +static char *make_nest(char *buf, size_t cnt) +{ + memset(buf, '[', cnt - 1); + buf[cnt - 1] = '{'; + buf[cnt] = '}'; + memset(buf + cnt + 1, ']', cnt - 1); + buf[2 * cnt] = 0; + return buf; +} + +static void limits_nesting(void) +{ + Error *err = NULL; + enum { max_nesting = 1024 }; /* see qobject/json-streamer.c */ + char buf[2 * (max_nesting + 1) + 1]; + QObject *obj; + + obj = qobject_from_json(make_nest(buf, max_nesting), &error_abort); + g_assert(obj != NULL); + qobject_unref(obj); + + obj = qobject_from_json(make_nest(buf, max_nesting + 1), &err); + error_free_or_abort(&err); + g_assert(obj == NULL); +} + +static void multiple_values(void) +{ + Error *err = NULL; + QObject *obj; + + obj = qobject_from_json("false true", &err); + error_free_or_abort(&err); + g_assert(obj == NULL); + + obj = qobject_from_json("} true", &err); + error_free_or_abort(&err); + g_assert(obj == NULL); +} + +int main(int argc, char **argv) +{ + g_test_init(&argc, &argv, NULL); + + g_test_add_func("/literals/string/escaped", escaped_string); + g_test_add_func("/literals/string/quotes", string_with_quotes); + g_test_add_func("/literals/string/utf8", utf8_string); + + g_test_add_func("/literals/number/int", int_number); + g_test_add_func("/literals/number/uint", uint_number); + g_test_add_func("/literals/number/float", float_number); + + g_test_add_func("/literals/keyword", keyword_literal); + + g_test_add_func("/literals/interpolation/valid", interpolation_valid); + g_test_add_func("/literals/interpolation/unkown", interpolation_unknown); + g_test_add_func("/literals/interpolation/string", interpolation_string); + + g_test_add_func("/dicts/simple_dict", simple_dict); + g_test_add_func("/dicts/large_dict", large_dict); + g_test_add_func("/lists/simple_list", simple_list); + + g_test_add_func("/mixed/simple_whitespace", simple_whitespace); + g_test_add_func("/mixed/interpolation", simple_interpolation); + + g_test_add_func("/errors/empty", empty_input); + g_test_add_func("/errors/blank", blank_input); + g_test_add_func("/errors/junk", junk_input); + g_test_add_func("/errors/unterminated/string", unterminated_string); + g_test_add_func("/errors/unterminated/escape", unterminated_escape); + g_test_add_func("/errors/unterminated/sq_string", unterminated_sq_string); + g_test_add_func("/errors/unterminated/array", unterminated_array); + g_test_add_func("/errors/unterminated/array_comma", unterminated_array_comma); + g_test_add_func("/errors/unterminated/dict", unterminated_dict); + g_test_add_func("/errors/unterminated/dict_comma", unterminated_dict_comma); + g_test_add_func("/errors/invalid_array_comma", invalid_array_comma); + g_test_add_func("/errors/invalid_dict_comma", invalid_dict_comma); + g_test_add_func("/errors/invalid_dict_key", invalid_dict_key); + g_test_add_func("/errors/unterminated/literal", unterminated_literal); + g_test_add_func("/errors/limits/nesting", limits_nesting); + g_test_add_func("/errors/multiple_values", multiple_values); + + return g_test_run(); +} |