… | |
… | |
27 | #define F_SPACE_AFTER 0x00000040UL |
27 | #define F_SPACE_AFTER 0x00000040UL |
28 | #define F_ALLOW_NONREF 0x00000100UL |
28 | #define F_ALLOW_NONREF 0x00000100UL |
29 | #define F_SHRINK 0x00000200UL |
29 | #define F_SHRINK 0x00000200UL |
30 | #define F_ALLOW_BLESSED 0x00000400UL |
30 | #define F_ALLOW_BLESSED 0x00000400UL |
31 | #define F_CONV_BLESSED 0x00000800UL |
31 | #define F_CONV_BLESSED 0x00000800UL |
|
|
32 | #define F_RELAXED 0x00001000UL |
|
|
33 | |
32 | #define F_MAXDEPTH 0xf8000000UL |
34 | #define F_MAXDEPTH 0xf8000000UL |
33 | #define S_MAXDEPTH 27 |
35 | #define S_MAXDEPTH 27 |
34 | #define F_MAXSIZE 0x01f00000UL |
36 | #define F_MAXSIZE 0x01f00000UL |
35 | #define S_MAXSIZE 20 |
37 | #define S_MAXSIZE 20 |
36 | #define F_HOOK 0x00080000UL // some hooks exist, so slow-path processing |
38 | #define F_HOOK 0x00080000UL // some hooks exist, so slow-path processing |
… | |
… | |
60 | #define expect_false(expr) expect ((expr) != 0, 0) |
62 | #define expect_false(expr) expect ((expr) != 0, 0) |
61 | #define expect_true(expr) expect ((expr) != 0, 1) |
63 | #define expect_true(expr) expect ((expr) != 0, 1) |
62 | |
64 | |
63 | #ifdef USE_ITHREADS |
65 | #ifdef USE_ITHREADS |
64 | # define JSON_SLOW 1 |
66 | # define JSON_SLOW 1 |
|
|
67 | # define JSON_STASH (json_stash ? json_stash : gv_stashpv ("JSON::XS", 1)) |
65 | #else |
68 | #else |
66 | # define JSON_SLOW 0 |
69 | # define JSON_SLOW 0 |
|
|
70 | # define JSON_STASH json_stash |
67 | #endif |
71 | #endif |
68 | |
72 | |
69 | static HV *json_stash, *json_boolean_stash; // JSON::XS:: |
73 | static HV *json_stash, *json_boolean_stash; // JSON::XS:: |
70 | static SV *json_true, *json_false; |
74 | static SV *json_true, *json_false; |
71 | |
75 | |
… | |
… | |
333 | --enc->indent; |
337 | --enc->indent; |
334 | encode_indent (enc); encode_ch (enc, ']'); |
338 | encode_indent (enc); encode_ch (enc, ']'); |
335 | } |
339 | } |
336 | |
340 | |
337 | static void |
341 | static void |
338 | encode_he (enc_t *enc, HE *he) |
342 | encode_hk (enc_t *enc, HE *he) |
339 | { |
343 | { |
340 | encode_ch (enc, '"'); |
344 | encode_ch (enc, '"'); |
341 | |
345 | |
342 | if (HeKLEN (he) == HEf_SVKEY) |
346 | if (HeKLEN (he) == HEf_SVKEY) |
343 | { |
347 | { |
… | |
… | |
356 | encode_ch (enc, '"'); |
360 | encode_ch (enc, '"'); |
357 | |
361 | |
358 | if (enc->json.flags & F_SPACE_BEFORE) encode_space (enc); |
362 | if (enc->json.flags & F_SPACE_BEFORE) encode_space (enc); |
359 | encode_ch (enc, ':'); |
363 | encode_ch (enc, ':'); |
360 | if (enc->json.flags & F_SPACE_AFTER ) encode_space (enc); |
364 | if (enc->json.flags & F_SPACE_AFTER ) encode_space (enc); |
361 | encode_sv (enc, HeVAL (he)); |
|
|
362 | } |
365 | } |
363 | |
366 | |
364 | // compare hash entries, used when all keys are bytestrings |
367 | // compare hash entries, used when all keys are bytestrings |
365 | static int |
368 | static int |
366 | he_cmp_fast (const void *a_, const void *b_) |
369 | he_cmp_fast (const void *a_, const void *b_) |
… | |
… | |
371 | HE *b = *(HE **)b_; |
374 | HE *b = *(HE **)b_; |
372 | |
375 | |
373 | STRLEN la = HeKLEN (a); |
376 | STRLEN la = HeKLEN (a); |
374 | STRLEN lb = HeKLEN (b); |
377 | STRLEN lb = HeKLEN (b); |
375 | |
378 | |
376 | if (!(cmp = memcmp (HeKEY (a), HeKEY (b), la < lb ? la : lb))) |
379 | if (!(cmp = memcmp (HeKEY (b), HeKEY (a), lb < la ? lb : la))) |
377 | cmp = la - lb; |
380 | cmp = lb - la; |
378 | |
381 | |
379 | return cmp; |
382 | return cmp; |
380 | } |
383 | } |
381 | |
384 | |
382 | // compare hash entries, used when some keys are sv's or utf-x |
385 | // compare hash entries, used when some keys are sv's or utf-x |
383 | static int |
386 | static int |
384 | he_cmp_slow (const void *a, const void *b) |
387 | he_cmp_slow (const void *a, const void *b) |
385 | { |
388 | { |
386 | return sv_cmp (HeSVKEY_force (*(HE **)a), HeSVKEY_force (*(HE **)b)); |
389 | return sv_cmp (HeSVKEY_force (*(HE **)b), HeSVKEY_force (*(HE **)a)); |
387 | } |
390 | } |
388 | |
391 | |
389 | static void |
392 | static void |
390 | encode_hv (enc_t *enc, HV *hv) |
393 | encode_hv (enc_t *enc, HV *hv) |
391 | { |
394 | { |
|
|
395 | HE *he; |
392 | int count, i; |
396 | int count; |
393 | |
397 | |
394 | if (enc->indent >= enc->maxdepth) |
398 | if (enc->indent >= enc->maxdepth) |
395 | croak ("data structure too deep (hit recursion limit)"); |
399 | croak ("data structure too deep (hit recursion limit)"); |
396 | |
400 | |
397 | encode_ch (enc, '{'); encode_nl (enc); ++enc->indent; |
401 | encode_ch (enc, '{'); encode_nl (enc); ++enc->indent; |
398 | |
402 | |
399 | if ((count = hv_iterinit (hv))) |
|
|
400 | { |
|
|
401 | // for canonical output we have to sort by keys first |
403 | // for canonical output we have to sort by keys first |
402 | // actually, this is mostly due to the stupid so-called |
404 | // actually, this is mostly due to the stupid so-called |
403 | // security workaround added somewhere in 5.8.x. |
405 | // security workaround added somewhere in 5.8.x. |
404 | // that randomises hash orderings |
406 | // that randomises hash orderings |
405 | if (enc->json.flags & F_CANONICAL) |
407 | if (enc->json.flags & F_CANONICAL) |
|
|
408 | { |
|
|
409 | int count = hv_iterinit (hv); |
|
|
410 | |
|
|
411 | if (SvMAGICAL (hv)) |
406 | { |
412 | { |
|
|
413 | // need to count by iterating. could improve by dynamically building the vector below |
|
|
414 | // but I don't care for the speed of this special case. |
|
|
415 | // note also that we will run into undefined behaviour when the two iterations |
|
|
416 | // do not result in the same count, something I might care for in some later release. |
|
|
417 | |
|
|
418 | count = 0; |
|
|
419 | while (hv_iternext (hv)) |
|
|
420 | ++count; |
|
|
421 | |
|
|
422 | hv_iterinit (hv); |
|
|
423 | } |
|
|
424 | |
|
|
425 | if (count) |
|
|
426 | { |
407 | int fast = 1; |
427 | int i, fast = 1; |
408 | HE *he; |
|
|
409 | #if defined(__BORLANDC__) || defined(_MSC_VER) |
428 | #if defined(__BORLANDC__) || defined(_MSC_VER) |
410 | HE **hes = _alloca (count * sizeof (HE)); |
429 | HE **hes = _alloca (count * sizeof (HE)); |
411 | #else |
430 | #else |
412 | HE *hes [count]; // if your compiler dies here, you need to enable C99 mode |
431 | HE *hes [count]; // if your compiler dies here, you need to enable C99 mode |
413 | #endif |
432 | #endif |
… | |
… | |
440 | |
459 | |
441 | FREETMPS; |
460 | FREETMPS; |
442 | LEAVE; |
461 | LEAVE; |
443 | } |
462 | } |
444 | |
463 | |
445 | for (i = 0; i < count; ++i) |
464 | while (count--) |
446 | { |
465 | { |
447 | encode_indent (enc); |
466 | encode_indent (enc); |
|
|
467 | he = hes [count]; |
448 | encode_he (enc, hes [i]); |
468 | encode_hk (enc, he); |
|
|
469 | encode_sv (enc, expect_false (SvMAGICAL (hv)) ? hv_iterval (hv, he) : HeVAL (he)); |
449 | |
470 | |
450 | if (i < count - 1) |
471 | if (count) |
451 | encode_comma (enc); |
472 | encode_comma (enc); |
452 | } |
473 | } |
453 | |
|
|
454 | encode_nl (enc); |
|
|
455 | } |
474 | } |
|
|
475 | } |
456 | else |
476 | else |
457 | { |
477 | { |
|
|
478 | if (hv_iterinit (hv) || SvMAGICAL (hv)) |
458 | HE *he = hv_iternext (hv); |
479 | if ((he = hv_iternext (hv))) |
459 | |
|
|
460 | for (;;) |
480 | for (;;) |
461 | { |
481 | { |
462 | encode_indent (enc); |
482 | encode_indent (enc); |
463 | encode_he (enc, he); |
483 | encode_hk (enc, he); |
|
|
484 | encode_sv (enc, expect_false (SvMAGICAL (hv)) ? hv_iterval (hv, he) : HeVAL (he)); |
464 | |
485 | |
465 | if (!(he = hv_iternext (hv))) |
486 | if (!(he = hv_iternext (hv))) |
466 | break; |
487 | break; |
467 | |
488 | |
468 | encode_comma (enc); |
489 | encode_comma (enc); |
469 | } |
490 | } |
|
|
491 | } |
470 | |
492 | |
471 | encode_nl (enc); |
493 | encode_nl (enc); |
472 | } |
|
|
473 | } |
|
|
474 | |
494 | |
475 | --enc->indent; encode_indent (enc); encode_ch (enc, '}'); |
495 | --enc->indent; encode_indent (enc); encode_ch (enc, '}'); |
476 | } |
496 | } |
477 | |
497 | |
478 | // encode objects, arrays and special \0=false and \1=true values. |
498 | // encode objects, arrays and special \0=false and \1=true values. |
… | |
… | |
690 | |
710 | |
691 | if (ch > 0x20 |
711 | if (ch > 0x20 |
692 | || (ch != 0x20 && ch != 0x0a && ch != 0x0d && ch != 0x09)) |
712 | || (ch != 0x20 && ch != 0x0a && ch != 0x0d && ch != 0x09)) |
693 | break; |
713 | break; |
694 | |
714 | |
|
|
715 | if (ch == '#' && dec->json.flags & F_RELAXED) |
|
|
716 | ++dec->cur; |
|
|
717 | |
695 | ++dec->cur; |
718 | ++dec->cur; |
696 | } |
719 | } |
697 | } |
720 | } |
698 | |
721 | |
699 | #define ERR(reason) SB dec->err = reason; goto fail; SE |
722 | #define ERR(reason) SB dec->err = reason; goto fail; SE |
… | |
… | |
1035 | |
1058 | |
1036 | if (*dec->cur != ',') |
1059 | if (*dec->cur != ',') |
1037 | ERR (", or ] expected while parsing array"); |
1060 | ERR (", or ] expected while parsing array"); |
1038 | |
1061 | |
1039 | ++dec->cur; |
1062 | ++dec->cur; |
|
|
1063 | |
|
|
1064 | decode_ws (dec); |
|
|
1065 | |
|
|
1066 | if (*dec->cur == ']' && dec->json.flags & F_RELAXED) |
|
|
1067 | { |
|
|
1068 | ++dec->cur; |
|
|
1069 | break; |
|
|
1070 | } |
1040 | } |
1071 | } |
1041 | |
1072 | |
1042 | DEC_DEC_DEPTH; |
1073 | DEC_DEC_DEPTH; |
1043 | return newRV_noinc ((SV *)av); |
1074 | return newRV_noinc ((SV *)av); |
1044 | |
1075 | |
… | |
… | |
1060 | if (*dec->cur == '}') |
1091 | if (*dec->cur == '}') |
1061 | ++dec->cur; |
1092 | ++dec->cur; |
1062 | else |
1093 | else |
1063 | for (;;) |
1094 | for (;;) |
1064 | { |
1095 | { |
1065 | decode_ws (dec); EXPECT_CH ('"'); |
1096 | EXPECT_CH ('"'); |
1066 | |
1097 | |
1067 | // heuristic: assume that |
1098 | // heuristic: assume that |
1068 | // a) decode_str + hv_store_ent are abysmally slow. |
1099 | // a) decode_str + hv_store_ent are abysmally slow. |
1069 | // b) most hash keys are short, simple ascii text. |
1100 | // b) most hash keys are short, simple ascii text. |
1070 | // => try to "fast-match" such strings to avoid |
1101 | // => try to "fast-match" such strings to avoid |
… | |
… | |
1084 | if (!key) |
1115 | if (!key) |
1085 | goto fail; |
1116 | goto fail; |
1086 | |
1117 | |
1087 | decode_ws (dec); EXPECT_CH (':'); |
1118 | decode_ws (dec); EXPECT_CH (':'); |
1088 | |
1119 | |
|
|
1120 | decode_ws (dec); |
1089 | value = decode_sv (dec); |
1121 | value = decode_sv (dec); |
1090 | if (!value) |
1122 | if (!value) |
1091 | { |
1123 | { |
1092 | SvREFCNT_dec (key); |
1124 | SvREFCNT_dec (key); |
1093 | goto fail; |
1125 | goto fail; |
… | |
… | |
1105 | int len = p - key; |
1137 | int len = p - key; |
1106 | dec->cur = p + 1; |
1138 | dec->cur = p + 1; |
1107 | |
1139 | |
1108 | decode_ws (dec); EXPECT_CH (':'); |
1140 | decode_ws (dec); EXPECT_CH (':'); |
1109 | |
1141 | |
|
|
1142 | decode_ws (dec); |
1110 | value = decode_sv (dec); |
1143 | value = decode_sv (dec); |
1111 | if (!value) |
1144 | if (!value) |
1112 | goto fail; |
1145 | goto fail; |
1113 | |
1146 | |
1114 | hv_store (hv, key, len, value, 0); |
1147 | hv_store (hv, key, len, value, 0); |
… | |
… | |
1130 | |
1163 | |
1131 | if (*dec->cur != ',') |
1164 | if (*dec->cur != ',') |
1132 | ERR (", or } expected while parsing object/hash"); |
1165 | ERR (", or } expected while parsing object/hash"); |
1133 | |
1166 | |
1134 | ++dec->cur; |
1167 | ++dec->cur; |
|
|
1168 | |
|
|
1169 | decode_ws (dec); |
|
|
1170 | |
|
|
1171 | if (*dec->cur == '}' && dec->json.flags & F_RELAXED) |
|
|
1172 | { |
|
|
1173 | ++dec->cur; |
|
|
1174 | break; |
|
|
1175 | } |
1135 | } |
1176 | } |
1136 | |
1177 | |
1137 | DEC_DEC_DEPTH; |
1178 | DEC_DEC_DEPTH; |
1138 | sv = newRV_noinc ((SV *)hv); |
1179 | sv = newRV_noinc ((SV *)hv); |
1139 | |
1180 | |
… | |
… | |
1204 | } |
1245 | } |
1205 | |
1246 | |
1206 | static SV * |
1247 | static SV * |
1207 | decode_sv (dec_t *dec) |
1248 | decode_sv (dec_t *dec) |
1208 | { |
1249 | { |
1209 | decode_ws (dec); |
|
|
1210 | |
|
|
1211 | // the beauty of JSON: you need exactly one character lookahead |
1250 | // the beauty of JSON: you need exactly one character lookahead |
1212 | // to parse anything. |
1251 | // to parse anything. |
1213 | switch (*dec->cur) |
1252 | switch (*dec->cur) |
1214 | { |
1253 | { |
1215 | case '"': ++dec->cur; return decode_str (dec); |
1254 | case '"': ++dec->cur; return decode_str (dec); |
… | |
… | |
1223 | |
1262 | |
1224 | case 't': |
1263 | case 't': |
1225 | if (dec->end - dec->cur >= 4 && !memcmp (dec->cur, "true", 4)) |
1264 | if (dec->end - dec->cur >= 4 && !memcmp (dec->cur, "true", 4)) |
1226 | { |
1265 | { |
1227 | dec->cur += 4; |
1266 | dec->cur += 4; |
|
|
1267 | #if JSON_SLOW |
|
|
1268 | json_true = get_sv ("JSON::XS::true", 1); SvREADONLY_on (json_true); |
|
|
1269 | #endif |
1228 | return SvREFCNT_inc (json_true); |
1270 | return SvREFCNT_inc (json_true); |
1229 | } |
1271 | } |
1230 | else |
1272 | else |
1231 | ERR ("'true' expected"); |
1273 | ERR ("'true' expected"); |
1232 | |
1274 | |
… | |
… | |
1234 | |
1276 | |
1235 | case 'f': |
1277 | case 'f': |
1236 | if (dec->end - dec->cur >= 5 && !memcmp (dec->cur, "false", 5)) |
1278 | if (dec->end - dec->cur >= 5 && !memcmp (dec->cur, "false", 5)) |
1237 | { |
1279 | { |
1238 | dec->cur += 5; |
1280 | dec->cur += 5; |
|
|
1281 | #if JSON_SLOW |
|
|
1282 | json_false = get_sv ("JSON::XS::false", 1); SvREADONLY_on (json_false); |
|
|
1283 | #endif |
1239 | return SvREFCNT_inc (json_false); |
1284 | return SvREFCNT_inc (json_false); |
1240 | } |
1285 | } |
1241 | else |
1286 | else |
1242 | ERR ("'false' expected"); |
1287 | ERR ("'false' expected"); |
1243 | |
1288 | |
… | |
… | |
1293 | |
1338 | |
1294 | if (dec.json.cb_object || dec.json.cb_sk_object) |
1339 | if (dec.json.cb_object || dec.json.cb_sk_object) |
1295 | dec.json.flags |= F_HOOK; |
1340 | dec.json.flags |= F_HOOK; |
1296 | |
1341 | |
1297 | *dec.end = 0; // this should basically be a nop, too, but make sure it's there |
1342 | *dec.end = 0; // this should basically be a nop, too, but make sure it's there |
|
|
1343 | |
|
|
1344 | decode_ws (&dec); |
1298 | sv = decode_sv (&dec); |
1345 | sv = decode_sv (&dec); |
1299 | |
1346 | |
1300 | if (!(offset_return || !sv)) |
1347 | if (!(offset_return || !sv)) |
1301 | { |
1348 | { |
1302 | // check for trailing garbage |
1349 | // check for trailing garbage |
… | |
… | |
1378 | json_boolean_stash = 0; |
1425 | json_boolean_stash = 0; |
1379 | |
1426 | |
1380 | void new (char *klass) |
1427 | void new (char *klass) |
1381 | PPCODE: |
1428 | PPCODE: |
1382 | { |
1429 | { |
1383 | HV *stash = !JSON_SLOW || json_stash |
|
|
1384 | ? json_stash |
|
|
1385 | : gv_stashpv ("JSON::XS", 1); |
|
|
1386 | SV *pv = NEWSV (0, sizeof (JSON)); |
1430 | SV *pv = NEWSV (0, sizeof (JSON)); |
1387 | SvPOK_only (pv); |
1431 | SvPOK_only (pv); |
1388 | Zero (SvPVX (pv), 1, JSON); |
1432 | Zero (SvPVX (pv), 1, JSON); |
1389 | ((JSON *)SvPVX (pv))->flags = F_DEFAULT; |
1433 | ((JSON *)SvPVX (pv))->flags = F_DEFAULT; |
1390 | XPUSHs (sv_2mortal (sv_bless (newRV_noinc (pv), stash))); |
1434 | XPUSHs (sv_2mortal (sv_bless (newRV_noinc (pv), JSON_STASH))); |
1391 | } |
1435 | } |
1392 | |
1436 | |
1393 | void ascii (JSON *self, int enable = 1) |
1437 | void ascii (JSON *self, int enable = 1) |
1394 | ALIAS: |
1438 | ALIAS: |
1395 | ascii = F_ASCII |
1439 | ascii = F_ASCII |
… | |
… | |
1402 | pretty = F_PRETTY |
1446 | pretty = F_PRETTY |
1403 | allow_nonref = F_ALLOW_NONREF |
1447 | allow_nonref = F_ALLOW_NONREF |
1404 | shrink = F_SHRINK |
1448 | shrink = F_SHRINK |
1405 | allow_blessed = F_ALLOW_BLESSED |
1449 | allow_blessed = F_ALLOW_BLESSED |
1406 | convert_blessed = F_CONV_BLESSED |
1450 | convert_blessed = F_CONV_BLESSED |
|
|
1451 | relaxed = F_RELAXED |
1407 | PPCODE: |
1452 | PPCODE: |
1408 | { |
1453 | { |
1409 | if (enable) |
1454 | if (enable) |
1410 | self->flags |= ix; |
1455 | self->flags |= ix; |
1411 | else |
1456 | else |