ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/CBOR-XS/XS.xs
Revision: 1.56
Committed: Fri Nov 25 11:33:03 2016 UTC (7 years, 5 months ago) by root
Branch: MAIN
Changes since 1.55: +5 -3 lines
Log Message:
*** empty log message ***

File Contents

# Content
1 #include "EXTERN.h"
2 #include "perl.h"
3 #include "XSUB.h"
4
5 #include <assert.h>
6 #include <string.h>
7 #include <stdlib.h>
8 #include <stdio.h>
9 #include <limits.h>
10 #include <float.h>
11
12 #define ECB_NO_THREADS 1
13 #include "ecb.h"
14
15 // compatibility with perl <5.18: each macro below is only defined when the perl headers do not already provide it
16 #ifndef HvNAMELEN_get
// fallback: compute the stash name length with strlen on HvNAME
17 # define HvNAMELEN_get(hv) strlen (HvNAME (hv))
18 #endif
19 #ifndef HvNAMELEN
// fallback: alias for HvNAMELEN_get
20 # define HvNAMELEN(hv) HvNAMELEN_get (hv)
21 #endif
22 #ifndef HvNAMEUTF8
// fallback: always report stash names as not being UTF-8
23 # define HvNAMEUTF8(hv) 0
24 #endif
25 #ifndef SvREFCNT_dec_NN
// fallback: use the ordinary SvREFCNT_dec in place of the _NN variant
26 # define SvREFCNT_dec_NN(sv) SvREFCNT_dec (sv)
27 #endif
28
29 // known major and minor types
// the initial byte of every CBOR item is (major | minor): the major type lives in
// the top three bits (hence MAJOR_SHIFT), the minor value in the low five bits (MINOR_MASK)
30 enum cbor_type
31 {
32 MAJOR_SHIFT = 5,
33 MINOR_MASK = 0x1f,
34
// major types, already shifted into position so they can be or'ed with a minor value
35 MAJOR_POS_INT = 0 << MAJOR_SHIFT,
36 MAJOR_NEG_INT = 1 << MAJOR_SHIFT,
37 MAJOR_BYTES = 2 << MAJOR_SHIFT,
38 MAJOR_TEXT = 3 << MAJOR_SHIFT,
39 MAJOR_ARRAY = 4 << MAJOR_SHIFT,
40 MAJOR_MAP = 5 << MAJOR_SHIFT,
41 MAJOR_TAG = 6 << MAJOR_SHIFT,
42 MAJOR_MISC = 7 << MAJOR_SHIFT,
43
44 // INT/STRING/ARRAY/MAP subtypes: minor values announcing that 1, 2, 4 or 8 argument bytes follow
45 LENGTH_EXT1 = 24,
46 LENGTH_EXT2 = 25,
47 LENGTH_EXT4 = 26,
48 LENGTH_EXT8 = 27,
49
50 // SIMPLE types (effectively MISC subtypes)
51 SIMPLE_FALSE = 20,
52 SIMPLE_TRUE = 21,
53 SIMPLE_NULL = 22,
54 SIMPLE_UNDEF = 23,
55
56 // MISC subtypes (MISC_EXT1 is not referenced by the code visible in this file)
57 MISC_EXT1 = 24,
58 MISC_FLOAT16 = 25,
59 MISC_FLOAT32 = 26,
60 MISC_FLOAT64 = 27,
61
62 // BYTES/TEXT/ARRAY/MAP: indefinite length; together with MAJOR_MISC it is the break code
63 MINOR_INDEF = 31,
64 };
65
66 // known tags (values that may follow a MAJOR_TAG initial byte)
67 enum cbor_tag
68 {
69 // extensions
70 CBOR_TAG_STRINGREF = 25, // http://cbor.schmorp.de/stringref
71 CBOR_TAG_PERL_OBJECT = 26, // http://cbor.schmorp.de/perl-object
72 CBOR_TAG_GENERIC_OBJECT = 27, // http://cbor.schmorp.de/generic-object
73 CBOR_TAG_VALUE_SHAREABLE = 28, // http://cbor.schmorp.de/value-sharing
74 CBOR_TAG_VALUE_SHAREDREF = 29, // http://cbor.schmorp.de/value-sharing
75 CBOR_TAG_STRINGREF_NAMESPACE = 256, // http://cbor.schmorp.de/stringref
76 CBOR_TAG_INDIRECTION = 22098, // http://cbor.schmorp.de/indirection
77
78 // rfc7049
79 CBOR_TAG_DATETIME = 0, // rfc4287, utf-8
80 CBOR_TAG_TIMESTAMP = 1, // unix timestamp, any
81 CBOR_TAG_POS_BIGNUM = 2, // byte string
82 CBOR_TAG_NEG_BIGNUM = 3, // byte string
83 CBOR_TAG_DECIMAL = 4, // decimal fraction, array
84 CBOR_TAG_BIGFLOAT = 5, // array
85
86 CBOR_TAG_CONV_B64U = 21, // base64url, any
87 CBOR_TAG_CONV_B64 = 22, // base64, any
88 CBOR_TAG_CONV_HEX = 23, // base16, any
89 CBOR_TAG_CBOR = 24, // embedded cbor, byte string
90
91 CBOR_TAG_URI = 32, // URI rfc3986, utf-8
92 CBOR_TAG_B64U = 33, // base64url rfc4648, utf-8
93 CBOR_TAG_B64 = 34, // base64 rfc4648, utf-8
94 CBOR_TAG_REGEX = 35, // regex pcre/ecma262, utf-8
95 CBOR_TAG_MIME = 36, // mime message rfc2045, utf-8
96
97 CBOR_TAG_MAGIC = 55799, // self-describe cbor
98 };
99
// option bits stored in CBOR.flags
// F_SHRINK: encode_cbor calls shrink () on the finished result
100 #define F_SHRINK 0x00000001UL
// F_ALLOW_UNKNOWN: encode_sv emits the "undefined" simple value instead of croaking on unsupported scalars
101 #define F_ALLOW_UNKNOWN 0x00000002UL
// F_ALLOW_SHARING: encode_rv emits shareable/sharedref tags for referents with a refcount above one
102 #define F_ALLOW_SHARING 0x00000004UL
// F_ALLOW_CYCLES: decode_tagged registers a shareable value before its content is decoded
103 #define F_ALLOW_CYCLES 0x00000008UL
// F_PACK_STRINGS: the encoder registers strings and emits stringref tags for repeats
104 #define F_PACK_STRINGS 0x00000010UL
// F_TEXT_KEYS: encode_hv requests upgrading of non-utf8 hash keys to CBOR text
105 #define F_TEXT_KEYS 0x00000020UL
// F_TEXT_STRINGS: same, for hash keys and for string scalars in encode_sv
106 #define F_TEXT_STRINGS 0x00000040UL
// F_VALIDATE_UTF8: the decoder checks text strings and text map keys with is_utf8_string
107 #define F_VALIDATE_UTF8 0x00000080UL
108
109 #define INIT_SIZE 32 // initial scalar size to be allocated
110
// statement-block helpers: SB ... SE wraps a macro body in do { } while (0)
111 #define SB do {
112 #define SE } while (0)
113
// true when beg <= val <= end, evaluated with a single unsigned comparison
114 #define IN_RANGE_INC(type,val,beg,end) \
115 ((unsigned type)((unsigned type)(val) - (unsigned type)(beg)) \
116 <= (unsigned type)((unsigned type)(end) - (unsigned type)(beg)))
117
// error message shared by the encoder and decoder depth checks
118 #define ERR_NESTING_EXCEEDED "cbor text or perl structure exceeds maximum nesting level (max_depth set too low?)"
119
// with ithreads the cached stash pointer may be null (CLONE resets cbor_stash),
// so CBOR_STASH falls back to looking the stash up by name
120 #ifdef USE_ITHREADS
121 # define CBOR_SLOW 1
122 # define CBOR_STASH (cbor_stash ? cbor_stash : gv_stashpv ("CBOR::XS", 1))
123 #else
124 # define CBOR_SLOW 0
125 # define CBOR_STASH cbor_stash
126 #endif
127
// cached stashes and singleton scalars; they are filled in by the BOOT section
128 static HV *cbor_stash, *types_boolean_stash, *types_error_stash, *cbor_tagged_stash; // CBOR::XS::
129 static SV *types_true, *types_false, *types_error, *sv_cbor, *default_filter;
130
// per-object coder configuration plus the state of the incremental parser
131 typedef struct {
132 U32 flags; // combination of the F_* bits
133 U32 max_depth; // nesting limit checked by both encoder and decoder (cbor_init sets 512)
134 STRLEN max_size; // decode_cbor refuses longer inputs; 0 disables the check
135 SV *filter; // callback invoked by decode_tagged for unknown tags; default_filter is used when null
136
137 // for the incremental parser
138 STRLEN incr_pos; // the current offset into the text
139 STRLEN incr_need; // minimum bytes needed to decode
140 AV *incr_count; // for every nesting level, the number of outstanding values, or -1 for indef.
141 } CBOR;
142
143 ecb_inline void
144 cbor_init (CBOR *cbor)
145 {
146 Zero (cbor, 1, CBOR);
147 cbor->max_depth = 512;
148 }
149
150 ecb_inline void
151 cbor_free (CBOR *cbor)
152 {
153 SvREFCNT_dec (cbor->filter);
154 SvREFCNT_dec (cbor->incr_count);
155 }
156
157 /////////////////////////////////////////////////////////////////////////////
158 // utility functions
159
160 ecb_inline SV *
161 get_bool (const char *name)
162 {
163 SV *sv = get_sv (name, 1);
164
165 SvREADONLY_on (sv);
166 SvREADONLY_on (SvRV (sv));
167
168 return sv;
169 }
170
171 ecb_inline void
172 shrink (SV *sv)
173 {
174 sv_utf8_downgrade (sv, 1);
175
176 if (SvLEN (sv) > SvCUR (sv) + 1)
177 {
178 #ifdef SvPV_shrink_to_cur
179 SvPV_shrink_to_cur (sv);
180 #elif defined (SvPV_renew)
181 SvPV_renew (sv, SvCUR (sv) + 1);
182 #endif
183 }
184 }
185
186 // minimum length of a string to be registered for stringref
187 ecb_inline int
188 minimum_string_length (UV idx)
189 {
190 return idx > 23
191 ? idx > 0xffU
192 ? idx > 0xffffU
193 ? idx > 0xffffffffU
194 ? 11
195 : 7
196 : 5
197 : 4
198 : 3;
199 }
200
201 /////////////////////////////////////////////////////////////////////////////
202 // encoder
203
204 // structure used for encoding CBOR
// one instance lives on the stack of encode_cbor for the duration of a single encode
205 typedef struct
206 {
207 char *cur; // SvPVX (sv) + current output position
208 char *end; // SvEND (sv) initially; need () later sets it to the last byte of the allocated buffer
209 SV *sv; // result scalar
210 CBOR cbor; // private copy of the coder configuration
211 U32 depth; // recursion level
212 HV *stringref[2]; // string => index, or 0 ([0] = bytes, [1] = utf-8)
213 UV stringref_idx; // index the next registered string will receive
214 HV *shareable; // ptr => index, or 0
215 UV shareable_idx; // index the next shareable value will receive
216 } enc_t;
217
218 ecb_inline void
219 need (enc_t *enc, STRLEN len)
220 {
221 if (ecb_expect_false (enc->cur + len >= enc->end))
222 {
223 STRLEN cur = enc->cur - (char *)SvPVX (enc->sv);
224 SvGROW (enc->sv, cur + (len < (cur >> 2) ? cur >> 2 : len) + 1);
225 enc->cur = SvPVX (enc->sv) + cur;
226 enc->end = SvPVX (enc->sv) + SvLEN (enc->sv) - 1;
227 }
228 }
229
230 ecb_inline void
231 encode_ch (enc_t *enc, char ch)
232 {
233 need (enc, 1);
234 *enc->cur++ = ch;
235 }
236
237 static void
238 encode_uint (enc_t *enc, int major, UV len)
239 {
240 need (enc, 9);
241
242 if (ecb_expect_true (len < LENGTH_EXT1))
243 *enc->cur++ = major | len;
244 else if (ecb_expect_true (len <= 0xffU))
245 {
246 *enc->cur++ = major | LENGTH_EXT1;
247 *enc->cur++ = len;
248 }
249 else if (len <= 0xffffU)
250 {
251 *enc->cur++ = major | LENGTH_EXT2;
252 *enc->cur++ = len >> 8;
253 *enc->cur++ = len;
254 }
255 else if (len <= 0xffffffffU)
256 {
257 *enc->cur++ = major | LENGTH_EXT4;
258 *enc->cur++ = len >> 24;
259 *enc->cur++ = len >> 16;
260 *enc->cur++ = len >> 8;
261 *enc->cur++ = len;
262 }
263 else
264 {
265 *enc->cur++ = major | LENGTH_EXT8;
266 *enc->cur++ = len >> 56;
267 *enc->cur++ = len >> 48;
268 *enc->cur++ = len >> 40;
269 *enc->cur++ = len >> 32;
270 *enc->cur++ = len >> 24;
271 *enc->cur++ = len >> 16;
272 *enc->cur++ = len >> 8;
273 *enc->cur++ = len;
274 }
275 }
276
277 ecb_inline void
278 encode_tag (enc_t *enc, UV tag)
279 {
280 encode_uint (enc, MAJOR_TAG, tag);
281 }
282
283 // exceptional (hopefully) slow path for byte strings that need to be utf8-encoded
284 ecb_noinline static void
285 encode_str_utf8 (enc_t *enc, int utf8, char *str, STRLEN len)
286 {
287 STRLEN ulen = len;
288 U8 *p, *pend = (U8 *)str + len;
289
290 for (p = (U8 *)str; p < pend; ++p)
291 ulen += *p >> 7; // count set high bits
292
293 encode_uint (enc, MAJOR_TEXT, ulen);
294
295 need (enc, ulen);
296 for (p = (U8 *)str; p < pend; ++p)
297 if (*p < 0x80)
298 *enc->cur++ = *p;
299 else
300 {
301 *enc->cur++ = 0xc0 + (*p >> 6);
302 *enc->cur++ = 0x80 + (*p & 63);
303 }
304 }
305
306 ecb_inline void
307 encode_str (enc_t *enc, int upgrade_utf8, int utf8, char *str, STRLEN len)
308 {
309 if (ecb_expect_false (upgrade_utf8))
310 if (!utf8)
311 {
312 encode_str_utf8 (enc, utf8, str, len);
313 return;
314 }
315
316 encode_uint (enc, utf8 ? MAJOR_TEXT : MAJOR_BYTES, len);
317 need (enc, len);
318 memcpy (enc->cur, str, len);
319 enc->cur += len;
320 }
321
322 ecb_inline void
323 encode_strref (enc_t *enc, int upgrade_utf8, int utf8, char *str, STRLEN len)
324 {
325 if (ecb_expect_false (enc->cbor.flags & F_PACK_STRINGS))
326 {
327 SV **svp = hv_fetch (enc->stringref[!!utf8], str, len, 1);
328
329 if (SvOK (*svp))
330 {
331 // already registered, use stringref
332 encode_tag (enc, CBOR_TAG_STRINGREF);
333 encode_uint (enc, MAJOR_POS_INT, SvUV (*svp));
334 return;
335 }
336 else if (len >= minimum_string_length (enc->stringref_idx))
337 {
338 // register only
339 sv_setuv (*svp, enc->stringref_idx);
340 ++enc->stringref_idx;
341 }
342 }
343
344 encode_str (enc, upgrade_utf8, utf8, str, len);
345 }
346
347 static void encode_sv (enc_t *enc, SV *sv);
348
349 static void
350 encode_av (enc_t *enc, AV *av)
351 {
352 int i, len = av_len (av);
353
354 if (enc->depth >= enc->cbor.max_depth)
355 croak (ERR_NESTING_EXCEEDED);
356
357 ++enc->depth;
358
359 encode_uint (enc, MAJOR_ARRAY, len + 1);
360
361 if (SvMAGICAL (av))
362 for (i = 0; i <= len; ++i)
363 {
364 SV **svp = av_fetch (av, i, 0);
365 encode_sv (enc, svp ? *svp : &PL_sv_undef);
366 }
367 else
368 for (i = 0; i <= len; ++i)
369 {
370 SV *sv = AvARRAY (av)[i];
371 encode_sv (enc, sv ? sv : &PL_sv_undef);
372 }
373
374 --enc->depth;
375 }
376
377 static void
378 encode_hv (enc_t *enc, HV *hv)
379 {
380 HE *he;
381
382 if (enc->depth >= enc->cbor.max_depth)
383 croak (ERR_NESTING_EXCEEDED);
384
385 ++enc->depth;
386
387 int pairs = hv_iterinit (hv);
388 int mg = SvMAGICAL (hv);
389
390 if (mg)
391 encode_ch (enc, MAJOR_MAP | MINOR_INDEF);
392 else
393 encode_uint (enc, MAJOR_MAP, pairs);
394
395 while ((he = hv_iternext (hv)))
396 {
397 if (HeKLEN (he) == HEf_SVKEY)
398 encode_sv (enc, HeSVKEY (he));
399 else
400 encode_strref (enc, enc->cbor.flags & (F_TEXT_KEYS | F_TEXT_STRINGS), HeKUTF8 (he), HeKEY (he), HeKLEN (he));
401
402 encode_sv (enc, ecb_expect_false (mg) ? hv_iterval (hv, he) : HeVAL (he));
403 }
404
405 if (mg)
406 encode_ch (enc, MAJOR_MISC | MINOR_INDEF);
407
408 --enc->depth;
409 }
410
411 // encode objects, arrays and special \0=false and \1=true values.
// sv is the referent (the caller passes SvRV of the reference), not the reference itself.
// order of checks: built-in object classes, value sharing, other objects, hashes, arrays,
// and finally any other referent, which is emitted behind an indirection tag.
412 static void
413 encode_rv (enc_t *enc, SV *sv)
414 {
415 SvGETMAGIC (sv);
416
417 svtype svt = SvTYPE (sv);
418
419 if (ecb_expect_false (SvOBJECT (sv)))
420 {
// use the cached stashes when available, otherwise (CBOR_SLOW builds) look them up by name
421 HV *boolean_stash = !CBOR_SLOW || types_boolean_stash
422 ? types_boolean_stash
423 : gv_stashpv ("Types::Serialiser::Boolean", 1);
424 HV *error_stash = !CBOR_SLOW || types_error_stash
425 ? types_error_stash
426 : gv_stashpv ("Types::Serialiser::Error", 1);
427 HV *tagged_stash = !CBOR_SLOW || cbor_tagged_stash
428 ? cbor_tagged_stash
429 : gv_stashpv ("CBOR::XS::Tagged" , 1);
430
431 HV *stash = SvSTASH (sv);
432
433 if (stash == boolean_stash)
434 {
// booleans become the CBOR true/false simple values, chosen by the object's integer value
435 encode_ch (enc, SvIV (sv) ? MAJOR_MISC | SIMPLE_TRUE : MAJOR_MISC | SIMPLE_FALSE);
436 return;
437 }
438 else if (stash == error_stash)
439 {
// error objects become the CBOR "undefined" simple value
440 encode_ch (enc, MAJOR_MISC | SIMPLE_UNDEF);
441 return;
442 }
443 else if (stash == tagged_stash)
444 {
445 if (svt != SVt_PVAV)
446 croak ("encountered CBOR::XS::Tagged object that isn't an array");
447
// element 0 is the tag number, element 1 the tagged value
448 encode_uint (enc, MAJOR_TAG, SvUV (*av_fetch ((AV *)sv, 0, 1)));
449 encode_sv (enc, *av_fetch ((AV *)sv, 1, 1));
450
451 return;
452 }
453 }
454
// value sharing: only referents with more than one reference are tracked
455 if (ecb_expect_false (SvREFCNT (sv) > 1)
456 && ecb_expect_false (enc->cbor.flags & F_ALLOW_SHARING))
457 {
458 if (!enc->shareable)
459 enc->shareable = (HV *)sv_2mortal ((SV *)newHV ());
460
// the hash key is the raw pointer value of the referent
461 SV **svp = hv_fetch (enc->shareable, (char *)&sv, sizeof (sv), 1);
462
463 if (SvOK (*svp))
464 {
// already emitted once: write only a reference to its index
465 encode_tag (enc, CBOR_TAG_VALUE_SHAREDREF);
466 encode_uint (enc, MAJOR_POS_INT, SvUV (*svp));
467 return;
468 }
469 else
470 {
// first occurrence: assign the next index and mark the value as shareable,
// the value itself is encoded by the code below
471 sv_setuv (*svp, enc->shareable_idx);
472 ++enc->shareable_idx;
473 encode_tag (enc, CBOR_TAG_VALUE_SHAREABLE);
474 }
475 }
476
477 if (ecb_expect_false (SvOBJECT (sv)))
478 {
479 HV *stash = SvSTASH (sv);
480 GV *method;
481
// TO_CBOR takes precedence over FREEZE
482 if ((method = gv_fetchmethod_autoload (stash, "TO_CBOR", 0)))
483 {
484 dSP;
485
486 ENTER; SAVETMPS;
487 PUSHMARK (SP);
488 // we re-bless the reference to get overload and other niceties right
489 XPUSHs (sv_bless (sv_2mortal (newRV_inc (sv)), stash));
490
491 PUTBACK;
492 // G_SCALAR ensures that return value is 1
493 call_sv ((SV *)GvCV (method), G_SCALAR);
494 SPAGAIN;
495
496 // catch this surprisingly common error
497 if (SvROK (TOPs) && SvRV (TOPs) == sv)
498 croak ("%s::TO_CBOR method returned same object as was passed instead of a new one", HvNAME (stash));
499
// the method's return value is encoded in place of the object
500 encode_sv (enc, POPs);
501
502 PUTBACK;
503
504 FREETMPS; LEAVE;
505 }
506 else if ((method = gv_fetchmethod_autoload (stash, "FREEZE", 0)) != 0)
507 {
508 dSP;
509
510 ENTER; SAVETMPS;
511 SAVESTACK_POS ();
512 PUSHMARK (SP);
513 EXTEND (SP, 2);
514 // we re-bless the reference to get overload and other niceties right
515 PUSHs (sv_bless (sv_2mortal (newRV_inc (sv)), stash));
516 PUSHs (sv_cbor);
517
518 PUTBACK;
519 int count = call_sv ((SV *)GvCV (method), G_ARRAY);
520 SPAGAIN;
521
522 // catch this surprisingly common error
523 if (count == 1 && SvROK (TOPs) && SvRV (TOPs) == sv)
524 croak ("%s::FREEZE(CBOR) method returned same object as was passed instead of a new one", HvNAME (stash));
525
// output: perl-object tag, then an array holding the class name followed by all returned values
526 encode_tag (enc, CBOR_TAG_PERL_OBJECT);
527 encode_uint (enc, MAJOR_ARRAY, count + 1);
528 encode_strref (enc, 0, HvNAMEUTF8 (stash), HvNAME (stash), HvNAMELEN (stash));
529
// SP[1 - count] walks the returned values from the first to the last
530 while (count)
531 encode_sv (enc, SP[1 - count--]);
532
533 PUTBACK;
534
535 FREETMPS; LEAVE;
536 }
537 else
538 croak ("encountered object '%s', but no TO_CBOR or FREEZE methods available on it",
539 SvPV_nolen (sv_2mortal (newRV_inc (sv))));
540 }
541 else if (svt == SVt_PVHV)
542 encode_hv (enc, (HV *)sv);
543 else if (svt == SVt_PVAV)
544 encode_av (enc, (AV *)sv);
545 else
546 {
// any other referent: emit the indirection tag followed by the referent itself
547 encode_tag (enc, CBOR_TAG_INDIRECTION);
548 encode_sv (enc, sv);
549 }
550 }
551
552 static void
553 encode_nv (enc_t *enc, SV *sv)
554 {
555 double nv = SvNVX (sv);
556
557 need (enc, 9);
558
559 if (ecb_expect_false (nv == (NV)(U32)nv))
560 encode_uint (enc, MAJOR_POS_INT, (U32)nv);
561 //TODO: maybe I32?
562 else if (ecb_expect_false (nv == (float)nv))
563 {
564 uint32_t fp = ecb_float_to_binary32 (nv);
565
566 *enc->cur++ = MAJOR_MISC | MISC_FLOAT32;
567
568 if (!ecb_big_endian ())
569 fp = ecb_bswap32 (fp);
570
571 memcpy (enc->cur, &fp, 4);
572 enc->cur += 4;
573 }
574 else
575 {
576 uint64_t fp = ecb_double_to_binary64 (nv);
577
578 *enc->cur++ = MAJOR_MISC | MISC_FLOAT64;
579
580 if (!ecb_big_endian ())
581 fp = ecb_bswap64 (fp);
582
583 memcpy (enc->cur, &fp, 8);
584 enc->cur += 8;
585 }
586 }
587
588 static void
589 encode_sv (enc_t *enc, SV *sv)
590 {
591 SvGETMAGIC (sv);
592
593 if (SvPOKp (sv))
594 {
595 STRLEN len;
596 char *str = SvPV (sv, len);
597 encode_strref (enc, enc->cbor.flags & F_TEXT_STRINGS, SvUTF8 (sv), str, len);
598 }
599 else if (SvNOKp (sv))
600 encode_nv (enc, sv);
601 else if (SvIOKp (sv))
602 {
603 if (SvIsUV (sv))
604 encode_uint (enc, MAJOR_POS_INT, SvUVX (sv));
605 else if (SvIVX (sv) >= 0)
606 encode_uint (enc, MAJOR_POS_INT, SvIVX (sv));
607 else
608 encode_uint (enc, MAJOR_NEG_INT, -(SvIVX (sv) + 1));
609 }
610 else if (SvROK (sv))
611 encode_rv (enc, SvRV (sv));
612 else if (!SvOK (sv))
613 encode_ch (enc, MAJOR_MISC | SIMPLE_NULL);
614 else if (enc->cbor.flags & F_ALLOW_UNKNOWN)
615 encode_ch (enc, MAJOR_MISC | SIMPLE_UNDEF);
616 else
617 croak ("encountered perl type (%s,0x%x) that CBOR cannot handle, check your input data",
618 SvPV_nolen (sv), (unsigned int)SvFLAGS (sv));
619 }
620
621 static SV *
622 encode_cbor (SV *scalar, CBOR *cbor)
623 {
624 enc_t enc = { 0 };
625
626 enc.cbor = *cbor;
627 enc.sv = sv_2mortal (NEWSV (0, INIT_SIZE));
628 enc.cur = SvPVX (enc.sv);
629 enc.end = SvEND (enc.sv);
630
631 SvPOK_only (enc.sv);
632
633 if (cbor->flags & F_PACK_STRINGS)
634 {
635 encode_tag (&enc, CBOR_TAG_STRINGREF_NAMESPACE);
636 enc.stringref[0]= (HV *)sv_2mortal ((SV *)newHV ());
637 enc.stringref[1]= (HV *)sv_2mortal ((SV *)newHV ());
638 }
639
640 encode_sv (&enc, scalar);
641
642 SvCUR_set (enc.sv, enc.cur - SvPVX (enc.sv));
643 *SvEND (enc.sv) = 0; // many xs functions expect a trailing 0 for text strings
644
645 if (enc.cbor.flags & F_SHRINK)
646 shrink (enc.sv);
647
648 return enc.sv;
649 }
650
651 /////////////////////////////////////////////////////////////////////////////
652 // decoder
653
654 // structure used for decoding CBOR
// one instance lives on the stack of decode_cbor for the duration of a single decode
655 typedef struct
656 {
657 U8 *cur; // current parser pointer
658 U8 *end; // end of input string
659 const char *err; // parse error, if != 0
660 CBOR cbor; // private copy of the coder configuration
661 U32 depth; // recursion depth
662 U32 maxdepth; // recursion depth limit (NOTE(review): the visible code checks cbor.max_depth instead)
663 AV *shareable; // values registered by the shareable tag, indexed by sharedref
664 AV *stringref; // strings registered inside the current stringref namespace, or 0 outside of one
665 SV *decode_tagged; // NOTE(review): not referenced by the code visible in this file
666 } dec_t;
667
// record the first error only (later ones are ignored) and bail out;
// requires a local variable "dec" and a "fail" label in the calling function
#define ERR(reason) SB if (!dec->err) dec->err = reason; goto fail; SE

// fail unless at least len more octets of input are available.
// the remaining size is compared instead of computing dec->cur + len, because
// len comes from untrusted input and the pointer addition could overflow
// and wrongly pass the check
#define WANT(len) if (ecb_expect_false (dec->cur > dec->end || (UV)(dec->end - dec->cur) < (UV)(len))) ERR ("unexpected end of CBOR data")

// nesting level bookkeeping, checked against the configured max_depth
#define DEC_INC_DEPTH if (ecb_expect_false (++dec->depth > dec->cbor.max_depth)) ERR (ERR_NESTING_EXCEEDED)
#define DEC_DEC_DEPTH --dec->depth
674
675 static UV
676 decode_uint (dec_t *dec)
677 {
678 U8 m = *dec->cur & MINOR_MASK;
679 ++dec->cur;
680
681 if (ecb_expect_true (m < LENGTH_EXT1))
682 return m;
683 else if (ecb_expect_true (m == LENGTH_EXT1))
684 {
685 WANT (1);
686 dec->cur += 1;
687 return dec->cur[-1];
688 }
689 else if (ecb_expect_true (m == LENGTH_EXT2))
690 {
691 WANT (2);
692 dec->cur += 2;
693 return (((UV)dec->cur[-2]) << 8)
694 | ((UV)dec->cur[-1]);
695 }
696 else if (ecb_expect_true (m == LENGTH_EXT4))
697 {
698 WANT (4);
699 dec->cur += 4;
700 return (((UV)dec->cur[-4]) << 24)
701 | (((UV)dec->cur[-3]) << 16)
702 | (((UV)dec->cur[-2]) << 8)
703 | ((UV)dec->cur[-1]);
704 }
705 else if (ecb_expect_true (m == LENGTH_EXT8))
706 {
707 WANT (8);
708 dec->cur += 8;
709
710 return
711 #if UVSIZE < 8
712 0
713 #else
714 (((UV)dec->cur[-8]) << 56)
715 | (((UV)dec->cur[-7]) << 48)
716 | (((UV)dec->cur[-6]) << 40)
717 | (((UV)dec->cur[-5]) << 32)
718 #endif
719 | (((UV)dec->cur[-4]) << 24)
720 | (((UV)dec->cur[-3]) << 16)
721 | (((UV)dec->cur[-2]) << 8)
722 | ((UV)dec->cur[-1]);
723 }
724 else
725 ERR ("corrupted CBOR data (unsupported integer minor encoding)");
726
727 fail:
728 return 0;
729 }
730
731 static SV *decode_sv (dec_t *dec);
732
733 static SV *
734 decode_av (dec_t *dec)
735 {
736 AV *av = newAV ();
737
738 DEC_INC_DEPTH;
739
740 if (*dec->cur == (MAJOR_ARRAY | MINOR_INDEF))
741 {
742 ++dec->cur;
743
744 for (;;)
745 {
746 WANT (1);
747
748 if (*dec->cur == (MAJOR_MISC | MINOR_INDEF))
749 {
750 ++dec->cur;
751 break;
752 }
753
754 av_push (av, decode_sv (dec));
755 }
756 }
757 else
758 {
759 int i, len = decode_uint (dec);
760
761 WANT (len); // complexity check for av_fill - need at least one byte per value, do not allow supersize arrays
762 av_fill (av, len - 1);
763
764 for (i = 0; i < len; ++i)
765 AvARRAY (av)[i] = decode_sv (dec);
766 }
767
768 DEC_DEC_DEPTH;
769 return newRV_noinc ((SV *)av);
770
771 fail:
772 SvREFCNT_dec (av);
773 DEC_DEC_DEPTH;
774 return &PL_sv_undef;
775 }
776
// decode one key/value pair at dec->cur and store it into hv.
// errors are reported through dec->err only, the function returns nothing.
777 static void
778 decode_he (dec_t *dec, HV *hv)
779 {
780 // for speed reasons, we specialcase single-string
781 // byte or utf-8 strings as keys, but only when !stringref
782
// note: both "else" branches below belong to the inner if, not to the stringref test
783 if (ecb_expect_true (!dec->stringref))
// definite-length byte string key (minor 0..LENGTH_EXT8): use the input bytes directly as hash key
784 if (ecb_expect_true ((U8)(*dec->cur - MAJOR_BYTES) <= LENGTH_EXT8))
785 {
786 STRLEN len = decode_uint (dec);
787 char *key = (char *)dec->cur;
788
789 WANT (len);
790 dec->cur += len;
791
792 hv_store (hv, key, len, decode_sv (dec), 0);
793
794 return;
795 }
// definite-length text string key
796 else if (ecb_expect_true ((U8)(*dec->cur - MAJOR_TEXT) <= LENGTH_EXT8))
797 {
798 STRLEN len = decode_uint (dec);
799 char *key = (char *)dec->cur;
800
801 WANT (len);
802 dec->cur += len;
803
804 if (ecb_expect_false (dec->cbor.flags & F_VALIDATE_UTF8))
805 if (!is_utf8_string (key, len))
806 ERR ("corrupted CBOR data (invalid UTF-8 in map key)");
807
// a negative key length tells hv_store that the key is utf-8 encoded
808 hv_store (hv, key, -len, decode_sv (dec), 0);
809
810 return;
811 }
812
// general case: decode the key as an arbitrary value and store by scalar
813 SV *k = decode_sv (dec);
814 SV *v = decode_sv (dec);
815
816 hv_store_ent (hv, k, v, 0);
// the key scalar was only needed for the store call
817 SvREFCNT_dec (k);
818
819 fail:
820 ;
821 }
822
823 static SV *
824 decode_hv (dec_t *dec)
825 {
826 HV *hv = newHV ();
827
828 DEC_INC_DEPTH;
829
830 if (*dec->cur == (MAJOR_MAP | MINOR_INDEF))
831 {
832 ++dec->cur;
833
834 for (;;)
835 {
836 WANT (1);
837
838 if (*dec->cur == (MAJOR_MISC | MINOR_INDEF))
839 {
840 ++dec->cur;
841 break;
842 }
843
844 decode_he (dec, hv);
845 }
846 }
847 else
848 {
849 int pairs = decode_uint (dec);
850
851 while (pairs--)
852 decode_he (dec, hv);
853 }
854
855 DEC_DEC_DEPTH;
856 return newRV_noinc ((SV *)hv);
857
858 fail:
859 SvREFCNT_dec (hv);
860 DEC_DEC_DEPTH;
861 return &PL_sv_undef;
862 }
863
864 static SV *
865 decode_str (dec_t *dec, int utf8)
866 {
867 SV *sv = 0;
868
869 if ((*dec->cur & MINOR_MASK) == MINOR_INDEF)
870 {
871 // indefinite length strings
872 ++dec->cur;
873
874 U8 major = *dec->cur & MAJOR_MISC;
875
876 sv = newSVpvn ("", 0);
877
878 for (;;)
879 {
880 WANT (1);
881
882 if ((*dec->cur - major) > LENGTH_EXT8)
883 if (*dec->cur == (MAJOR_MISC | MINOR_INDEF))
884 {
885 ++dec->cur;
886 break;
887 }
888 else
889 ERR ("corrupted CBOR data (invalid chunks in indefinite length string)");
890
891 STRLEN len = decode_uint (dec);
892
893 WANT (len);
894 sv_catpvn (sv, dec->cur, len);
895 dec->cur += len;
896 }
897 }
898 else
899 {
900 STRLEN len = decode_uint (dec);
901
902 WANT (len);
903 sv = newSVpvn (dec->cur, len);
904 dec->cur += len;
905
906 if (ecb_expect_false (dec->stringref)
907 && SvCUR (sv) >= minimum_string_length (AvFILLp (dec->stringref) + 1))
908 av_push (dec->stringref, SvREFCNT_inc_NN (sv));
909 }
910
911 if (utf8)
912 {
913 if (ecb_expect_false (dec->cbor.flags & F_VALIDATE_UTF8))
914 if (!is_utf8_string (SvPVX (sv), SvCUR (sv)))
915 ERR ("corrupted CBOR data (invalid UTF-8 in text string)");
916
917 SvUTF8_on (sv);
918 }
919
920 return sv;
921
922 fail:
923 SvREFCNT_dec (sv);
924 return &PL_sv_undef;
925 }
926
927 static SV *
928 decode_tagged (dec_t *dec)
929 {
930 SV *sv = 0;
931 UV tag = decode_uint (dec);
932
933 WANT (1);
934
935 switch (tag)
936 {
937 case CBOR_TAG_MAGIC:
938 sv = decode_sv (dec);
939 break;
940
941 case CBOR_TAG_INDIRECTION:
942 sv = newRV_noinc (decode_sv (dec));
943 break;
944
945 case CBOR_TAG_STRINGREF_NAMESPACE:
946 {
947 // do nmot use SAVETMPS/FREETMPS, as these will
948 // erase mortalised caches, e.g. "shareable"
949 ENTER;
950
951 SAVESPTR (dec->stringref);
952 dec->stringref = (AV *)sv_2mortal ((SV *)newAV ());
953
954 sv = decode_sv (dec);
955
956 LEAVE;
957 }
958 break;
959
960 case CBOR_TAG_STRINGREF:
961 {
962 if ((*dec->cur >> MAJOR_SHIFT) != (MAJOR_POS_INT >> MAJOR_SHIFT))
963 ERR ("corrupted CBOR data (stringref index not an unsigned integer)");
964
965 UV idx = decode_uint (dec);
966
967 if (!dec->stringref || (int)idx > AvFILLp (dec->stringref))
968 ERR ("corrupted CBOR data (stringref index out of bounds or outside namespace)");
969
970 sv = newSVsv (AvARRAY (dec->stringref)[idx]);
971 }
972 break;
973
974 case CBOR_TAG_VALUE_SHAREABLE:
975 {
976 if (ecb_expect_false (!dec->shareable))
977 dec->shareable = (AV *)sv_2mortal ((SV *)newAV ());
978
979 if (dec->cbor.flags & F_ALLOW_CYCLES)
980 {
981 sv = newSV (0);
982 av_push (dec->shareable, SvREFCNT_inc_NN (sv));
983
984 SV *osv = decode_sv (dec);
985 sv_setsv (sv, osv);
986 SvREFCNT_dec_NN (osv);
987 }
988 else
989 {
990 av_push (dec->shareable, &PL_sv_undef);
991 int idx = AvFILLp (dec->shareable);
992 sv = decode_sv (dec);
993 av_store (dec->shareable, idx, SvREFCNT_inc_NN (sv));
994 }
995 }
996 break;
997
998 case CBOR_TAG_VALUE_SHAREDREF:
999 {
1000 if ((*dec->cur >> MAJOR_SHIFT) != (MAJOR_POS_INT >> MAJOR_SHIFT))
1001 ERR ("corrupted CBOR data (sharedref index not an unsigned integer)");
1002
1003 UV idx = decode_uint (dec);
1004
1005 if (!dec->shareable || (int)idx > AvFILLp (dec->shareable))
1006 ERR ("corrupted CBOR data (sharedref index out of bounds)");
1007
1008 sv = SvREFCNT_inc_NN (AvARRAY (dec->shareable)[idx]);
1009
1010 if (sv == &PL_sv_undef)
1011 ERR ("cyclic CBOR data structure found, but allow_cycles is not enabled");
1012 }
1013 break;
1014
1015 case CBOR_TAG_PERL_OBJECT:
1016 {
1017 sv = decode_sv (dec);
1018
1019 if (!SvROK (sv) || SvTYPE (SvRV (sv)) != SVt_PVAV)
1020 ERR ("corrupted CBOR data (non-array perl object)");
1021
1022 AV *av = (AV *)SvRV (sv);
1023 int len = av_len (av) + 1;
1024 HV *stash = gv_stashsv (*av_fetch (av, 0, 1), 0);
1025
1026 if (!stash)
1027 ERR ("cannot decode perl-object (package does not exist)");
1028
1029 GV *method = gv_fetchmethod_autoload (stash, "THAW", 0);
1030
1031 if (!method)
1032 ERR ("cannot decode perl-object (package does not have a THAW method)");
1033
1034 dSP;
1035
1036 ENTER; SAVETMPS;
1037 PUSHMARK (SP);
1038 EXTEND (SP, len + 1);
1039 // we re-bless the reference to get overload and other niceties right
1040 PUSHs (*av_fetch (av, 0, 1));
1041 PUSHs (sv_cbor);
1042
1043 int i;
1044
1045 for (i = 1; i < len; ++i)
1046 PUSHs (*av_fetch (av, i, 1));
1047
1048 PUTBACK;
1049 call_sv ((SV *)GvCV (method), G_SCALAR | G_EVAL);
1050 SPAGAIN;
1051
1052 if (SvTRUE (ERRSV))
1053 {
1054 FREETMPS; LEAVE;
1055 ERR (SvPVutf8_nolen (sv_2mortal (SvREFCNT_inc (ERRSV))));
1056 }
1057
1058 SvREFCNT_dec (sv);
1059 sv = SvREFCNT_inc (POPs);
1060
1061 PUTBACK;
1062
1063 FREETMPS; LEAVE;
1064 }
1065 break;
1066
1067 default:
1068 {
1069 sv = decode_sv (dec);
1070
1071 dSP;
1072 ENTER; SAVETMPS;
1073 SAVESTACK_POS ();
1074 PUSHMARK (SP);
1075 EXTEND (SP, 2);
1076 PUSHs (newSVuv (tag));
1077 PUSHs (sv);
1078
1079 PUTBACK;
1080 int count = call_sv (dec->cbor.filter ? dec->cbor.filter : default_filter, G_ARRAY | G_EVAL);
1081 SPAGAIN;
1082
1083 if (SvTRUE (ERRSV))
1084 {
1085 FREETMPS; LEAVE;
1086 ERR (SvPVutf8_nolen (sv_2mortal (SvREFCNT_inc (ERRSV))));
1087 }
1088
1089 if (count)
1090 {
1091 SvREFCNT_dec (sv);
1092 sv = SvREFCNT_inc (POPs);
1093 }
1094 else
1095 {
1096 AV *av = newAV ();
1097 av_push (av, newSVuv (tag));
1098 av_push (av, sv);
1099
1100 HV *tagged_stash = !CBOR_SLOW || cbor_tagged_stash
1101 ? cbor_tagged_stash
1102 : gv_stashpv ("CBOR::XS::Tagged" , 1);
1103 sv = sv_bless (newRV_noinc ((SV *)av), tagged_stash);
1104 }
1105
1106 PUTBACK;
1107
1108 FREETMPS; LEAVE;
1109 }
1110 break;
1111 }
1112
1113 return sv;
1114
1115 fail:
1116 SvREFCNT_dec (sv);
1117 return &PL_sv_undef;
1118 }
1119
// decode the next CBOR item at dec->cur into a new scalar, dispatching on the
// major type stored in the top three bits of the initial byte.
// on error, dec->err is set and &PL_sv_undef is returned.
1120 static SV *
1121 decode_sv (dec_t *dec)
1122 {
1123 WANT (1);
1124
1125 switch (*dec->cur >> MAJOR_SHIFT)
1126 {
1127 case MAJOR_POS_INT >> MAJOR_SHIFT: return newSVuv (decode_uint (dec));
// negative integers are stored as the unsigned value n and stand for -1 - n
1128 case MAJOR_NEG_INT >> MAJOR_SHIFT: return newSViv (-1 - (IV)decode_uint (dec));
1129 case MAJOR_BYTES >> MAJOR_SHIFT: return decode_str (dec, 0);
1130 case MAJOR_TEXT >> MAJOR_SHIFT: return decode_str (dec, 1);
1131 case MAJOR_ARRAY >> MAJOR_SHIFT: return decode_av (dec);
1132 case MAJOR_MAP >> MAJOR_SHIFT: return decode_hv (dec);
1133 case MAJOR_TAG >> MAJOR_SHIFT: return decode_tagged (dec);
1134
1135 case MAJOR_MISC >> MAJOR_SHIFT:
// simple values and floats: the initial byte is consumed here
1136 switch (*dec->cur++ & MINOR_MASK)
1137 {
// in CBOR_SLOW builds the singleton scalars are looked up again on every use
1138 case SIMPLE_FALSE:
1139 #if CBOR_SLOW
1140 types_false = get_bool ("Types::Serialiser::false");
1141 #endif
1142 return newSVsv (types_false);
1143 case SIMPLE_TRUE:
1144 #if CBOR_SLOW
1145 types_true = get_bool ("Types::Serialiser::true");
1146 #endif
1147 return newSVsv (types_true);
1148 case SIMPLE_NULL:
1149 return newSVsv (&PL_sv_undef);
1150 case SIMPLE_UNDEF:
1151 #if CBOR_SLOW
1152 types_error = get_bool ("Types::Serialiser::error");
1153 #endif
1154 return newSVsv (types_error);
1155
1156 case MISC_FLOAT16:
1157 {
1158 WANT (2);
1159
// assemble the two big-endian octets by hand
1160 uint16_t fp = (dec->cur[0] << 8) | dec->cur[1];
1161 dec->cur += 2;
1162
1163 return newSVnv (ecb_binary16_to_float (fp));
1164 }
1165
1166 case MISC_FLOAT32:
1167 {
1168 uint32_t fp;
1169 WANT (4);
1170 memcpy (&fp, dec->cur, 4);
1171 dec->cur += 4;
1172
// the input is big-endian, swap on hosts that are not
1173 if (!ecb_big_endian ())
1174 fp = ecb_bswap32 (fp);
1175
1176 return newSVnv (ecb_binary32_to_float (fp));
1177 }
1178
1179 case MISC_FLOAT64:
1180 {
1181 uint64_t fp;
1182 WANT (8);
1183 memcpy (&fp, dec->cur, 8);
1184 dec->cur += 8;
1185
1186 if (!ecb_big_endian ())
1187 fp = ecb_bswap64 (fp);
1188
1189 return newSVnv (ecb_binary64_to_double (fp));
1190 }
1191
1192 // 0..19 unassigned simple
1193 // 24 reserved + unassigned simple (reserved values are not encodable)
1194 // 28-30 unassigned misc
1195 // 31 break code
1196 default:
1197 ERR ("corrupted CBOR data (reserved/unassigned/unexpected major 7 value)");
1198 }
1199
1200 break;
1201 }
1202
1203 fail:
1204 return &PL_sv_undef;
1205 }
1206
1207 static SV *
1208 decode_cbor (SV *string, CBOR *cbor, char **offset_return)
1209 {
1210 dec_t dec = { 0 };
1211 SV *sv;
1212 STRLEN len;
1213 char *data = SvPVbyte (string, len);
1214
1215 if (len > cbor->max_size && cbor->max_size)
1216 croak ("attempted decode of CBOR text of %lu bytes size, but max_size is set to %lu",
1217 (unsigned long)len, (unsigned long)cbor->max_size);
1218
1219 dec.cbor = *cbor;
1220 dec.cur = (U8 *)data;
1221 dec.end = (U8 *)data + len;
1222
1223 sv = decode_sv (&dec);
1224
1225 if (offset_return)
1226 *offset_return = dec.cur;
1227
1228 if (!(offset_return || !sv))
1229 if (dec.cur != dec.end && !dec.err)
1230 dec.err = "garbage after CBOR object";
1231
1232 if (dec.err)
1233 {
1234 if (dec.shareable)
1235 {
1236 // need to break cyclic links, which whould all be in shareable
1237 int i;
1238 SV **svp;
1239
1240 for (i = av_len (dec.shareable) + 1; i--; )
1241 if ((svp = av_fetch (dec.shareable, i, 0)))
1242 sv_setsv (*svp, &PL_sv_undef);
1243 }
1244
1245 SvREFCNT_dec (sv);
1246 croak ("%s, at offset %d (octet 0x%02x)", dec.err, dec.cur - (U8 *)data, (int)(uint8_t)*dec.cur);
1247 }
1248
1249 sv = sv_2mortal (sv);
1250
1251 return sv;
1252 }
1253
1254 /////////////////////////////////////////////////////////////////////////////
1255 // incremental parser
1256
// true when the incr_count stack of cbor holds no entries
1257 #define INCR_DONE(cbor) (AvFILLp (cbor->incr_count) < 0)
1258
1259 // returns 0 for notyet, 1 for success or error
// scans the data in cborstr from self->incr_pos onwards without building any values.
// the top entry of self->incr_count holds the number of items still outstanding on the
// current nesting level (-1 for indefinite length), self->incr_need the number of
// bytes that must be available before scanning can continue.
1260 static int
1261 incr_parse (CBOR *self, SV *cborstr)
1262 {
1263 STRLEN cur;
// only the length is of interest here, it is stored in cur
1264 SvPV (cborstr, cur);
1265
1266 while (ecb_expect_true (self->incr_need <= cur))
1267 {
1268 // table of integer count bytes
// indexed by minor value: number of length bytes following the initial byte,
// -1 for the minors 28..30, -2 for minor 31 (MINOR_INDEF)
1269 static I8 incr_len[MINOR_MASK + 1] = {
1270 0, 0, 0, 0, 0, 0, 0, 0,
1271 0, 0, 0, 0, 0, 0, 0, 0,
1272 0, 0, 0, 0, 0, 0, 0, 0,
1273 1, 2, 4, 8,-1,-1,-1,-2
1274 };
1275
1276 const U8 *p = SvPVX (cborstr) + self->incr_pos;
1277 U8 m = *p & MINOR_MASK;
// outstanding item count of the innermost open level
1278 IV count = SvIVX (AvARRAY (self->incr_count)[AvFILLp (self->incr_count)]);
1279 I8 ilen = incr_len[m];
1280
// at least the initial byte is consumed
1281 self->incr_need = self->incr_pos + 1;
1282
1283 if (ecb_expect_false (ilen < 0))
1284 {
// minors 28..30 are rejected, only MINOR_INDEF continues
1285 if (m != MINOR_INDEF)
1286 return 1; // error
1287
1288 if (*p == (MAJOR_MISC | MINOR_INDEF))
1289 {
// break code: only acceptable while inside an indefinite-length level (count < 0)
1290 if (count >= 0)
1291 return 1; // error
1292
// setting count to 1 makes the countdown below close this level
1293 count = 1;
1294 }
1295 else
1296 {
// start of an indefinite-length item: open a new level without a fixed count
1297 av_push (self->incr_count, newSViv (-1)); //TODO: nest
1298 count = -1;
1299 }
1300 }
1301 else
1302 {
// the length bytes must be complete before they can be inspected
1303 self->incr_need += ilen;
1304 if (ecb_expect_false (self->incr_need > cur))
1305 return 0;
1306
1307 int major = *p >> MAJOR_SHIFT;
1308
1309 switch (major)
1310 {
1311 case MAJOR_TAG >> MAJOR_SHIFT:
1312 ++count; // tags merely prefix another value
1313 break;
1314
1315 case MAJOR_BYTES >> MAJOR_SHIFT:
1316 case MAJOR_TEXT >> MAJOR_SHIFT:
1317 case MAJOR_ARRAY >> MAJOR_SHIFT:
1318 case MAJOR_MAP >> MAJOR_SHIFT:
1319 {
1320 UV len;
1321
1322 if (ecb_expect_false (ilen))
1323 {
1324 len = 0;
1325
// assemble the big-endian length from the ilen bytes following the initial byte
1326 do {
1327 len = (len << 8) | *++p;
1328 } while (--ilen);
1329 }
1330 else
1331 len = m;
1332
1333 switch (major)
1334 {
1335 case MAJOR_BYTES >> MAJOR_SHIFT:
1336 case MAJOR_TEXT >> MAJOR_SHIFT:
// strings: the payload has to be available as well
1337 self->incr_need += len;
1338 if (ecb_expect_false (self->incr_need > cur))
1339 return 0;
1340
1341 break;
1342
1343 case MAJOR_MAP >> MAJOR_SHIFT:
// a map of len pairs contains twice as many items; falls through to the array case on purpose
1344 len <<= 1;
1345 case MAJOR_ARRAY >> MAJOR_SHIFT:
1346 if (len)
1347 {
// open a new level; the extra one accounts for the container item itself,
// which the countdown below subtracts right away
1348 av_push (self->incr_count, newSViv (len + 1)); //TODO: nest
1349 count = len + 1;
1350 }
1351 break;
1352 }
1353 }
1354 }
1355 }
1356
// everything up to incr_need has been scanned
1357 self->incr_pos = self->incr_need;
1358
1359 if (count > 0)
1360 {
// one item finished; whenever a level reaches zero, close it and continue with its parent
1361 while (!--count)
1362 {
// the outermost level is complete
1363 if (!AvFILLp (self->incr_count))
1364 return 1; // done
1365
1366 SvREFCNT_dec_NN (av_pop (self->incr_count));
1367 count = SvIVX (AvARRAY (self->incr_count)[AvFILLp (self->incr_count)]);
1368 }
1369
// write the updated count back to the (possibly new) top level
1370 SvIVX (AvARRAY (self->incr_count)[AvFILLp (self->incr_count)]) = count;
1371 }
1372 }
1373
1374 return 0;
1375 }
1376
1377
1378 /////////////////////////////////////////////////////////////////////////////
1379 // XS interface functions
1380
1381 MODULE = CBOR::XS PACKAGE = CBOR::XS
1382
BOOT:
{
        // one-time module setup: cache the stashes and shared SVs in file globals

        // our own packages
        cbor_stash        = gv_stashpv ("CBOR::XS"        , GV_ADD);
        cbor_tagged_stash = gv_stashpv ("CBOR::XS::Tagged", GV_ADD);

        // Types::Serialiser packages and singletons
        types_boolean_stash = gv_stashpv ("Types::Serialiser::Boolean", GV_ADD);
        types_error_stash   = gv_stashpv ("Types::Serialiser::Error"  , GV_ADD);

        types_true  = get_bool ("Types::Serialiser::true" );
        types_false = get_bool ("Types::Serialiser::false");
        types_error = get_bool ("Types::Serialiser::error");

        // constant strings kept around as SVs
        default_filter = newSVpv ("CBOR::XS::default_filter", 0);

        sv_cbor = newSVpv ("CBOR", 0);
        SvREADONLY_on (sv_cbor);

        // length arithmetic in this file relies on unsigned wrap-around
        assert (("STRLEN must be an unsigned type", 0 <= (STRLEN)-1));
}
1402
1403 PROTOTYPES: DISABLE
1404
void CLONE (...)
	CODE:
        // forget all cached stash pointers
        types_boolean_stash =
        types_error_stash   =
        cbor_tagged_stash   =
        cbor_stash          = 0;
1411
void new (char *klass)
	PPCODE:
{
        // the CBOR struct lives inside the string buffer of a plain scalar
        SV *pv = NEWSV (0, sizeof (CBOR));
        HV *stash;
        SV *obj;

        SvPOK_only (pv);
        cbor_init ((CBOR *)SvPVX (pv));

        // use the cached stash for the base class, look up any other class
        if (strEQ (klass, "CBOR::XS"))
          stash = CBOR_STASH;
        else
          stash = gv_stashpv (klass, 1);

        obj = sv_bless (newRV_noinc (pv), stash);
        XPUSHs (sv_2mortal (obj));
}
1423
void shrink (CBOR *self, int enable = 1)
	ALIAS:
        shrink          = F_SHRINK
        allow_unknown   = F_ALLOW_UNKNOWN
        allow_sharing   = F_ALLOW_SHARING
        allow_cycles    = F_ALLOW_CYCLES
        pack_strings    = F_PACK_STRINGS
        text_keys       = F_TEXT_KEYS
        text_strings    = F_TEXT_STRINGS
        validate_utf8   = F_VALIDATE_UTF8
	PPCODE:
{
        // ix is the flag bit selected by the alias the method was called as
        self->flags = enable
                      ? self->flags |  ix
                      : self->flags & ~ix;

        // return the object itself so that calls can be chained
        XPUSHs (ST (0));
}
1443
void get_shrink (CBOR *self)
	ALIAS:
        get_shrink          = F_SHRINK
        get_allow_unknown   = F_ALLOW_UNKNOWN
        get_allow_sharing   = F_ALLOW_SHARING
        get_allow_cycles    = F_ALLOW_CYCLES
        get_pack_strings    = F_PACK_STRINGS
        get_text_keys       = F_TEXT_KEYS
        get_text_strings    = F_TEXT_STRINGS
        get_validate_utf8   = F_VALIDATE_UTF8
	PPCODE:
{
        // ix is the flag bit selected by the alias the method was called as
        SV *state = (self->flags & ix) ? &PL_sv_yes : &PL_sv_no;

        XPUSHs (state);
}
1456
void max_depth (CBOR *self, U32 max_depth = 0x80000000UL)
	PPCODE:
{
        // store the new limit and return the object for chaining
        self->max_depth = max_depth;

        XPUSHs (ST (0));
}
1461
U32 get_max_depth (CBOR *self)
	CODE:
{
        // plain accessor for the configured nesting limit
        RETVAL = self->max_depth;
}
	OUTPUT:
        RETVAL
1467
void max_size (CBOR *self, U32 max_size = 0)
	PPCODE:
{
        // store the new limit and return the object for chaining
        self->max_size = max_size;

        XPUSHs (ST (0));
}
1472
U32 get_max_size (CBOR *self)
	CODE:
        // the setter accepts a U32, so report the value with the same unsigned
        // type - as an int, limits above INT_MAX would read back negative
        RETVAL = self->max_size;
	OUTPUT:
        RETVAL
1478
void filter (CBOR *self, SV *filter = 0)
	PPCODE:
{
        // Replaces the stored filter by a private copy of the argument, or
        // clears it when no argument is given. The copy is made before the
        // old value is released, so that passing in the very SV that is
        // currently stored cannot read freed memory.
        SV *old_filter = self->filter;

        self->filter = filter ? newSVsv (filter) : 0;
        SvREFCNT_dec (old_filter);

        // return the object itself so that calls can be chained
        XPUSHs (ST (0));
}
1484
SV *get_filter (CBOR *self)
	CODE:
        // Returns the stored filter, or a fresh undefined scalar if none is
        // set. An SV * RETVAL is mortalised by the generated glue code, so we
        // must hand out a reference of our own - otherwise the reference held
        // by self->filter would be consumed and the pointer left dangling.
        RETVAL = self->filter ? SvREFCNT_inc (self->filter) : NEWSV (0, 0);
	OUTPUT:
        RETVAL
1490
void encode (CBOR *self, SV *scalar)
	PPCODE:
{
        SV *encoded;

        // sync the perl stack pointer around the call into the encoder
        PUTBACK;
        encoded = encode_cbor (scalar, self);
        SPAGAIN;

        XPUSHs (encoded);
}
1495
void decode (CBOR *self, SV *cborstr)
	PPCODE:
{
        SV *decoded;

        // sync the perl stack pointer around the call into the decoder;
        // no end offset is requested
        PUTBACK;
        decoded = decode_cbor (cborstr, self, 0);
        SPAGAIN;

        XPUSHs (decoded);
}
1500
void decode_prefix (CBOR *self, SV *cborstr)
	PPCODE:
{
        SV *decoded;
        SV *consumed;
        char *end;

        // ask the decoder to report where it stopped
        PUTBACK;
        decoded = decode_cbor (cborstr, self, &end);
        SPAGAIN;

        // returns (value, number of octets consumed)
        consumed = sv_2mortal (newSVuv (end - SvPVX (cborstr)));

        EXTEND (SP, 2);
        PUSHs (decoded);
        PUSHs (consumed);
}
1511
void incr_parse (CBOR *self, SV *cborstr)
	ALIAS:
        incr_parse_multiple = 1
	PPCODE:
{
        // the scanner works on octets, so get rid of any utf-8 upgrade first
        if (SvUTF8 (cborstr))
          sv_utf8_downgrade (cborstr, 0);

        // set up the scanner state on first use (or after incr_reset)
        if (!self->incr_count)
          {
            AV *levels = newAV ();

            av_push (levels, newSViv (1));

            self->incr_count = levels;
            self->incr_pos   = 0;
            self->incr_need  = 1;
          }

        // incr_parse (ix == 0) extracts at most one value,
        // incr_parse_multiple (ix == 1) as many as are available
        for (;;)
          {
            SV *value;
            char *end;

            if (!incr_parse (self, cborstr))
              {
                // more data is needed - refuse if that would exceed the limit
                if (self->max_size && self->incr_need > self->max_size)
                  croak ("attempted decode of CBOR text of %lu bytes size, but max_size is set to %lu",
                         (unsigned long)self->incr_need, (unsigned long)self->max_size);

                break;
              }

            PUTBACK;
            value = decode_cbor (cborstr, self, &end);
            SPAGAIN;
            XPUSHs (value);

            // drop the decoded octets from the front of the buffer
            sv_chop (cborstr, end);

            // restart the scanner for the next top-level value
            av_clear (self->incr_count);
            av_push (self->incr_count, newSViv (1));

            self->incr_pos  = 0;
            self->incr_need = 1;

            if (!ix)
              break;
          }
}
1556
void incr_reset (CBOR *self)
	CODE:
{
        // detach the scanner state first, then release it; the next
        // incr_parse call sets up a fresh one
        AV *levels = self->incr_count;

        self->incr_count = 0;
        SvREFCNT_dec (levels);
}
1563
void DESTROY (CBOR *self)
	PPCODE:
{
        // hand the struct to cbor_free for cleanup; nothing is returned
        cbor_free (self);
}
1567
1568 PROTOTYPES: ENABLE
1569
void encode_cbor (SV *scalar)
	ALIAS:
        encode_cbor         = 0
        encode_cbor_sharing = F_ALLOW_SHARING
	PPCODE:
{
        // functional interface: encode with a temporary, default-initialised
        // coder, plus whatever flag the alias selects
        CBOR coder;
        SV *encoded;

        cbor_init (&coder);
        coder.flags |= ix;

        PUTBACK;
        encoded = encode_cbor (scalar, &coder);
        SPAGAIN;

        XPUSHs (encoded);
}
1582
void decode_cbor (SV *cborstr)
	PPCODE:
{
        // functional interface: decode with a temporary, default-initialised coder
        CBOR coder;
        SV *decoded;

        cbor_init (&coder);

        PUTBACK;
        decoded = decode_cbor (cborstr, &coder, 0);
        SPAGAIN;

        XPUSHs (decoded);
}
1591