ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/CBOR-XS/XS.xs
Revision: 1.53
Committed: Sun Apr 24 19:51:41 2016 UTC (8 years ago) by root
Branch: MAIN
Changes since 1.52: +34 -28 lines
Log Message:
*** empty log message ***

File Contents

# Content
1 #include "EXTERN.h"
2 #include "perl.h"
3 #include "XSUB.h"
4
5 #include <assert.h>
6 #include <string.h>
7 #include <stdlib.h>
8 #include <stdio.h>
9 #include <limits.h>
10 #include <float.h>
11
12 #define ECB_NO_THREADS 1
13 #include "ecb.h"
14
15 // compatibility with perl <5.18
16 #ifndef HvNAMELEN_get
17 # define HvNAMELEN_get(hv) strlen (HvNAME (hv))
18 #endif
19 #ifndef HvNAMELEN
20 # define HvNAMELEN(hv) HvNAMELEN_get (hv)
21 #endif
22 #ifndef HvNAMEUTF8
23 # define HvNAMEUTF8(hv) 0
24 #endif
25 #ifndef SvREFCNT_dec_NN
26 # define SvREFCNT_dec_NN(sv) SvREFCNT_dec (sv)
27 #endif
28
29 // known major and minor types
30 enum cbor_type
31 {
32 MAJOR_SHIFT = 5,
33 MINOR_MASK = 0x1f,
34
35 MAJOR_POS_INT = 0 << MAJOR_SHIFT,
36 MAJOR_NEG_INT = 1 << MAJOR_SHIFT,
37 MAJOR_BYTES = 2 << MAJOR_SHIFT,
38 MAJOR_TEXT = 3 << MAJOR_SHIFT,
39 MAJOR_ARRAY = 4 << MAJOR_SHIFT,
40 MAJOR_MAP = 5 << MAJOR_SHIFT,
41 MAJOR_TAG = 6 << MAJOR_SHIFT,
42 MAJOR_MISC = 7 << MAJOR_SHIFT,
43
44 // INT/STRING/ARRAY/MAP subtypes
45 LENGTH_EXT1 = 24,
46 LENGTH_EXT2 = 25,
47 LENGTH_EXT4 = 26,
48 LENGTH_EXT8 = 27,
49
50 // SIMPLE types (effectively MISC subtypes)
51 SIMPLE_FALSE = 20,
52 SIMPLE_TRUE = 21,
53 SIMPLE_NULL = 22,
54 SIMPLE_UNDEF = 23,
55
56 // MISC subtype (unused)
57 MISC_EXT1 = 24,
58 MISC_FLOAT16 = 25,
59 MISC_FLOAT32 = 26,
60 MISC_FLOAT64 = 27,
61
62 // BYTES/TEXT/ARRAY/MAP
63 MINOR_INDEF = 31,
64 };
65
66 // known tags
67 enum cbor_tag
68 {
69 // extensions
70 CBOR_TAG_STRINGREF = 25, // http://cbor.schmorp.de/stringref
71 CBOR_TAG_PERL_OBJECT = 26, // http://cbor.schmorp.de/perl-object
72 CBOR_TAG_GENERIC_OBJECT = 27, // http://cbor.schmorp.de/generic-object
73 CBOR_TAG_VALUE_SHAREABLE = 28, // http://cbor.schmorp.de/value-sharing
74 CBOR_TAG_VALUE_SHAREDREF = 29, // http://cbor.schmorp.de/value-sharing
75 CBOR_TAG_STRINGREF_NAMESPACE = 256, // http://cbor.schmorp.de/stringref
76 CBOR_TAG_INDIRECTION = 22098, // http://cbor.schmorp.de/indirection
77
78 // rfc7049
79 CBOR_TAG_DATETIME = 0, // rfc4287, utf-8
80 CBOR_TAG_TIMESTAMP = 1, // unix timestamp, any
81 CBOR_TAG_POS_BIGNUM = 2, // byte string
82 CBOR_TAG_NEG_BIGNUM = 3, // byte string
83 CBOR_TAG_DECIMAL = 4, // decimal fraction, array
84 CBOR_TAG_BIGFLOAT = 5, // array
85
86 CBOR_TAG_CONV_B64U = 21, // base64url, any
87 CBOR_TAG_CONV_B64 = 22, // base64, any
88 CBOR_TAG_CONV_HEX = 23, // base16, any
89 CBOR_TAG_CBOR = 24, // embedded cbor, byte string
90
91 CBOR_TAG_URI = 32, // URI rfc3986, utf-8
92 CBOR_TAG_B64U = 33, // base64url rfc4648, utf-8
93 CBOR_TAG_B64 = 34, // base6 rfc46484, utf-8
94 CBOR_TAG_REGEX = 35, // regex pcre/ecma262, utf-8
95 CBOR_TAG_MIME = 36, // mime message rfc2045, utf-8
96
97 CBOR_TAG_MAGIC = 55799, // self-describe cbor
98 };
99
100 #define F_SHRINK 0x00000001UL
101 #define F_ALLOW_UNKNOWN 0x00000002UL
102 #define F_ALLOW_SHARING 0x00000004UL
103 #define F_ALLOW_CYCLES 0x00000008UL
104 #define F_PACK_STRINGS 0x00000010UL
105 #define F_UTF8_STRINGS 0x00000020UL
106 #define F_UTF8_KEYS 0x00000040UL
107 #define F_VALIDATE_UTF8 0x00000080UL
108
109 #define INIT_SIZE 32 // initial scalar size to be allocated
110
111 #define SB do {
112 #define SE } while (0)
113
114 #define IN_RANGE_INC(type,val,beg,end) \
115 ((unsigned type)((unsigned type)(val) - (unsigned type)(beg)) \
116 <= (unsigned type)((unsigned type)(end) - (unsigned type)(beg)))
117
118 #define ERR_NESTING_EXCEEDED "cbor text or perl structure exceeds maximum nesting level (max_depth set too low?)"
119
120 #ifdef USE_ITHREADS
121 # define CBOR_SLOW 1
122 # define CBOR_STASH (cbor_stash ? cbor_stash : gv_stashpv ("CBOR::XS", 1))
123 #else
124 # define CBOR_SLOW 0
125 # define CBOR_STASH cbor_stash
126 #endif
127
128 static HV *cbor_stash, *types_boolean_stash, *types_error_stash, *cbor_tagged_stash; // CBOR::XS::
129 static SV *types_true, *types_false, *types_error, *sv_cbor, *default_filter;
130
131 typedef struct {
132 U32 flags;
133 U32 max_depth;
134 STRLEN max_size;
135 SV *filter;
136
137 // for the incremental parser
138 STRLEN incr_pos; // the current offset into the text
139 STRLEN incr_need; // minimum bytes needed to decode
140 AV *incr_count; // for every nesting level, the number of outstanding values, or -1 for indef.
141 } CBOR;
142
143 ecb_inline void
144 cbor_init (CBOR *cbor)
145 {
146 Zero (cbor, 1, CBOR);
147 cbor->max_depth = 512;
148 }
149
150 ecb_inline void
151 cbor_free (CBOR *cbor)
152 {
153 SvREFCNT_dec (cbor->filter);
154 SvREFCNT_dec (cbor->incr_count);
155 }
156
157 /////////////////////////////////////////////////////////////////////////////
158 // utility functions
159
160 ecb_inline SV *
161 get_bool (const char *name)
162 {
163 SV *sv = get_sv (name, 1);
164
165 SvREADONLY_on (sv);
166 SvREADONLY_on (SvRV (sv));
167
168 return sv;
169 }
170
171 ecb_inline void
172 shrink (SV *sv)
173 {
174 sv_utf8_downgrade (sv, 1);
175
176 if (SvLEN (sv) > SvCUR (sv) + 1)
177 {
178 #ifdef SvPV_shrink_to_cur
179 SvPV_shrink_to_cur (sv);
180 #elif defined (SvPV_renew)
181 SvPV_renew (sv, SvCUR (sv) + 1);
182 #endif
183 }
184 }
185
186 // minimum length of a string to be registered for stringref
187 ecb_inline int
188 minimum_string_length (UV idx)
189 {
190 return idx > 23
191 ? idx > 0xffU
192 ? idx > 0xffffU
193 ? idx > 0xffffffffU
194 ? 11
195 : 7
196 : 5
197 : 4
198 : 3;
199 }
200
201 /////////////////////////////////////////////////////////////////////////////
202 // encoder
203
204 // structure used for encoding CBOR
205 typedef struct
206 {
207 char *cur; // SvPVX (sv) + current output position
208 char *end; // SvEND (sv)
209 SV *sv; // result scalar
210 CBOR cbor;
211 U32 depth; // recursion level
212 HV *stringref[2]; // string => index, or 0 ([0] = bytes, [1] = utf-8)
213 UV stringref_idx;
214 HV *shareable; // ptr => index, or 0
215 UV shareable_idx;
216 } enc_t;
217
218 ecb_inline void
219 need (enc_t *enc, STRLEN len)
220 {
221 if (ecb_expect_false (enc->cur + len >= enc->end))
222 {
223 STRLEN cur = enc->cur - (char *)SvPVX (enc->sv);
224 SvGROW (enc->sv, cur + (len < (cur >> 2) ? cur >> 2 : len) + 1);
225 enc->cur = SvPVX (enc->sv) + cur;
226 enc->end = SvPVX (enc->sv) + SvLEN (enc->sv) - 1;
227 }
228 }
229
230 ecb_inline void
231 encode_ch (enc_t *enc, char ch)
232 {
233 need (enc, 1);
234 *enc->cur++ = ch;
235 }
236
237 static void
238 encode_uint (enc_t *enc, int major, UV len)
239 {
240 need (enc, 9);
241
242 if (ecb_expect_true (len < LENGTH_EXT1))
243 *enc->cur++ = major | len;
244 else if (ecb_expect_true (len <= 0xffU))
245 {
246 *enc->cur++ = major | LENGTH_EXT1;
247 *enc->cur++ = len;
248 }
249 else if (len <= 0xffffU)
250 {
251 *enc->cur++ = major | LENGTH_EXT2;
252 *enc->cur++ = len >> 8;
253 *enc->cur++ = len;
254 }
255 else if (len <= 0xffffffffU)
256 {
257 *enc->cur++ = major | LENGTH_EXT4;
258 *enc->cur++ = len >> 24;
259 *enc->cur++ = len >> 16;
260 *enc->cur++ = len >> 8;
261 *enc->cur++ = len;
262 }
263 else
264 {
265 *enc->cur++ = major | LENGTH_EXT8;
266 *enc->cur++ = len >> 56;
267 *enc->cur++ = len >> 48;
268 *enc->cur++ = len >> 40;
269 *enc->cur++ = len >> 32;
270 *enc->cur++ = len >> 24;
271 *enc->cur++ = len >> 16;
272 *enc->cur++ = len >> 8;
273 *enc->cur++ = len;
274 }
275 }
276
277 ecb_inline void
278 encode_tag (enc_t *enc, UV tag)
279 {
280 encode_uint (enc, MAJOR_TAG, tag);
281 }
282
283 // exceptional (hopefully) slow path for byte strings that need to be utf8-encoded
284 ecb_noinline static void
285 encode_str_utf8 (enc_t *enc, int utf8, char *str, STRLEN len)
286 {
287 STRLEN ulen = len;
288 U8 *p, *pend = (U8 *)str + len;
289
290 for (p = (U8 *)str; p < pend; ++p)
291 ulen += *p >> 7; // count set high bits
292
293 encode_uint (enc, MAJOR_TEXT, ulen);
294
295 need (enc, ulen);
296 for (p = (U8 *)str; p < pend; ++p)
297 if (*p < 0x80)
298 *enc->cur++ = *p;
299 else
300 {
301 *enc->cur++ = 0xc0 + (*p >> 6);
302 *enc->cur++ = 0x80 + (*p & 63);
303 }
304 }
305
306 ecb_inline void
307 encode_str (enc_t *enc, int upgrade_utf8, int utf8, char *str, STRLEN len)
308 {
309 if (ecb_expect_false (upgrade_utf8))
310 if (!utf8)
311 {
312 encode_str_utf8 (enc, utf8, str, len);
313 return;
314 }
315
316 encode_uint (enc, utf8 ? MAJOR_TEXT : MAJOR_BYTES, len);
317 need (enc, len);
318 memcpy (enc->cur, str, len);
319 enc->cur += len;
320 }
321
322 ecb_inline
323 encode_strref (enc_t *enc, int upgrade_utf8, int utf8, char *str, STRLEN len)
324 {
325 if (ecb_expect_false (enc->cbor.flags & F_PACK_STRINGS))
326 {
327 SV **svp = hv_fetch (enc->stringref[!!utf8], str, len, 1);
328
329 if (SvOK (*svp))
330 {
331 // already registered, use stringref
332 encode_tag (enc, CBOR_TAG_STRINGREF);
333 encode_uint (enc, MAJOR_POS_INT, SvUV (*svp));
334 return;
335 }
336 else if (len >= minimum_string_length (enc->stringref_idx))
337 {
338 // register only
339 sv_setuv (*svp, enc->stringref_idx);
340 ++enc->stringref_idx;
341 }
342 }
343
344 encode_str (enc, upgrade_utf8, utf8, str, len);
345 }
346
347 static void encode_sv (enc_t *enc, SV *sv);
348
349 static void
350 encode_av (enc_t *enc, AV *av)
351 {
352 int i, len = av_len (av);
353
354 if (enc->depth >= enc->cbor.max_depth)
355 croak (ERR_NESTING_EXCEEDED);
356
357 ++enc->depth;
358
359 encode_uint (enc, MAJOR_ARRAY, len + 1);
360
361 if (SvMAGICAL (av))
362 for (i = 0; i <= len; ++i)
363 {
364 SV **svp = av_fetch (av, i, 0);
365 encode_sv (enc, svp ? *svp : &PL_sv_undef);
366 }
367 else
368 for (i = 0; i <= len; ++i)
369 {
370 SV *sv = AvARRAY (av)[i];
371 encode_sv (enc, sv ? sv : &PL_sv_undef);
372 }
373
374 --enc->depth;
375 }
376
377 static void
378 encode_hv (enc_t *enc, HV *hv)
379 {
380 HE *he;
381
382 if (enc->depth >= enc->cbor.max_depth)
383 croak (ERR_NESTING_EXCEEDED);
384
385 ++enc->depth;
386
387 int pairs = hv_iterinit (hv);
388 int mg = SvMAGICAL (hv);
389
390 if (mg)
391 encode_ch (enc, MAJOR_MAP | MINOR_INDEF);
392 else
393 encode_uint (enc, MAJOR_MAP, pairs);
394
395 while ((he = hv_iternext (hv)))
396 {
397 if (HeKLEN (he) == HEf_SVKEY)
398 encode_sv (enc, HeSVKEY (he));
399 else
400 encode_strref (enc, enc->cbor.flags & (F_UTF8_KEYS | F_UTF8_STRINGS), HeKUTF8 (he), HeKEY (he), HeKLEN (he));
401
402 encode_sv (enc, ecb_expect_false (mg) ? hv_iterval (hv, he) : HeVAL (he));
403 }
404
405 if (mg)
406 encode_ch (enc, MAJOR_MISC | MINOR_INDEF);
407
408 --enc->depth;
409 }
410
411 // encode objects, arrays and special \0=false and \1=true values.
412 static void
413 encode_rv (enc_t *enc, SV *sv)
414 {
415 SvGETMAGIC (sv);
416
417 svtype svt = SvTYPE (sv);
418
419 if (ecb_expect_false (SvOBJECT (sv)))
420 {
421 HV *boolean_stash = !CBOR_SLOW || types_boolean_stash
422 ? types_boolean_stash
423 : gv_stashpv ("Types::Serialiser::Boolean", 1);
424 HV *error_stash = !CBOR_SLOW || types_error_stash
425 ? types_error_stash
426 : gv_stashpv ("Types::Serialiser::Error", 1);
427 HV *tagged_stash = !CBOR_SLOW || cbor_tagged_stash
428 ? cbor_tagged_stash
429 : gv_stashpv ("CBOR::XS::Tagged" , 1);
430
431 HV *stash = SvSTASH (sv);
432
433 if (stash == boolean_stash)
434 {
435 encode_ch (enc, SvIV (sv) ? MAJOR_MISC | SIMPLE_TRUE : MAJOR_MISC | SIMPLE_FALSE);
436 return;
437 }
438 else if (stash == error_stash)
439 {
440 encode_ch (enc, MAJOR_MISC | SIMPLE_UNDEF);
441 return;
442 }
443 else if (stash == tagged_stash)
444 {
445 if (svt != SVt_PVAV)
446 croak ("encountered CBOR::XS::Tagged object that isn't an array");
447
448 encode_uint (enc, MAJOR_TAG, SvUV (*av_fetch ((AV *)sv, 0, 1)));
449 encode_sv (enc, *av_fetch ((AV *)sv, 1, 1));
450
451 return;
452 }
453 }
454
455 if (ecb_expect_false (SvREFCNT (sv) > 1)
456 && ecb_expect_false (enc->cbor.flags & F_ALLOW_SHARING))
457 {
458 if (!enc->shareable)
459 enc->shareable = (HV *)sv_2mortal ((SV *)newHV ());
460
461 SV **svp = hv_fetch (enc->shareable, (char *)&sv, sizeof (sv), 1);
462
463 if (SvOK (*svp))
464 {
465 encode_tag (enc, CBOR_TAG_VALUE_SHAREDREF);
466 encode_uint (enc, MAJOR_POS_INT, SvUV (*svp));
467 return;
468 }
469 else
470 {
471 sv_setuv (*svp, enc->shareable_idx);
472 ++enc->shareable_idx;
473 encode_tag (enc, CBOR_TAG_VALUE_SHAREABLE);
474 }
475 }
476
477 if (ecb_expect_false (SvOBJECT (sv)))
478 {
479 HV *stash = SvSTASH (sv);
480 GV *method;
481
482 if ((method = gv_fetchmethod_autoload (stash, "TO_CBOR", 0)))
483 {
484 dSP;
485
486 ENTER; SAVETMPS;
487 PUSHMARK (SP);
488 // we re-bless the reference to get overload and other niceties right
489 XPUSHs (sv_bless (sv_2mortal (newRV_inc (sv)), stash));
490
491 PUTBACK;
492 // G_SCALAR ensures that return value is 1
493 call_sv ((SV *)GvCV (method), G_SCALAR);
494 SPAGAIN;
495
496 // catch this surprisingly common error
497 if (SvROK (TOPs) && SvRV (TOPs) == sv)
498 croak ("%s::TO_CBOR method returned same object as was passed instead of a new one", HvNAME (stash));
499
500 encode_sv (enc, POPs);
501
502 PUTBACK;
503
504 FREETMPS; LEAVE;
505 }
506 else if ((method = gv_fetchmethod_autoload (stash, "FREEZE", 0)) != 0)
507 {
508 dSP;
509
510 ENTER; SAVETMPS;
511 SAVESTACK_POS ();
512 PUSHMARK (SP);
513 EXTEND (SP, 2);
514 // we re-bless the reference to get overload and other niceties right
515 PUSHs (sv_bless (sv_2mortal (newRV_inc (sv)), stash));
516 PUSHs (sv_cbor);
517
518 PUTBACK;
519 int count = call_sv ((SV *)GvCV (method), G_ARRAY);
520 SPAGAIN;
521
522 // catch this surprisingly common error
523 if (count == 1 && SvROK (TOPs) && SvRV (TOPs) == sv)
524 croak ("%s::FREEZE(CBOR) method returned same object as was passed instead of a new one", HvNAME (stash));
525
526 encode_tag (enc, CBOR_TAG_PERL_OBJECT);
527 encode_uint (enc, MAJOR_ARRAY, count + 1);
528 encode_strref (enc, 0, HvNAMEUTF8 (stash), HvNAME (stash), HvNAMELEN (stash));
529
530 while (count)
531 encode_sv (enc, SP[1 - count--]);
532
533 PUTBACK;
534
535 FREETMPS; LEAVE;
536 }
537 else
538 croak ("encountered object '%s', but no TO_CBOR or FREEZE methods available on it",
539 SvPV_nolen (sv_2mortal (newRV_inc (sv))));
540 }
541 else if (svt == SVt_PVHV)
542 encode_hv (enc, (HV *)sv);
543 else if (svt == SVt_PVAV)
544 encode_av (enc, (AV *)sv);
545 else
546 {
547 encode_tag (enc, CBOR_TAG_INDIRECTION);
548 encode_sv (enc, sv);
549 }
550 }
551
552 static void
553 encode_nv (enc_t *enc, SV *sv)
554 {
555 double nv = SvNVX (sv);
556
557 need (enc, 9);
558
559 if (ecb_expect_false (nv == (NV)(U32)nv))
560 encode_uint (enc, MAJOR_POS_INT, (U32)nv);
561 //TODO: maybe I32?
562 else if (ecb_expect_false (nv == (float)nv))
563 {
564 uint32_t fp = ecb_float_to_binary32 (nv);
565
566 *enc->cur++ = MAJOR_MISC | MISC_FLOAT32;
567
568 if (!ecb_big_endian ())
569 fp = ecb_bswap32 (fp);
570
571 memcpy (enc->cur, &fp, 4);
572 enc->cur += 4;
573 }
574 else
575 {
576 uint64_t fp = ecb_double_to_binary64 (nv);
577
578 *enc->cur++ = MAJOR_MISC | MISC_FLOAT64;
579
580 if (!ecb_big_endian ())
581 fp = ecb_bswap64 (fp);
582
583 memcpy (enc->cur, &fp, 8);
584 enc->cur += 8;
585 }
586 }
587
588 static void
589 encode_sv (enc_t *enc, SV *sv)
590 {
591 SvGETMAGIC (sv);
592
593 if (SvPOKp (sv))
594 {
595 STRLEN len;
596 char *str = SvPV (sv, len);
597 encode_strref (enc, enc->cbor.flags & F_UTF8_STRINGS, SvUTF8 (sv), str, len);
598 }
599 else if (SvNOKp (sv))
600 encode_nv (enc, sv);
601 else if (SvIOKp (sv))
602 {
603 if (SvIsUV (sv))
604 encode_uint (enc, MAJOR_POS_INT, SvUVX (sv));
605 else if (SvIVX (sv) >= 0)
606 encode_uint (enc, MAJOR_POS_INT, SvIVX (sv));
607 else
608 encode_uint (enc, MAJOR_NEG_INT, -(SvIVX (sv) + 1));
609 }
610 else if (SvROK (sv))
611 encode_rv (enc, SvRV (sv));
612 else if (!SvOK (sv))
613 encode_ch (enc, MAJOR_MISC | SIMPLE_NULL);
614 else if (enc->cbor.flags & F_ALLOW_UNKNOWN)
615 encode_ch (enc, MAJOR_MISC | SIMPLE_UNDEF);
616 else
617 croak ("encountered perl type (%s,0x%x) that CBOR cannot handle, check your input data",
618 SvPV_nolen (sv), (unsigned int)SvFLAGS (sv));
619 }
620
621 static SV *
622 encode_cbor (SV *scalar, CBOR *cbor)
623 {
624 enc_t enc = { 0 };
625
626 enc.cbor = *cbor;
627 enc.sv = sv_2mortal (NEWSV (0, INIT_SIZE));
628 enc.cur = SvPVX (enc.sv);
629 enc.end = SvEND (enc.sv);
630
631 SvPOK_only (enc.sv);
632
633 if (cbor->flags & F_PACK_STRINGS)
634 {
635 encode_tag (&enc, CBOR_TAG_STRINGREF_NAMESPACE);
636 enc.stringref[0]= (HV *)sv_2mortal ((SV *)newHV ());
637 enc.stringref[1]= (HV *)sv_2mortal ((SV *)newHV ());
638 }
639
640 encode_sv (&enc, scalar);
641
642 SvCUR_set (enc.sv, enc.cur - SvPVX (enc.sv));
643 *SvEND (enc.sv) = 0; // many xs functions expect a trailing 0 for text strings
644
645 if (enc.cbor.flags & F_SHRINK)
646 shrink (enc.sv);
647
648 return enc.sv;
649 }
650
651 /////////////////////////////////////////////////////////////////////////////
652 // decoder
653
654 // structure used for decoding CBOR
655 typedef struct
656 {
657 U8 *cur; // current parser pointer
658 U8 *end; // end of input string
659 const char *err; // parse error, if != 0
660 CBOR cbor;
661 U32 depth; // recursion depth
662 U32 maxdepth; // recursion depth limit
663 AV *shareable;
664 AV *stringref;
665 SV *decode_tagged;
666 } dec_t;
667
668 #define ERR(reason) SB if (!dec->err) dec->err = reason; goto fail; SE
669
670 #define WANT(len) if (ecb_expect_false (dec->cur + len > dec->end)) ERR ("unexpected end of CBOR data")
671
672 #define DEC_INC_DEPTH if (++dec->depth > dec->cbor.max_depth) ERR (ERR_NESTING_EXCEEDED)
673 #define DEC_DEC_DEPTH --dec->depth
674
675 static UV
676 decode_uint (dec_t *dec)
677 {
678 U8 m = *dec->cur & MINOR_MASK;
679 ++dec->cur;
680
681 if (ecb_expect_true (m < LENGTH_EXT1))
682 return m;
683 else if (ecb_expect_true (m == LENGTH_EXT1))
684 {
685 WANT (1);
686 dec->cur += 1;
687 return dec->cur[-1];
688 }
689 else if (ecb_expect_true (m == LENGTH_EXT2))
690 {
691 WANT (2);
692 dec->cur += 2;
693 return (((UV)dec->cur[-2]) << 8)
694 | ((UV)dec->cur[-1]);
695 }
696 else if (ecb_expect_true (m == LENGTH_EXT4))
697 {
698 WANT (4);
699 dec->cur += 4;
700 return (((UV)dec->cur[-4]) << 24)
701 | (((UV)dec->cur[-3]) << 16)
702 | (((UV)dec->cur[-2]) << 8)
703 | ((UV)dec->cur[-1]);
704 }
705 else if (ecb_expect_true (m == LENGTH_EXT8))
706 {
707 WANT (8);
708 dec->cur += 8;
709
710 return
711 #if UVSIZE < 8
712 0
713 #else
714 (((UV)dec->cur[-8]) << 56)
715 | (((UV)dec->cur[-7]) << 48)
716 | (((UV)dec->cur[-6]) << 40)
717 | (((UV)dec->cur[-5]) << 32)
718 #endif
719 | (((UV)dec->cur[-4]) << 24)
720 | (((UV)dec->cur[-3]) << 16)
721 | (((UV)dec->cur[-2]) << 8)
722 | ((UV)dec->cur[-1]);
723 }
724 else
725 ERR ("corrupted CBOR data (unsupported integer minor encoding)");
726
727 fail:
728 return 0;
729 }
730
731 static SV *decode_sv (dec_t *dec);
732
733 static SV *
734 decode_av (dec_t *dec)
735 {
736 AV *av = newAV ();
737
738 DEC_INC_DEPTH;
739
740 if (*dec->cur == (MAJOR_ARRAY | MINOR_INDEF))
741 {
742 ++dec->cur;
743
744 for (;;)
745 {
746 WANT (1);
747
748 if (*dec->cur == (MAJOR_MISC | MINOR_INDEF))
749 {
750 ++dec->cur;
751 break;
752 }
753
754 av_push (av, decode_sv (dec));
755 }
756 }
757 else
758 {
759 int i, len = decode_uint (dec);
760
761 WANT (len); // complexity check for av_fill - need at least one byte per value, do not allow supersize arrays
762 av_fill (av, len - 1);
763
764 for (i = 0; i < len; ++i)
765 AvARRAY (av)[i] = decode_sv (dec);
766 }
767
768 DEC_DEC_DEPTH;
769 return newRV_noinc ((SV *)av);
770
771 fail:
772 SvREFCNT_dec (av);
773 DEC_DEC_DEPTH;
774 return &PL_sv_undef;
775 }
776
777 static void
778 decode_he (dec_t *dec, HV *hv)
779 {
780 // for speed reasons, we specialcase single-string
781 // byte or utf-8 strings as keys, but only when !stringref
782
783 if (ecb_expect_true (!dec->stringref))
784 if (ecb_expect_true ((U8)(*dec->cur - MAJOR_BYTES) <= LENGTH_EXT8))
785 {
786 I32 len = decode_uint (dec);
787 char *key = (char *)dec->cur;
788
789 WANT (len);
790 dec->cur += len;
791
792 hv_store (hv, key, len, decode_sv (dec), 0);
793
794 return;
795 }
796 else if (ecb_expect_true ((U8)(*dec->cur - MAJOR_TEXT) <= LENGTH_EXT8))
797 {
798 I32 len = decode_uint (dec);
799 char *key = (char *)dec->cur;
800
801 WANT (len);
802 dec->cur += len;
803
804 if (ecb_expect_false (dec->cbor.flags & F_VALIDATE_UTF8))
805 if (!is_utf8_string (key, len))
806 ERR ("corrupted CBOR data (invalid UTF-8 in map key)");
807
808 hv_store (hv, key, -len, decode_sv (dec), 0);
809
810 return;
811 }
812
813 SV *k = decode_sv (dec);
814 SV *v = decode_sv (dec);
815
816 hv_store_ent (hv, k, v, 0);
817 SvREFCNT_dec (k);
818
819 fail:
820 ;
821 }
822
823 static SV *
824 decode_hv (dec_t *dec)
825 {
826 HV *hv = newHV ();
827
828 DEC_INC_DEPTH;
829
830 if (*dec->cur == (MAJOR_MAP | MINOR_INDEF))
831 {
832 ++dec->cur;
833
834 for (;;)
835 {
836 WANT (1);
837
838 if (*dec->cur == (MAJOR_MISC | MINOR_INDEF))
839 {
840 ++dec->cur;
841 break;
842 }
843
844 decode_he (dec, hv);
845 }
846 }
847 else
848 {
849 int pairs = decode_uint (dec);
850
851 while (pairs--)
852 decode_he (dec, hv);
853 }
854
855 DEC_DEC_DEPTH;
856 return newRV_noinc ((SV *)hv);
857
858 fail:
859 SvREFCNT_dec (hv);
860 DEC_DEC_DEPTH;
861 return &PL_sv_undef;
862 }
863
864 static SV *
865 decode_str (dec_t *dec, int utf8)
866 {
867 SV *sv = 0;
868
869 if ((*dec->cur & MINOR_MASK) == MINOR_INDEF)
870 {
871 // indefinite length strings
872 ++dec->cur;
873
874 U8 major = *dec->cur & MAJOR_MISC;
875
876 sv = newSVpvn ("", 0);
877
878 for (;;)
879 {
880 WANT (1);
881
882 if ((*dec->cur - major) > LENGTH_EXT8)
883 if (*dec->cur == (MAJOR_MISC | MINOR_INDEF))
884 {
885 ++dec->cur;
886 break;
887 }
888 else
889 ERR ("corrupted CBOR data (invalid chunks in indefinite length string)");
890
891 STRLEN len = decode_uint (dec);
892
893 WANT (len);
894 sv_catpvn (sv, dec->cur, len);
895 dec->cur += len;
896 }
897 }
898 else
899 {
900 STRLEN len = decode_uint (dec);
901
902 WANT (len);
903 sv = newSVpvn (dec->cur, len);
904 dec->cur += len;
905
906 if (ecb_expect_false (dec->stringref)
907 && SvCUR (sv) >= minimum_string_length (AvFILLp (dec->stringref) + 1))
908 av_push (dec->stringref, SvREFCNT_inc_NN (sv));
909 }
910
911 if (utf8)
912 {
913 if (ecb_expect_false (dec->cbor.flags & F_VALIDATE_UTF8))
914 if (!is_utf8_string (SvPVX (sv), SvCUR (sv)))
915 ERR ("corrupted CBOR data (invalid UTF-8 in text string)");
916
917 SvUTF8_on (sv);
918 }
919
920 return sv;
921
922 fail:
923 SvREFCNT_dec (sv);
924 return &PL_sv_undef;
925 }
926
927 static SV *
928 decode_tagged (dec_t *dec)
929 {
930 SV *sv = 0;
931 UV tag = decode_uint (dec);
932
933 WANT (1);
934
935 switch (tag)
936 {
937 case CBOR_TAG_MAGIC:
938 sv = decode_sv (dec);
939 break;
940
941 case CBOR_TAG_INDIRECTION:
942 sv = newRV_noinc (decode_sv (dec));
943 break;
944
945 case CBOR_TAG_STRINGREF_NAMESPACE:
946 {
947 ENTER; SAVETMPS;
948
949 SAVESPTR (dec->stringref);
950 dec->stringref = (AV *)sv_2mortal ((SV *)newAV ());
951
952 sv = decode_sv (dec);
953
954 FREETMPS; LEAVE;
955 }
956 break;
957
958 case CBOR_TAG_STRINGREF:
959 {
960 if ((*dec->cur >> MAJOR_SHIFT) != (MAJOR_POS_INT >> MAJOR_SHIFT))
961 ERR ("corrupted CBOR data (stringref index not an unsigned integer)");
962
963 UV idx = decode_uint (dec);
964
965 if (!dec->stringref || (int)idx > AvFILLp (dec->stringref))
966 ERR ("corrupted CBOR data (stringref index out of bounds or outside namespace)");
967
968 sv = newSVsv (AvARRAY (dec->stringref)[idx]);
969 }
970 break;
971
972 case CBOR_TAG_VALUE_SHAREABLE:
973 {
974 if (ecb_expect_false (!dec->shareable))
975 dec->shareable = (AV *)sv_2mortal ((SV *)newAV ());
976
977 if (dec->cbor.flags & F_ALLOW_CYCLES)
978 {
979 sv = newSV (0);
980 av_push (dec->shareable, SvREFCNT_inc_NN (sv));
981
982 SV *osv = decode_sv (dec);
983 sv_setsv (sv, osv);
984 SvREFCNT_dec_NN (osv);
985 }
986 else
987 {
988 av_push (dec->shareable, &PL_sv_undef);
989 int idx = AvFILLp (dec->shareable);
990 sv = decode_sv (dec);
991 av_store (dec->shareable, idx, SvREFCNT_inc_NN (sv));
992 }
993 }
994 break;
995
996 case CBOR_TAG_VALUE_SHAREDREF:
997 {
998 if ((*dec->cur >> MAJOR_SHIFT) != (MAJOR_POS_INT >> MAJOR_SHIFT))
999 ERR ("corrupted CBOR data (sharedref index not an unsigned integer)");
1000
1001 UV idx = decode_uint (dec);
1002
1003 if (!dec->shareable || (int)idx > AvFILLp (dec->shareable))
1004 ERR ("corrupted CBOR data (sharedref index out of bounds)");
1005
1006 sv = SvREFCNT_inc_NN (AvARRAY (dec->shareable)[idx]);
1007
1008 if (sv == &PL_sv_undef)
1009 ERR ("cyclic CBOR data structure found, but allow_cycles is not enabled");
1010 }
1011 break;
1012
1013 case CBOR_TAG_PERL_OBJECT:
1014 {
1015 sv = decode_sv (dec);
1016
1017 if (!SvROK (sv) || SvTYPE (SvRV (sv)) != SVt_PVAV)
1018 ERR ("corrupted CBOR data (non-array perl object)");
1019
1020 AV *av = (AV *)SvRV (sv);
1021 int len = av_len (av) + 1;
1022 HV *stash = gv_stashsv (*av_fetch (av, 0, 1), 0);
1023
1024 if (!stash)
1025 ERR ("cannot decode perl-object (package does not exist)");
1026
1027 GV *method = gv_fetchmethod_autoload (stash, "THAW", 0);
1028
1029 if (!method)
1030 ERR ("cannot decode perl-object (package does not have a THAW method)");
1031
1032 dSP;
1033
1034 ENTER; SAVETMPS;
1035 PUSHMARK (SP);
1036 EXTEND (SP, len + 1);
1037 // we re-bless the reference to get overload and other niceties right
1038 PUSHs (*av_fetch (av, 0, 1));
1039 PUSHs (sv_cbor);
1040
1041 int i;
1042
1043 for (i = 1; i < len; ++i)
1044 PUSHs (*av_fetch (av, i, 1));
1045
1046 PUTBACK;
1047 call_sv ((SV *)GvCV (method), G_SCALAR | G_EVAL);
1048 SPAGAIN;
1049
1050 if (SvTRUE (ERRSV))
1051 {
1052 FREETMPS; LEAVE;
1053 ERR (SvPVutf8_nolen (sv_2mortal (SvREFCNT_inc (ERRSV))));
1054 }
1055
1056 SvREFCNT_dec (sv);
1057 sv = SvREFCNT_inc (POPs);
1058
1059 PUTBACK;
1060
1061 FREETMPS; LEAVE;
1062 }
1063 break;
1064
1065 default:
1066 {
1067 sv = decode_sv (dec);
1068
1069 dSP;
1070 ENTER; SAVETMPS;
1071 SAVESTACK_POS ();
1072 PUSHMARK (SP);
1073 EXTEND (SP, 2);
1074 PUSHs (newSVuv (tag));
1075 PUSHs (sv);
1076
1077 PUTBACK;
1078 int count = call_sv (dec->cbor.filter ? dec->cbor.filter : default_filter, G_ARRAY | G_EVAL);
1079 SPAGAIN;
1080
1081 if (SvTRUE (ERRSV))
1082 {
1083 FREETMPS; LEAVE;
1084 ERR (SvPVutf8_nolen (sv_2mortal (SvREFCNT_inc (ERRSV))));
1085 }
1086
1087 if (count)
1088 {
1089 SvREFCNT_dec (sv);
1090 sv = SvREFCNT_inc (POPs);
1091 }
1092 else
1093 {
1094 AV *av = newAV ();
1095 av_push (av, newSVuv (tag));
1096 av_push (av, sv);
1097
1098 HV *tagged_stash = !CBOR_SLOW || cbor_tagged_stash
1099 ? cbor_tagged_stash
1100 : gv_stashpv ("CBOR::XS::Tagged" , 1);
1101 sv = sv_bless (newRV_noinc ((SV *)av), tagged_stash);
1102 }
1103
1104 PUTBACK;
1105
1106 FREETMPS; LEAVE;
1107 }
1108 break;
1109 }
1110
1111 return sv;
1112
1113 fail:
1114 SvREFCNT_dec (sv);
1115 return &PL_sv_undef;
1116 }
1117
1118 static SV *
1119 decode_sv (dec_t *dec)
1120 {
1121 WANT (1);
1122
1123 switch (*dec->cur >> MAJOR_SHIFT)
1124 {
1125 case MAJOR_POS_INT >> MAJOR_SHIFT: return newSVuv (decode_uint (dec));
1126 case MAJOR_NEG_INT >> MAJOR_SHIFT: return newSViv (-1 - (IV)decode_uint (dec));
1127 case MAJOR_BYTES >> MAJOR_SHIFT: return decode_str (dec, 0);
1128 case MAJOR_TEXT >> MAJOR_SHIFT: return decode_str (dec, 1);
1129 case MAJOR_ARRAY >> MAJOR_SHIFT: return decode_av (dec);
1130 case MAJOR_MAP >> MAJOR_SHIFT: return decode_hv (dec);
1131 case MAJOR_TAG >> MAJOR_SHIFT: return decode_tagged (dec);
1132
1133 case MAJOR_MISC >> MAJOR_SHIFT:
1134 switch (*dec->cur++ & MINOR_MASK)
1135 {
1136 case SIMPLE_FALSE:
1137 #if CBOR_SLOW
1138 types_false = get_bool ("Types::Serialiser::false");
1139 #endif
1140 return newSVsv (types_false);
1141 case SIMPLE_TRUE:
1142 #if CBOR_SLOW
1143 types_true = get_bool ("Types::Serialiser::true");
1144 #endif
1145 return newSVsv (types_true);
1146 case SIMPLE_NULL:
1147 return newSVsv (&PL_sv_undef);
1148 case SIMPLE_UNDEF:
1149 #if CBOR_SLOW
1150 types_error = get_bool ("Types::Serialiser::error");
1151 #endif
1152 return newSVsv (types_error);
1153
1154 case MISC_FLOAT16:
1155 {
1156 WANT (2);
1157
1158 uint16_t fp = (dec->cur[0] << 8) | dec->cur[1];
1159 dec->cur += 2;
1160
1161 return newSVnv (ecb_binary16_to_float (fp));
1162 }
1163
1164 case MISC_FLOAT32:
1165 {
1166 uint32_t fp;
1167 WANT (4);
1168 memcpy (&fp, dec->cur, 4);
1169 dec->cur += 4;
1170
1171 if (!ecb_big_endian ())
1172 fp = ecb_bswap32 (fp);
1173
1174 return newSVnv (ecb_binary32_to_float (fp));
1175 }
1176
1177 case MISC_FLOAT64:
1178 {
1179 uint64_t fp;
1180 WANT (8);
1181 memcpy (&fp, dec->cur, 8);
1182 dec->cur += 8;
1183
1184 if (!ecb_big_endian ())
1185 fp = ecb_bswap64 (fp);
1186
1187 return newSVnv (ecb_binary64_to_double (fp));
1188 }
1189
1190 // 0..19 unassigned simple
1191 // 24 reserved + unassigned simple (reserved values are not encodable)
1192 // 28-30 unassigned misc
1193 // 31 break code
1194 default:
1195 ERR ("corrupted CBOR data (reserved/unassigned/unexpected major 7 value)");
1196 }
1197
1198 break;
1199 }
1200
1201 fail:
1202 return &PL_sv_undef;
1203 }
1204
1205 static SV *
1206 decode_cbor (SV *string, CBOR *cbor, char **offset_return)
1207 {
1208 dec_t dec = { 0 };
1209 SV *sv;
1210 STRLEN len;
1211 char *data = SvPVbyte (string, len);
1212
1213 if (len > cbor->max_size && cbor->max_size)
1214 croak ("attempted decode of CBOR text of %lu bytes size, but max_size is set to %lu",
1215 (unsigned long)len, (unsigned long)cbor->max_size);
1216
1217 dec.cbor = *cbor;
1218 dec.cur = (U8 *)data;
1219 dec.end = (U8 *)data + len;
1220
1221 sv = decode_sv (&dec);
1222
1223 if (offset_return)
1224 *offset_return = dec.cur;
1225
1226 if (!(offset_return || !sv))
1227 if (dec.cur != dec.end && !dec.err)
1228 dec.err = "garbage after CBOR object";
1229
1230 if (dec.err)
1231 {
1232 if (dec.shareable)
1233 {
1234 // need to break cyclic links, which whould all be in shareable
1235 int i;
1236 SV **svp;
1237
1238 for (i = av_len (dec.shareable) + 1; i--; )
1239 if ((svp = av_fetch (dec.shareable, i, 0)))
1240 sv_setsv (*svp, &PL_sv_undef);
1241 }
1242
1243 SvREFCNT_dec (sv);
1244 croak ("%s, at offset %d (octet 0x%02x)", dec.err, dec.cur - (U8 *)data, (int)(uint8_t)*dec.cur);
1245 }
1246
1247 sv = sv_2mortal (sv);
1248
1249 return sv;
1250 }
1251
1252 /////////////////////////////////////////////////////////////////////////////
1253 // incremental parser
1254
1255 #define INCR_DONE(cbor) (AvFILLp (cbor->incr_count) < 0)
1256
1257 // returns 0 for notyet, 1 for success or error
1258 static int
1259 incr_parse (CBOR *self, SV *cborstr)
1260 {
1261 STRLEN cur;
1262 SvPV (cborstr, cur);
1263
1264 while (ecb_expect_true (self->incr_need <= cur))
1265 {
1266 // table of integer count bytes
1267 static I8 incr_len[MINOR_MASK + 1] = {
1268 0, 0, 0, 0, 0, 0, 0, 0,
1269 0, 0, 0, 0, 0, 0, 0, 0,
1270 0, 0, 0, 0, 0, 0, 0, 0,
1271 1, 2, 4, 8,-1,-1,-1,-2
1272 };
1273
1274 const U8 *p = SvPVX (cborstr) + self->incr_pos;
1275 U8 m = *p & MINOR_MASK;
1276 IV count = SvIVX (AvARRAY (self->incr_count)[AvFILLp (self->incr_count)]);
1277 I8 ilen = incr_len[m];
1278
1279 self->incr_need = self->incr_pos + 1;
1280
1281 if (ecb_expect_false (ilen < 0))
1282 {
1283 if (m != MINOR_INDEF)
1284 return 1; // error
1285
1286 if (*p == (MAJOR_MISC | MINOR_INDEF))
1287 {
1288 if (count >= 0)
1289 return 1; // error
1290
1291 count = 1;
1292 }
1293 else
1294 {
1295 av_push (self->incr_count, newSViv (-1)); //TODO: nest
1296 count = -1;
1297 }
1298 }
1299 else
1300 {
1301 self->incr_need += ilen;
1302 if (ecb_expect_false (self->incr_need > cur))
1303 return 0;
1304
1305 int major = *p >> MAJOR_SHIFT;
1306
1307 switch (major)
1308 {
1309 case MAJOR_TAG >> MAJOR_SHIFT:
1310 ++count; // tags merely prefix another value
1311 break;
1312
1313 case MAJOR_BYTES >> MAJOR_SHIFT:
1314 case MAJOR_TEXT >> MAJOR_SHIFT:
1315 case MAJOR_ARRAY >> MAJOR_SHIFT:
1316 case MAJOR_MAP >> MAJOR_SHIFT:
1317 {
1318 UV len;
1319
1320 if (ecb_expect_false (ilen))
1321 {
1322 len = 0;
1323
1324 do {
1325 len = (len << 8) | *++p;
1326 } while (--ilen);
1327 }
1328 else
1329 len = m;
1330
1331 switch (major)
1332 {
1333 case MAJOR_BYTES >> MAJOR_SHIFT:
1334 case MAJOR_TEXT >> MAJOR_SHIFT:
1335 self->incr_need += len;
1336 if (ecb_expect_false (self->incr_need > cur))
1337 return 0;
1338
1339 break;
1340
1341 case MAJOR_MAP >> MAJOR_SHIFT:
1342 len <<= 1;
1343 case MAJOR_ARRAY >> MAJOR_SHIFT:
1344 if (len)
1345 {
1346 av_push (self->incr_count, newSViv (len + 1)); //TODO: nest
1347 count = len + 1;
1348 }
1349 break;
1350 }
1351 }
1352 }
1353 }
1354
1355 self->incr_pos = self->incr_need;
1356
1357 if (count > 0)
1358 {
1359 while (!--count)
1360 {
1361 if (!AvFILLp (self->incr_count))
1362 return 1; // done
1363
1364 SvREFCNT_dec_NN (av_pop (self->incr_count));
1365 count = SvIVX (AvARRAY (self->incr_count)[AvFILLp (self->incr_count)]);
1366 }
1367
1368 SvIVX (AvARRAY (self->incr_count)[AvFILLp (self->incr_count)]) = count;
1369 }
1370 }
1371
1372 return 0;
1373 }
1374
1375
1376 /////////////////////////////////////////////////////////////////////////////
1377 // XS interface functions
1378
1379 MODULE = CBOR::XS PACKAGE = CBOR::XS
1380
1381 BOOT:
1382 {
1383 cbor_stash = gv_stashpv ("CBOR::XS" , 1);
1384 cbor_tagged_stash = gv_stashpv ("CBOR::XS::Tagged" , 1);
1385
1386 types_boolean_stash = gv_stashpv ("Types::Serialiser::Boolean", 1);
1387 types_error_stash = gv_stashpv ("Types::Serialiser::Error" , 1);
1388
1389 types_true = get_bool ("Types::Serialiser::true" );
1390 types_false = get_bool ("Types::Serialiser::false");
1391 types_error = get_bool ("Types::Serialiser::error");
1392
1393 default_filter = newSVpv ("CBOR::XS::default_filter", 0);
1394
1395 sv_cbor = newSVpv ("CBOR", 0);
1396 SvREADONLY_on (sv_cbor);
1397 }
1398
1399 PROTOTYPES: DISABLE
1400
1401 void CLONE (...)
1402 CODE:
1403 cbor_stash = 0;
1404 cbor_tagged_stash = 0;
1405 types_error_stash = 0;
1406 types_boolean_stash = 0;
1407
1408 void new (char *klass)
1409 PPCODE:
1410 {
1411 SV *pv = NEWSV (0, sizeof (CBOR));
1412 SvPOK_only (pv);
1413 cbor_init ((CBOR *)SvPVX (pv));
1414 XPUSHs (sv_2mortal (sv_bless (
1415 newRV_noinc (pv),
1416 strEQ (klass, "CBOR::XS") ? CBOR_STASH : gv_stashpv (klass, 1)
1417 )));
1418 }
1419
1420 void shrink (CBOR *self, int enable = 1)
1421 ALIAS:
1422 shrink = F_SHRINK
1423 allow_unknown = F_ALLOW_UNKNOWN
1424 allow_sharing = F_ALLOW_SHARING
1425 allow_cycles = F_ALLOW_CYCLES
1426 pack_strings = F_PACK_STRINGS
1427 utf8_strings = F_UTF8_STRINGS
1428 validate_utf8 = F_VALIDATE_UTF8
1429 PPCODE:
1430 {
1431 if (enable)
1432 self->flags |= ix;
1433 else
1434 self->flags &= ~ix;
1435
1436 XPUSHs (ST (0));
1437 }
1438
1439 void get_shrink (CBOR *self)
1440 ALIAS:
1441 get_shrink = F_SHRINK
1442 get_allow_unknown = F_ALLOW_UNKNOWN
1443 get_allow_sharing = F_ALLOW_SHARING
1444 get_allow_cycles = F_ALLOW_CYCLES
1445 get_pack_strings = F_PACK_STRINGS
1446 get_validate_utf8 = F_VALIDATE_UTF8
1447 PPCODE:
1448 XPUSHs (boolSV (self->flags & ix));
1449
1450 void max_depth (CBOR *self, U32 max_depth = 0x80000000UL)
1451 PPCODE:
1452 self->max_depth = max_depth;
1453 XPUSHs (ST (0));
1454
1455 U32 get_max_depth (CBOR *self)
1456 CODE:
1457 RETVAL = self->max_depth;
1458 OUTPUT:
1459 RETVAL
1460
1461 void max_size (CBOR *self, U32 max_size = 0)
1462 PPCODE:
1463 self->max_size = max_size;
1464 XPUSHs (ST (0));
1465
1466 int get_max_size (CBOR *self)
1467 CODE:
1468 RETVAL = self->max_size;
1469 OUTPUT:
1470 RETVAL
1471
1472 void filter (CBOR *self, SV *filter = 0)
1473 PPCODE:
1474 SvREFCNT_dec (self->filter);
1475 self->filter = filter ? newSVsv (filter) : filter;
1476 XPUSHs (ST (0));
1477
1478 SV *get_filter (CBOR *self)
1479 CODE:
1480 RETVAL = self->filter ? self->filter : NEWSV (0, 0);
1481 OUTPUT:
1482 RETVAL
1483
1484 void encode (CBOR *self, SV *scalar)
1485 PPCODE:
1486 PUTBACK; scalar = encode_cbor (scalar, self); SPAGAIN;
1487 XPUSHs (scalar);
1488
1489 void decode (CBOR *self, SV *cborstr)
1490 PPCODE:
1491 PUTBACK; cborstr = decode_cbor (cborstr, self, 0); SPAGAIN;
1492 XPUSHs (cborstr);
1493
1494 void decode_prefix (CBOR *self, SV *cborstr)
1495 PPCODE:
1496 {
1497 SV *sv;
1498 char *offset;
1499 PUTBACK; sv = decode_cbor (cborstr, self, &offset); SPAGAIN;
1500 EXTEND (SP, 2);
1501 PUSHs (sv);
1502 PUSHs (sv_2mortal (newSVuv (offset - SvPVX (cborstr))));
1503 }
1504
1505 void incr_parse (CBOR *self, SV *cborstr)
1506 ALIAS:
1507 incr_parse_multiple = 1
1508 PPCODE:
1509 {
1510 if (SvUTF8 (cborstr))
1511 sv_utf8_downgrade (cborstr, 0);
1512
1513 if (!self->incr_count)
1514 {
1515 self->incr_count = newAV ();
1516 self->incr_pos = 0;
1517 self->incr_need = 1;
1518
1519 av_push (self->incr_count, newSViv (1));
1520 }
1521
1522 do
1523 {
1524 if (!incr_parse (self, cborstr))
1525 {
1526 if (self->incr_need > self->max_size && self->max_size)
1527 croak ("attempted decode of CBOR text of %lu bytes size, but max_size is set to %lu",
1528 (unsigned long)self->incr_need, (unsigned long)self->max_size);
1529
1530 break;
1531 }
1532
1533 SV *sv;
1534 char *offset;
1535
1536 PUTBACK; sv = decode_cbor (cborstr, self, &offset); SPAGAIN;
1537 XPUSHs (sv);
1538
1539 sv_chop (cborstr, offset);
1540
1541 av_clear (self->incr_count);
1542 av_push (self->incr_count, newSViv (1));
1543
1544 self->incr_pos = 0;
1545 self->incr_need = self->incr_pos + 1;
1546 }
1547 while (ix);
1548 }
1549
1550 void incr_reset (CBOR *self)
1551 CODE:
1552 {
1553 SvREFCNT_dec (self->incr_count);
1554 self->incr_count = 0;
1555 }
1556
1557 void DESTROY (CBOR *self)
1558 PPCODE:
1559 cbor_free (self);
1560
1561 PROTOTYPES: ENABLE
1562
1563 void encode_cbor (SV *scalar)
1564 ALIAS:
1565 encode_cbor = 0
1566 encode_cbor_sharing = F_ALLOW_SHARING
1567 PPCODE:
1568 {
1569 CBOR cbor;
1570 cbor_init (&cbor);
1571 cbor.flags |= ix;
1572 PUTBACK; scalar = encode_cbor (scalar, &cbor); SPAGAIN;
1573 XPUSHs (scalar);
1574 }
1575
1576 void decode_cbor (SV *cborstr)
1577 PPCODE:
1578 {
1579 CBOR cbor;
1580 cbor_init (&cbor);
1581 PUTBACK; cborstr = decode_cbor (cborstr, &cbor, 0); SPAGAIN;
1582 XPUSHs (cborstr);
1583 }
1584