ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/CBOR-XS/XS.xs
Revision: 1.58
Committed: Fri Nov 25 13:27:29 2016 UTC (7 years, 5 months ago) by root
Branch: MAIN
Changes since 1.57: +7 -3 lines
Log Message:
*** empty log message ***

File Contents

# Content
1 #include "EXTERN.h"
2 #include "perl.h"
3 #include "XSUB.h"
4
5 #include <assert.h>
6 #include <string.h>
7 #include <stdlib.h>
8 #include <stdio.h>
9 #include <limits.h>
10 #include <float.h>
11
12 #define ECB_NO_THREADS 1
13 #include "ecb.h"
14
// Fallback definitions for accessor macros that perls older than 5.18
// do not provide; each one is only defined when perl itself did not.
#if !defined (HvNAMELEN_get)
# define HvNAMELEN_get(hv) strlen (HvNAME (hv))
#endif

#if !defined (HvNAMELEN)
# define HvNAMELEN(hv) HvNAMELEN_get (hv)
#endif

#if !defined (HvNAMEUTF8)
# define HvNAMEUTF8(hv) 0
#endif

#if !defined (SvREFCNT_dec_NN)
# define SvREFCNT_dec_NN(sv) SvREFCNT_dec (sv)
#endif
28
// Initial-byte layout: the top three bits select the major type, the low
// five bits are the minor value (immediate value, length marker or subtype).
enum cbor_type
{
  MAJOR_SHIFT = 5,
  MINOR_MASK  = 0x1f,

  // major types, already shifted into position
  MAJOR_POS_INT = 0 << MAJOR_SHIFT,
  MAJOR_NEG_INT = 1 << MAJOR_SHIFT,
  MAJOR_BYTES   = 2 << MAJOR_SHIFT,
  MAJOR_TEXT    = 3 << MAJOR_SHIFT,
  MAJOR_ARRAY   = 4 << MAJOR_SHIFT,
  MAJOR_MAP     = 5 << MAJOR_SHIFT,
  MAJOR_TAG     = 6 << MAJOR_SHIFT,
  MAJOR_MISC    = 7 << MAJOR_SHIFT,

  // minor values for INT/STRING/ARRAY/MAP: the value/length follows
  // in 1, 2, 4 or 8 extra bytes
  LENGTH_EXT1 = 24,
  LENGTH_EXT2 = 25,
  LENGTH_EXT4 = 26,
  LENGTH_EXT8 = 27,

  // simple values (minor values of MAJOR_MISC)
  SIMPLE_FALSE = 20,
  SIMPLE_TRUE  = 21,
  SIMPLE_NULL  = 22,
  SIMPLE_UNDEF = 23,

  // further minor values of MAJOR_MISC
  MISC_EXT1    = 24,
  MISC_FLOAT16 = 25,
  MISC_FLOAT32 = 26,
  MISC_FLOAT64 = 27,

  // indefinite-length marker for BYTES/TEXT/ARRAY/MAP
  // (MAJOR_MISC | MINOR_INDEF is the break byte)
  MINOR_INDEF = 31,
};
65
// Tag numbers this module knows by name.
enum cbor_tag
{
  // extensions
  CBOR_TAG_STRINGREF           =    25, // http://cbor.schmorp.de/stringref
  CBOR_TAG_PERL_OBJECT         =    26, // http://cbor.schmorp.de/perl-object
  CBOR_TAG_GENERIC_OBJECT      =    27, // http://cbor.schmorp.de/generic-object
  CBOR_TAG_VALUE_SHAREABLE     =    28, // http://cbor.schmorp.de/value-sharing
  CBOR_TAG_VALUE_SHAREDREF     =    29, // http://cbor.schmorp.de/value-sharing
  CBOR_TAG_STRINGREF_NAMESPACE =   256, // http://cbor.schmorp.de/stringref
  CBOR_TAG_INDIRECTION         = 22098, // http://cbor.schmorp.de/indirection

  // rfc7049
  CBOR_TAG_DATETIME   = 0, // rfc4287, utf-8
  CBOR_TAG_TIMESTAMP  = 1, // unix timestamp, any
  CBOR_TAG_POS_BIGNUM = 2, // byte string
  CBOR_TAG_NEG_BIGNUM = 3, // byte string
  CBOR_TAG_DECIMAL    = 4, // decimal fraction, array
  CBOR_TAG_BIGFLOAT   = 5, // array

  CBOR_TAG_CONV_B64U = 21, // base64url, any
  CBOR_TAG_CONV_B64  = 22, // base64, any
  CBOR_TAG_CONV_HEX  = 23, // base16, any
  CBOR_TAG_CBOR      = 24, // embedded cbor, byte string

  CBOR_TAG_URI   = 32, // URI rfc3986, utf-8
  CBOR_TAG_B64U  = 33, // base64url rfc4648, utf-8
  CBOR_TAG_B64   = 34, // base64 rfc4648, utf-8
  CBOR_TAG_REGEX = 35, // regex pcre/ecma262, utf-8
  CBOR_TAG_MIME  = 36, // mime message rfc2045, utf-8

  CBOR_TAG_MAGIC = 55799, // self-describe cbor
};
99
// option bits kept in the flags member of the CBOR struct
#define F_SHRINK        0x00000001UL
#define F_ALLOW_UNKNOWN 0x00000002UL
#define F_ALLOW_SHARING 0x00000004UL
#define F_ALLOW_CYCLES  0x00000008UL
#define F_PACK_STRINGS  0x00000010UL
#define F_TEXT_KEYS     0x00000020UL
#define F_TEXT_STRINGS  0x00000040UL
#define F_VALIDATE_UTF8 0x00000080UL

#define INIT_SIZE 32 // initial scalar size to be allocated

// brackets that turn a statement list inside a macro into one statement
#define SB do {
#define SE } while (0)

// true when beg <= val <= end, evaluated with a single unsigned comparison
#define IN_RANGE_INC(type,val,beg,end) \
  ((unsigned type)((unsigned type)(val) - (unsigned type)(beg)) \
  <= (unsigned type)((unsigned type)(end) - (unsigned type)(beg)))

#define ERR_NESTING_EXCEEDED "cbor text or perl structure exceeds maximum nesting level (max_depth set too low?)"

// with ithreads the cached stash pointer may be unset, so fall back to
// looking the stash up by name
#if defined (USE_ITHREADS)
# define CBOR_SLOW 1
# define CBOR_STASH (cbor_stash ? cbor_stash : gv_stashpv ("CBOR::XS", 1))
#else
# define CBOR_SLOW 0
# define CBOR_STASH cbor_stash
#endif
127
128 static HV *cbor_stash, *types_boolean_stash, *types_error_stash, *cbor_tagged_stash; // CBOR::XS::
129 static SV *types_true, *types_false, *types_error, *sv_cbor, *default_filter;
130
131 typedef struct {
132 U32 flags;
133 U32 max_depth;
134 STRLEN max_size;
135 SV *filter;
136
137 // for the incremental parser
138 STRLEN incr_pos; // the current offset into the text
139 STRLEN incr_need; // minimum bytes needed to decode
140 AV *incr_count; // for every nesting level, the number of outstanding values, or -1 for indef.
141 } CBOR;
142
143 ecb_inline void
144 cbor_init (CBOR *cbor)
145 {
146 Zero (cbor, 1, CBOR);
147 cbor->max_depth = 512;
148 }
149
150 ecb_inline void
151 cbor_free (CBOR *cbor)
152 {
153 SvREFCNT_dec (cbor->filter);
154 SvREFCNT_dec (cbor->incr_count);
155 }
156
157 /////////////////////////////////////////////////////////////////////////////
158 // utility functions
159
160 ecb_inline SV *
161 get_bool (const char *name)
162 {
163 SV *sv = get_sv (name, 1);
164
165 SvREADONLY_on (sv);
166 SvREADONLY_on (SvRV (sv));
167
168 return sv;
169 }
170
171 ecb_inline void
172 shrink (SV *sv)
173 {
174 sv_utf8_downgrade (sv, 1);
175
176 if (SvLEN (sv) > SvCUR (sv) + 1)
177 {
178 #ifdef SvPV_shrink_to_cur
179 SvPV_shrink_to_cur (sv);
180 #elif defined (SvPV_renew)
181 SvPV_renew (sv, SvCUR (sv) + 1);
182 #endif
183 }
184 }
185
186 // minimum length of a string to be registered for stringref
187 ecb_inline int
188 minimum_string_length (UV idx)
189 {
190 return idx > 23
191 ? idx > 0xffU
192 ? idx > 0xffffU
193 ? idx > 0xffffffffU
194 ? 11
195 : 7
196 : 5
197 : 4
198 : 3;
199 }
200
201 /////////////////////////////////////////////////////////////////////////////
202 // encoder
203
204 // structure used for encoding CBOR
205 typedef struct
206 {
207 char *cur; // SvPVX (sv) + current output position
208 char *end; // SvEND (sv)
209 SV *sv; // result scalar
210 CBOR cbor;
211 U32 depth; // recursion level
212 HV *stringref[2]; // string => index, or 0 ([0] = bytes, [1] = utf-8)
213 UV stringref_idx;
214 HV *shareable; // ptr => index, or 0
215 UV shareable_idx;
216 } enc_t;
217
218 ecb_inline void
219 need (enc_t *enc, STRLEN len)
220 {
221 if (ecb_expect_false (enc->cur + len >= enc->end))
222 {
223 STRLEN cur = enc->cur - (char *)SvPVX (enc->sv);
224 SvGROW (enc->sv, cur + (len < (cur >> 2) ? cur >> 2 : len) + 1);
225 enc->cur = SvPVX (enc->sv) + cur;
226 enc->end = SvPVX (enc->sv) + SvLEN (enc->sv) - 1;
227 }
228 }
229
230 ecb_inline void
231 encode_ch (enc_t *enc, char ch)
232 {
233 need (enc, 1);
234 *enc->cur++ = ch;
235 }
236
237 static void
238 encode_uint (enc_t *enc, int major, UV len)
239 {
240 need (enc, 9);
241
242 if (ecb_expect_true (len < LENGTH_EXT1))
243 *enc->cur++ = major | len;
244 else if (ecb_expect_true (len <= 0xffU))
245 {
246 *enc->cur++ = major | LENGTH_EXT1;
247 *enc->cur++ = len;
248 }
249 else if (len <= 0xffffU)
250 {
251 *enc->cur++ = major | LENGTH_EXT2;
252 *enc->cur++ = len >> 8;
253 *enc->cur++ = len;
254 }
255 else if (len <= 0xffffffffU)
256 {
257 *enc->cur++ = major | LENGTH_EXT4;
258 *enc->cur++ = len >> 24;
259 *enc->cur++ = len >> 16;
260 *enc->cur++ = len >> 8;
261 *enc->cur++ = len;
262 }
263 else
264 {
265 *enc->cur++ = major | LENGTH_EXT8;
266 *enc->cur++ = len >> 56;
267 *enc->cur++ = len >> 48;
268 *enc->cur++ = len >> 40;
269 *enc->cur++ = len >> 32;
270 *enc->cur++ = len >> 24;
271 *enc->cur++ = len >> 16;
272 *enc->cur++ = len >> 8;
273 *enc->cur++ = len;
274 }
275 }
276
277 ecb_inline void
278 encode_tag (enc_t *enc, UV tag)
279 {
280 encode_uint (enc, MAJOR_TAG, tag);
281 }
282
283 // exceptional (hopefully) slow path for byte strings that need to be utf8-encoded
284 ecb_noinline static void
285 encode_str_utf8 (enc_t *enc, int utf8, char *str, STRLEN len)
286 {
287 STRLEN ulen = len;
288 U8 *p, *pend = (U8 *)str + len;
289
290 for (p = (U8 *)str; p < pend; ++p)
291 ulen += *p >> 7; // count set high bits
292
293 encode_uint (enc, MAJOR_TEXT, ulen);
294
295 need (enc, ulen);
296 for (p = (U8 *)str; p < pend; ++p)
297 if (*p < 0x80)
298 *enc->cur++ = *p;
299 else
300 {
301 *enc->cur++ = 0xc0 + (*p >> 6);
302 *enc->cur++ = 0x80 + (*p & 63);
303 }
304 }
305
306 ecb_inline void
307 encode_str (enc_t *enc, int upgrade_utf8, int utf8, char *str, STRLEN len)
308 {
309 if (ecb_expect_false (upgrade_utf8))
310 if (!utf8)
311 {
312 encode_str_utf8 (enc, utf8, str, len);
313 return;
314 }
315
316 encode_uint (enc, utf8 ? MAJOR_TEXT : MAJOR_BYTES, len);
317 need (enc, len);
318 memcpy (enc->cur, str, len);
319 enc->cur += len;
320 }
321
322 ecb_inline void
323 encode_strref (enc_t *enc, int upgrade_utf8, int utf8, char *str, STRLEN len)
324 {
325 if (ecb_expect_false (enc->cbor.flags & F_PACK_STRINGS))
326 {
327 SV **svp = hv_fetch (enc->stringref[!!utf8], str, len, 1);
328
329 if (SvOK (*svp))
330 {
331 // already registered, use stringref
332 encode_tag (enc, CBOR_TAG_STRINGREF);
333 encode_uint (enc, MAJOR_POS_INT, SvUV (*svp));
334 return;
335 }
336 else if (len >= minimum_string_length (enc->stringref_idx))
337 {
338 // register only
339 sv_setuv (*svp, enc->stringref_idx);
340 ++enc->stringref_idx;
341 }
342 }
343
344 encode_str (enc, upgrade_utf8, utf8, str, len);
345 }
346
347 static void encode_sv (enc_t *enc, SV *sv);
348
349 static void
350 encode_av (enc_t *enc, AV *av)
351 {
352 int i, len = av_len (av);
353
354 if (enc->depth >= enc->cbor.max_depth)
355 croak (ERR_NESTING_EXCEEDED);
356
357 ++enc->depth;
358
359 encode_uint (enc, MAJOR_ARRAY, len + 1);
360
361 if (SvMAGICAL (av))
362 for (i = 0; i <= len; ++i)
363 {
364 SV **svp = av_fetch (av, i, 0);
365 encode_sv (enc, svp ? *svp : &PL_sv_undef);
366 }
367 else
368 for (i = 0; i <= len; ++i)
369 {
370 SV *sv = AvARRAY (av)[i];
371 encode_sv (enc, sv ? sv : &PL_sv_undef);
372 }
373
374 --enc->depth;
375 }
376
377 static void
378 encode_hv (enc_t *enc, HV *hv)
379 {
380 HE *he;
381
382 if (enc->depth >= enc->cbor.max_depth)
383 croak (ERR_NESTING_EXCEEDED);
384
385 ++enc->depth;
386
387 int pairs = hv_iterinit (hv);
388 int mg = SvMAGICAL (hv);
389
390 if (mg)
391 encode_ch (enc, MAJOR_MAP | MINOR_INDEF);
392 else
393 encode_uint (enc, MAJOR_MAP, pairs);
394
395 while ((he = hv_iternext (hv)))
396 {
397 if (HeKLEN (he) == HEf_SVKEY)
398 encode_sv (enc, HeSVKEY (he));
399 else
400 encode_strref (enc, enc->cbor.flags & (F_TEXT_KEYS | F_TEXT_STRINGS), HeKUTF8 (he), HeKEY (he), HeKLEN (he));
401
402 encode_sv (enc, ecb_expect_false (mg) ? hv_iterval (hv, he) : HeVAL (he));
403 }
404
405 if (mg)
406 encode_ch (enc, MAJOR_MISC | MINOR_INDEF);
407
408 --enc->depth;
409 }
410
411 // encode objects, arrays and special \0=false and \1=true values.
412 static void
413 encode_rv (enc_t *enc, SV *sv)
414 {
415 SvGETMAGIC (sv);
416
417 svtype svt = SvTYPE (sv);
418
419 if (ecb_expect_false (SvOBJECT (sv)))
420 {
421 HV *boolean_stash = !CBOR_SLOW || types_boolean_stash
422 ? types_boolean_stash
423 : gv_stashpv ("Types::Serialiser::Boolean", 1);
424 HV *error_stash = !CBOR_SLOW || types_error_stash
425 ? types_error_stash
426 : gv_stashpv ("Types::Serialiser::Error", 1);
427 HV *tagged_stash = !CBOR_SLOW || cbor_tagged_stash
428 ? cbor_tagged_stash
429 : gv_stashpv ("CBOR::XS::Tagged" , 1);
430
431 HV *stash = SvSTASH (sv);
432
433 if (stash == boolean_stash)
434 {
435 encode_ch (enc, SvIV (sv) ? MAJOR_MISC | SIMPLE_TRUE : MAJOR_MISC | SIMPLE_FALSE);
436 return;
437 }
438 else if (stash == error_stash)
439 {
440 encode_ch (enc, MAJOR_MISC | SIMPLE_UNDEF);
441 return;
442 }
443 else if (stash == tagged_stash)
444 {
445 if (svt != SVt_PVAV)
446 croak ("encountered CBOR::XS::Tagged object that isn't an array");
447
448 encode_uint (enc, MAJOR_TAG, SvUV (*av_fetch ((AV *)sv, 0, 1)));
449 encode_sv (enc, *av_fetch ((AV *)sv, 1, 1));
450
451 return;
452 }
453 }
454
455 if (ecb_expect_false (SvREFCNT (sv) > 1)
456 && ecb_expect_false (enc->cbor.flags & F_ALLOW_SHARING))
457 {
458 if (!enc->shareable)
459 enc->shareable = (HV *)sv_2mortal ((SV *)newHV ());
460
461 SV **svp = hv_fetch (enc->shareable, (char *)&sv, sizeof (sv), 1);
462
463 if (SvOK (*svp))
464 {
465 encode_tag (enc, CBOR_TAG_VALUE_SHAREDREF);
466 encode_uint (enc, MAJOR_POS_INT, SvUV (*svp));
467 return;
468 }
469 else
470 {
471 sv_setuv (*svp, enc->shareable_idx);
472 ++enc->shareable_idx;
473 encode_tag (enc, CBOR_TAG_VALUE_SHAREABLE);
474 }
475 }
476
477 if (ecb_expect_false (SvOBJECT (sv)))
478 {
479 HV *stash = SvSTASH (sv);
480 GV *method;
481
482 if ((method = gv_fetchmethod_autoload (stash, "TO_CBOR", 0)))
483 {
484 dSP;
485
486 ENTER; SAVETMPS;
487 PUSHMARK (SP);
488 // we re-bless the reference to get overload and other niceties right
489 XPUSHs (sv_bless (sv_2mortal (newRV_inc (sv)), stash));
490
491 PUTBACK;
492 // G_SCALAR ensures that return value is 1
493 call_sv ((SV *)GvCV (method), G_SCALAR);
494 SPAGAIN;
495
496 // catch this surprisingly common error
497 if (SvROK (TOPs) && SvRV (TOPs) == sv)
498 croak ("%s::TO_CBOR method returned same object as was passed instead of a new one", HvNAME (stash));
499
500 encode_sv (enc, POPs);
501
502 PUTBACK;
503
504 FREETMPS; LEAVE;
505 }
506 else if ((method = gv_fetchmethod_autoload (stash, "FREEZE", 0)) != 0)
507 {
508 dSP;
509
510 ENTER; SAVETMPS;
511 SAVESTACK_POS ();
512 PUSHMARK (SP);
513 EXTEND (SP, 2);
514 // we re-bless the reference to get overload and other niceties right
515 PUSHs (sv_bless (sv_2mortal (newRV_inc (sv)), stash));
516 PUSHs (sv_cbor);
517
518 PUTBACK;
519 int count = call_sv ((SV *)GvCV (method), G_ARRAY);
520 SPAGAIN;
521
522 // catch this surprisingly common error
523 if (count == 1 && SvROK (TOPs) && SvRV (TOPs) == sv)
524 croak ("%s::FREEZE(CBOR) method returned same object as was passed instead of a new one", HvNAME (stash));
525
526 encode_tag (enc, CBOR_TAG_PERL_OBJECT);
527 encode_uint (enc, MAJOR_ARRAY, count + 1);
528 encode_strref (enc, 0, HvNAMEUTF8 (stash), HvNAME (stash), HvNAMELEN (stash));
529
530 while (count)
531 encode_sv (enc, SP[1 - count--]);
532
533 PUTBACK;
534
535 FREETMPS; LEAVE;
536 }
537 else
538 croak ("encountered object '%s', but no TO_CBOR or FREEZE methods available on it",
539 SvPV_nolen (sv_2mortal (newRV_inc (sv))));
540 }
541 else if (svt == SVt_PVHV)
542 encode_hv (enc, (HV *)sv);
543 else if (svt == SVt_PVAV)
544 encode_av (enc, (AV *)sv);
545 else
546 {
547 encode_tag (enc, CBOR_TAG_INDIRECTION);
548 encode_sv (enc, sv);
549 }
550 }
551
552 static void
553 encode_nv (enc_t *enc, SV *sv)
554 {
555 double nv = SvNVX (sv);
556
557 need (enc, 9);
558
559 if (ecb_expect_false (nv == (NV)(U32)nv))
560 encode_uint (enc, MAJOR_POS_INT, (U32)nv);
561 //TODO: maybe I32?
562 else if (ecb_expect_false (nv == (float)nv))
563 {
564 uint32_t fp = ecb_float_to_binary32 (nv);
565
566 *enc->cur++ = MAJOR_MISC | MISC_FLOAT32;
567
568 if (!ecb_big_endian ())
569 fp = ecb_bswap32 (fp);
570
571 memcpy (enc->cur, &fp, 4);
572 enc->cur += 4;
573 }
574 else
575 {
576 uint64_t fp = ecb_double_to_binary64 (nv);
577
578 *enc->cur++ = MAJOR_MISC | MISC_FLOAT64;
579
580 if (!ecb_big_endian ())
581 fp = ecb_bswap64 (fp);
582
583 memcpy (enc->cur, &fp, 8);
584 enc->cur += 8;
585 }
586 }
587
588 static void
589 encode_sv (enc_t *enc, SV *sv)
590 {
591 SvGETMAGIC (sv);
592
593 if (SvPOKp (sv))
594 {
595 STRLEN len;
596 char *str = SvPV (sv, len);
597 encode_strref (enc, enc->cbor.flags & F_TEXT_STRINGS, SvUTF8 (sv), str, len);
598 }
599 else if (SvNOKp (sv))
600 encode_nv (enc, sv);
601 else if (SvIOKp (sv))
602 {
603 if (SvIsUV (sv))
604 encode_uint (enc, MAJOR_POS_INT, SvUVX (sv));
605 else if (SvIVX (sv) >= 0)
606 encode_uint (enc, MAJOR_POS_INT, SvIVX (sv));
607 else
608 encode_uint (enc, MAJOR_NEG_INT, -(SvIVX (sv) + 1));
609 }
610 else if (SvROK (sv))
611 encode_rv (enc, SvRV (sv));
612 else if (!SvOK (sv))
613 encode_ch (enc, MAJOR_MISC | SIMPLE_NULL);
614 else if (enc->cbor.flags & F_ALLOW_UNKNOWN)
615 encode_ch (enc, MAJOR_MISC | SIMPLE_UNDEF);
616 else
617 croak ("encountered perl type (%s,0x%x) that CBOR cannot handle, check your input data",
618 SvPV_nolen (sv), (unsigned int)SvFLAGS (sv));
619 }
620
621 static SV *
622 encode_cbor (SV *scalar, CBOR *cbor)
623 {
624 enc_t enc = { 0 };
625
626 enc.cbor = *cbor;
627 enc.sv = sv_2mortal (NEWSV (0, INIT_SIZE));
628 enc.cur = SvPVX (enc.sv);
629 enc.end = SvEND (enc.sv);
630
631 SvPOK_only (enc.sv);
632
633 if (cbor->flags & F_PACK_STRINGS)
634 {
635 encode_tag (&enc, CBOR_TAG_STRINGREF_NAMESPACE);
636 enc.stringref[0]= (HV *)sv_2mortal ((SV *)newHV ());
637 enc.stringref[1]= (HV *)sv_2mortal ((SV *)newHV ());
638 }
639
640 encode_sv (&enc, scalar);
641
642 SvCUR_set (enc.sv, enc.cur - SvPVX (enc.sv));
643 *SvEND (enc.sv) = 0; // many xs functions expect a trailing 0 for text strings
644
645 if (enc.cbor.flags & F_SHRINK)
646 shrink (enc.sv);
647
648 return enc.sv;
649 }
650
651 /////////////////////////////////////////////////////////////////////////////
652 // decoder
653
654 // structure used for decoding CBOR
655 typedef struct
656 {
657 U8 *cur; // current parser pointer
658 U8 *end; // end of input string
659 const char *err; // parse error, if != 0
660 CBOR cbor;
661 U32 depth; // recursion depth
662 U32 maxdepth; // recursion depth limit
663 AV *shareable;
664 AV *stringref;
665 SV *decode_tagged;
666 } dec_t;
667
// Decoder helper macros. All of them expect a `dec_t *dec` variable and a
// `fail:` label in the enclosing function, and each expands to a single
// statement that must be followed by a semicolon.

// record the first error reason only, then bail out to fail:
#define ERR(reason) SB if (!dec->err) dec->err = (reason); goto fail; SE

// fail unless at least len more input bytes are available
#define WANT(len) SB if (ecb_expect_false ((UV)(dec->end - dec->cur) < (UV)(len))) ERR ("unexpected end of CBOR data"); SE

// enter/leave one nesting level, failing when max_depth is exceeded
#define DEC_INC_DEPTH SB if (ecb_expect_false (++dec->depth > dec->cbor.max_depth)) ERR (ERR_NESTING_EXCEEDED); SE
#define DEC_DEC_DEPTH --dec->depth
674
675 static UV
676 decode_uint (dec_t *dec)
677 {
678 U8 m = *dec->cur & MINOR_MASK;
679 ++dec->cur;
680
681 if (ecb_expect_true (m < LENGTH_EXT1))
682 return m;
683 else if (ecb_expect_true (m == LENGTH_EXT1))
684 {
685 WANT (1);
686 dec->cur += 1;
687 return dec->cur[-1];
688 }
689 else if (ecb_expect_true (m == LENGTH_EXT2))
690 {
691 WANT (2);
692 dec->cur += 2;
693 return (((UV)dec->cur[-2]) << 8)
694 | ((UV)dec->cur[-1]);
695 }
696 else if (ecb_expect_true (m == LENGTH_EXT4))
697 {
698 WANT (4);
699 dec->cur += 4;
700 return (((UV)dec->cur[-4]) << 24)
701 | (((UV)dec->cur[-3]) << 16)
702 | (((UV)dec->cur[-2]) << 8)
703 | ((UV)dec->cur[-1]);
704 }
705 else if (ecb_expect_true (m == LENGTH_EXT8))
706 {
707 WANT (8);
708 dec->cur += 8;
709
710 return
711 #if UVSIZE < 8
712 0
713 #else
714 (((UV)dec->cur[-8]) << 56)
715 | (((UV)dec->cur[-7]) << 48)
716 | (((UV)dec->cur[-6]) << 40)
717 | (((UV)dec->cur[-5]) << 32)
718 #endif
719 | (((UV)dec->cur[-4]) << 24)
720 | (((UV)dec->cur[-3]) << 16)
721 | (((UV)dec->cur[-2]) << 8)
722 | ((UV)dec->cur[-1]);
723 }
724 else
725 ERR ("corrupted CBOR data (unsupported integer minor encoding)");
726
727 fail:
728 return 0;
729 }
730
731 static SV *decode_sv (dec_t *dec);
732
733 static SV *
734 decode_av (dec_t *dec)
735 {
736 AV *av = newAV ();
737
738 DEC_INC_DEPTH;
739
740 if (*dec->cur == (MAJOR_ARRAY | MINOR_INDEF))
741 {
742 ++dec->cur;
743
744 for (;;)
745 {
746 WANT (1);
747
748 if (*dec->cur == (MAJOR_MISC | MINOR_INDEF))
749 {
750 ++dec->cur;
751 break;
752 }
753
754 av_push (av, decode_sv (dec));
755 }
756 }
757 else
758 {
759 UV i, len = decode_uint (dec);
760
761 WANT (len); // complexity check for av_fill - need at least one byte per value, do not allow supersize arrays
762 av_fill (av, len - 1);
763
764 for (i = 0; i < len; ++i)
765 AvARRAY (av)[i] = decode_sv (dec);
766 }
767
768 DEC_DEC_DEPTH;
769 return newRV_noinc ((SV *)av);
770
771 fail:
772 SvREFCNT_dec (av);
773 DEC_DEC_DEPTH;
774 return &PL_sv_undef;
775 }
776
777 static void
778 decode_he (dec_t *dec, HV *hv)
779 {
780 // for speed reasons, we specialcase single-string
781 // byte or utf-8 strings as keys, but only when !stringref
782
783 if (ecb_expect_true (!dec->stringref))
784 if (ecb_expect_true ((U8)(*dec->cur - MAJOR_BYTES) <= LENGTH_EXT8))
785 {
786 STRLEN len = decode_uint (dec);
787 char *key = (char *)dec->cur;
788
789 WANT (len);
790 dec->cur += len;
791
792 hv_store (hv, key, len, decode_sv (dec), 0);
793
794 return;
795 }
796 else if (ecb_expect_true ((U8)(*dec->cur - MAJOR_TEXT) <= LENGTH_EXT8))
797 {
798 STRLEN len = decode_uint (dec);
799 char *key = (char *)dec->cur;
800
801 WANT (len);
802 dec->cur += len;
803
804 if (ecb_expect_false (dec->cbor.flags & F_VALIDATE_UTF8))
805 if (!is_utf8_string (key, len))
806 ERR ("corrupted CBOR data (invalid UTF-8 in map key)");
807
808 hv_store (hv, key, -len, decode_sv (dec), 0);
809
810 return;
811 }
812
813 SV *k = decode_sv (dec);
814 SV *v = decode_sv (dec);
815
816 hv_store_ent (hv, k, v, 0);
817 SvREFCNT_dec (k);
818
819 fail:
820 ;
821 }
822
823 static SV *
824 decode_hv (dec_t *dec)
825 {
826 HV *hv = newHV ();
827
828 DEC_INC_DEPTH;
829
830 if (*dec->cur == (MAJOR_MAP | MINOR_INDEF))
831 {
832 ++dec->cur;
833
834 for (;;)
835 {
836 WANT (1);
837
838 if (*dec->cur == (MAJOR_MISC | MINOR_INDEF))
839 {
840 ++dec->cur;
841 break;
842 }
843
844 decode_he (dec, hv);
845 }
846 }
847 else
848 {
849 UV pairs = decode_uint (dec);
850
851 WANT (pairs); // complexity check - need at least one byte per value, do not allow supersize hashes
852
853 while (pairs--)
854 decode_he (dec, hv);
855 }
856
857 DEC_DEC_DEPTH;
858 return newRV_noinc ((SV *)hv);
859
860 fail:
861 SvREFCNT_dec (hv);
862 DEC_DEC_DEPTH;
863 return &PL_sv_undef;
864 }
865
866 static SV *
867 decode_str (dec_t *dec, int utf8)
868 {
869 SV *sv = 0;
870
871 if ((*dec->cur & MINOR_MASK) == MINOR_INDEF)
872 {
873 // indefinite length strings
874 ++dec->cur;
875
876 U8 major = *dec->cur & MAJOR_MISC;
877
878 sv = newSVpvn ("", 0);
879
880 for (;;)
881 {
882 WANT (1);
883
884 if ((*dec->cur - major) > LENGTH_EXT8)
885 if (*dec->cur == (MAJOR_MISC | MINOR_INDEF))
886 {
887 ++dec->cur;
888 break;
889 }
890 else
891 ERR ("corrupted CBOR data (invalid chunks in indefinite length string)");
892
893 STRLEN len = decode_uint (dec);
894
895 WANT (len);
896 sv_catpvn (sv, dec->cur, len);
897 dec->cur += len;
898 }
899 }
900 else
901 {
902 STRLEN len = decode_uint (dec);
903
904 WANT (len);
905 sv = newSVpvn (dec->cur, len);
906 dec->cur += len;
907
908 if (ecb_expect_false (dec->stringref)
909 && SvCUR (sv) >= minimum_string_length (AvFILLp (dec->stringref) + 1))
910 av_push (dec->stringref, SvREFCNT_inc_NN (sv));
911 }
912
913 if (utf8)
914 {
915 if (ecb_expect_false (dec->cbor.flags & F_VALIDATE_UTF8))
916 if (!is_utf8_string (SvPVX (sv), SvCUR (sv)))
917 ERR ("corrupted CBOR data (invalid UTF-8 in text string)");
918
919 SvUTF8_on (sv);
920 }
921
922 return sv;
923
924 fail:
925 SvREFCNT_dec (sv);
926 return &PL_sv_undef;
927 }
928
929 static SV *
930 decode_tagged (dec_t *dec)
931 {
932 SV *sv = 0;
933 UV tag = decode_uint (dec);
934
935 WANT (1);
936
937 switch (tag)
938 {
939 case CBOR_TAG_MAGIC:
940 sv = decode_sv (dec);
941 break;
942
943 case CBOR_TAG_INDIRECTION:
944 sv = newRV_noinc (decode_sv (dec));
945 break;
946
947 case CBOR_TAG_STRINGREF_NAMESPACE:
948 {
949 // do nmot use SAVETMPS/FREETMPS, as these will
950 // erase mortalised caches, e.g. "shareable"
951 ENTER;
952
953 SAVESPTR (dec->stringref);
954 dec->stringref = (AV *)sv_2mortal ((SV *)newAV ());
955
956 sv = decode_sv (dec);
957
958 LEAVE;
959 }
960 break;
961
962 case CBOR_TAG_STRINGREF:
963 {
964 if ((*dec->cur >> MAJOR_SHIFT) != (MAJOR_POS_INT >> MAJOR_SHIFT))
965 ERR ("corrupted CBOR data (stringref index not an unsigned integer)");
966
967 UV idx = decode_uint (dec);
968
969 if (!dec->stringref || (int)idx > AvFILLp (dec->stringref))
970 ERR ("corrupted CBOR data (stringref index out of bounds or outside namespace)");
971
972 sv = newSVsv (AvARRAY (dec->stringref)[idx]);
973 }
974 break;
975
976 case CBOR_TAG_VALUE_SHAREABLE:
977 {
978 if (ecb_expect_false (!dec->shareable))
979 dec->shareable = (AV *)sv_2mortal ((SV *)newAV ());
980
981 if (dec->cbor.flags & F_ALLOW_CYCLES)
982 {
983 sv = newSV (0);
984 av_push (dec->shareable, SvREFCNT_inc_NN (sv));
985
986 SV *osv = decode_sv (dec);
987 sv_setsv (sv, osv);
988 SvREFCNT_dec_NN (osv);
989 }
990 else
991 {
992 av_push (dec->shareable, &PL_sv_undef);
993 int idx = AvFILLp (dec->shareable);
994 sv = decode_sv (dec);
995 av_store (dec->shareable, idx, SvREFCNT_inc_NN (sv));
996 }
997 }
998 break;
999
1000 case CBOR_TAG_VALUE_SHAREDREF:
1001 {
1002 if ((*dec->cur >> MAJOR_SHIFT) != (MAJOR_POS_INT >> MAJOR_SHIFT))
1003 ERR ("corrupted CBOR data (sharedref index not an unsigned integer)");
1004
1005 UV idx = decode_uint (dec);
1006
1007 if (!dec->shareable || (int)idx > AvFILLp (dec->shareable))
1008 ERR ("corrupted CBOR data (sharedref index out of bounds)");
1009
1010 sv = SvREFCNT_inc_NN (AvARRAY (dec->shareable)[idx]);
1011
1012 if (sv == &PL_sv_undef)
1013 ERR ("cyclic CBOR data structure found, but allow_cycles is not enabled");
1014 }
1015 break;
1016
1017 case CBOR_TAG_PERL_OBJECT:
1018 {
1019 sv = decode_sv (dec);
1020
1021 if (!SvROK (sv) || SvTYPE (SvRV (sv)) != SVt_PVAV)
1022 ERR ("corrupted CBOR data (non-array perl object)");
1023
1024 AV *av = (AV *)SvRV (sv);
1025 int len = av_len (av) + 1;
1026 HV *stash = gv_stashsv (*av_fetch (av, 0, 1), 0);
1027
1028 if (!stash)
1029 ERR ("cannot decode perl-object (package does not exist)");
1030
1031 GV *method = gv_fetchmethod_autoload (stash, "THAW", 0);
1032
1033 if (!method)
1034 ERR ("cannot decode perl-object (package does not have a THAW method)");
1035
1036 dSP;
1037
1038 ENTER; SAVETMPS;
1039 PUSHMARK (SP);
1040 EXTEND (SP, len + 1);
1041 // we re-bless the reference to get overload and other niceties right
1042 PUSHs (*av_fetch (av, 0, 1));
1043 PUSHs (sv_cbor);
1044
1045 int i;
1046
1047 for (i = 1; i < len; ++i)
1048 PUSHs (*av_fetch (av, i, 1));
1049
1050 PUTBACK;
1051 call_sv ((SV *)GvCV (method), G_SCALAR | G_EVAL);
1052 SPAGAIN;
1053
1054 if (SvTRUE (ERRSV))
1055 {
1056 FREETMPS; LEAVE;
1057 ERR (SvPVutf8_nolen (sv_2mortal (SvREFCNT_inc (ERRSV))));
1058 }
1059
1060 SvREFCNT_dec (sv);
1061 sv = SvREFCNT_inc (POPs);
1062
1063 PUTBACK;
1064
1065 FREETMPS; LEAVE;
1066 }
1067 break;
1068
1069 default:
1070 {
1071 SV *tag_sv = newSVuv (tag);
1072
1073 sv = decode_sv (dec);
1074
1075 dSP;
1076 ENTER; SAVETMPS;
1077 SAVESTACK_POS ();
1078 PUSHMARK (SP);
1079 EXTEND (SP, 2);
1080 PUSHs (tag_sv);
1081 PUSHs (sv);
1082
1083 PUTBACK;
1084 int count = call_sv (dec->cbor.filter ? dec->cbor.filter : default_filter, G_ARRAY | G_EVAL);
1085 SPAGAIN;
1086
1087 if (SvTRUE (ERRSV))
1088 {
1089 SvREFCNT_dec (tag_sv);
1090 FREETMPS; LEAVE;
1091 ERR (SvPVutf8_nolen (sv_2mortal (SvREFCNT_inc (ERRSV))));
1092 }
1093
1094 if (count)
1095 {
1096 SvREFCNT_dec (tag_sv);
1097 SvREFCNT_dec (sv);
1098 sv = SvREFCNT_inc (POPs);
1099 }
1100 else
1101 {
1102 AV *av = newAV ();
1103 av_push (av, tag_sv);
1104 av_push (av, sv);
1105
1106 HV *tagged_stash = !CBOR_SLOW || cbor_tagged_stash
1107 ? cbor_tagged_stash
1108 : gv_stashpv ("CBOR::XS::Tagged" , 1);
1109 sv = sv_bless (newRV_noinc ((SV *)av), tagged_stash);
1110 }
1111
1112 PUTBACK;
1113
1114 FREETMPS; LEAVE;
1115 }
1116 break;
1117 }
1118
1119 return sv;
1120
1121 fail:
1122 SvREFCNT_dec (sv);
1123 return &PL_sv_undef;
1124 }
1125
1126 static SV *
1127 decode_sv (dec_t *dec)
1128 {
1129 WANT (1);
1130
1131 switch (*dec->cur >> MAJOR_SHIFT)
1132 {
1133 case MAJOR_POS_INT >> MAJOR_SHIFT: return newSVuv (decode_uint (dec));
1134 case MAJOR_NEG_INT >> MAJOR_SHIFT: return newSViv (-1 - (IV)decode_uint (dec));
1135 case MAJOR_BYTES >> MAJOR_SHIFT: return decode_str (dec, 0);
1136 case MAJOR_TEXT >> MAJOR_SHIFT: return decode_str (dec, 1);
1137 case MAJOR_ARRAY >> MAJOR_SHIFT: return decode_av (dec);
1138 case MAJOR_MAP >> MAJOR_SHIFT: return decode_hv (dec);
1139 case MAJOR_TAG >> MAJOR_SHIFT: return decode_tagged (dec);
1140
1141 case MAJOR_MISC >> MAJOR_SHIFT:
1142 switch (*dec->cur++ & MINOR_MASK)
1143 {
1144 case SIMPLE_FALSE:
1145 #if CBOR_SLOW
1146 types_false = get_bool ("Types::Serialiser::false");
1147 #endif
1148 return newSVsv (types_false);
1149 case SIMPLE_TRUE:
1150 #if CBOR_SLOW
1151 types_true = get_bool ("Types::Serialiser::true");
1152 #endif
1153 return newSVsv (types_true);
1154 case SIMPLE_NULL:
1155 return newSVsv (&PL_sv_undef);
1156 case SIMPLE_UNDEF:
1157 #if CBOR_SLOW
1158 types_error = get_bool ("Types::Serialiser::error");
1159 #endif
1160 return newSVsv (types_error);
1161
1162 case MISC_FLOAT16:
1163 {
1164 WANT (2);
1165
1166 uint16_t fp = (dec->cur[0] << 8) | dec->cur[1];
1167 dec->cur += 2;
1168
1169 return newSVnv (ecb_binary16_to_float (fp));
1170 }
1171
1172 case MISC_FLOAT32:
1173 {
1174 uint32_t fp;
1175 WANT (4);
1176 memcpy (&fp, dec->cur, 4);
1177 dec->cur += 4;
1178
1179 if (!ecb_big_endian ())
1180 fp = ecb_bswap32 (fp);
1181
1182 return newSVnv (ecb_binary32_to_float (fp));
1183 }
1184
1185 case MISC_FLOAT64:
1186 {
1187 uint64_t fp;
1188 WANT (8);
1189 memcpy (&fp, dec->cur, 8);
1190 dec->cur += 8;
1191
1192 if (!ecb_big_endian ())
1193 fp = ecb_bswap64 (fp);
1194
1195 return newSVnv (ecb_binary64_to_double (fp));
1196 }
1197
1198 // 0..19 unassigned simple
1199 // 24 reserved + unassigned simple (reserved values are not encodable)
1200 // 28-30 unassigned misc
1201 // 31 break code
1202 default:
1203 ERR ("corrupted CBOR data (reserved/unassigned/unexpected major 7 value)");
1204 }
1205
1206 break;
1207 }
1208
1209 fail:
1210 return &PL_sv_undef;
1211 }
1212
1213 static SV *
1214 decode_cbor (SV *string, CBOR *cbor, char **offset_return)
1215 {
1216 dec_t dec = { 0 };
1217 SV *sv;
1218 STRLEN len;
1219 char *data = SvPVbyte (string, len);
1220
1221 if (len > cbor->max_size && cbor->max_size)
1222 croak ("attempted decode of CBOR text of %lu bytes size, but max_size is set to %lu",
1223 (unsigned long)len, (unsigned long)cbor->max_size);
1224
1225 dec.cbor = *cbor;
1226 dec.cur = (U8 *)data;
1227 dec.end = (U8 *)data + len;
1228
1229 sv = decode_sv (&dec);
1230
1231 if (offset_return)
1232 *offset_return = dec.cur;
1233
1234 if (!(offset_return || !sv))
1235 if (dec.cur != dec.end && !dec.err)
1236 dec.err = "garbage after CBOR object";
1237
1238 if (dec.err)
1239 {
1240 if (dec.shareable)
1241 {
1242 // need to break cyclic links, which would all be in shareable
1243 int i;
1244 SV **svp;
1245
1246 for (i = av_len (dec.shareable) + 1; i--; )
1247 if ((svp = av_fetch (dec.shareable, i, 0)))
1248 sv_setsv (*svp, &PL_sv_undef);
1249 }
1250
1251 SvREFCNT_dec (sv);
1252 croak ("%s, at offset %d (octet 0x%02x)", dec.err, dec.cur - (U8 *)data, (int)(uint8_t)*dec.cur);
1253 }
1254
1255 sv = sv_2mortal (sv);
1256
1257 return sv;
1258 }
1259
1260 /////////////////////////////////////////////////////////////////////////////
1261 // incremental parser
1262
1263 #define INCR_DONE(cbor) (AvFILLp (cbor->incr_count) < 0)
1264
1265 // returns 0 for notyet, 1 for success or error
1266 static int
1267 incr_parse (CBOR *self, SV *cborstr)
1268 {
1269 STRLEN cur;
1270 SvPV (cborstr, cur);
1271
1272 while (ecb_expect_true (self->incr_need <= cur))
1273 {
1274 // table of integer count bytes
1275 static I8 incr_len[MINOR_MASK + 1] = {
1276 0, 0, 0, 0, 0, 0, 0, 0,
1277 0, 0, 0, 0, 0, 0, 0, 0,
1278 0, 0, 0, 0, 0, 0, 0, 0,
1279 1, 2, 4, 8,-1,-1,-1,-2
1280 };
1281
1282 const U8 *p = SvPVX (cborstr) + self->incr_pos;
1283 U8 m = *p & MINOR_MASK;
1284 IV count = SvIVX (AvARRAY (self->incr_count)[AvFILLp (self->incr_count)]);
1285 I8 ilen = incr_len[m];
1286
1287 self->incr_need = self->incr_pos + 1;
1288
1289 if (ecb_expect_false (ilen < 0))
1290 {
1291 if (m != MINOR_INDEF)
1292 return 1; // error
1293
1294 if (*p == (MAJOR_MISC | MINOR_INDEF))
1295 {
1296 if (count >= 0)
1297 return 1; // error
1298
1299 count = 1;
1300 }
1301 else
1302 {
1303 av_push (self->incr_count, newSViv (-1)); //TODO: nest
1304 count = -1;
1305 }
1306 }
1307 else
1308 {
1309 self->incr_need += ilen;
1310 if (ecb_expect_false (self->incr_need > cur))
1311 return 0;
1312
1313 int major = *p >> MAJOR_SHIFT;
1314
1315 switch (major)
1316 {
1317 case MAJOR_TAG >> MAJOR_SHIFT:
1318 ++count; // tags merely prefix another value
1319 break;
1320
1321 case MAJOR_BYTES >> MAJOR_SHIFT:
1322 case MAJOR_TEXT >> MAJOR_SHIFT:
1323 case MAJOR_ARRAY >> MAJOR_SHIFT:
1324 case MAJOR_MAP >> MAJOR_SHIFT:
1325 {
1326 UV len;
1327
1328 if (ecb_expect_false (ilen))
1329 {
1330 len = 0;
1331
1332 do {
1333 len = (len << 8) | *++p;
1334 } while (--ilen);
1335 }
1336 else
1337 len = m;
1338
1339 switch (major)
1340 {
1341 case MAJOR_BYTES >> MAJOR_SHIFT:
1342 case MAJOR_TEXT >> MAJOR_SHIFT:
1343 self->incr_need += len;
1344 if (ecb_expect_false (self->incr_need > cur))
1345 return 0;
1346
1347 break;
1348
1349 case MAJOR_MAP >> MAJOR_SHIFT:
1350 len <<= 1;
1351 case MAJOR_ARRAY >> MAJOR_SHIFT:
1352 if (len)
1353 {
1354 av_push (self->incr_count, newSViv (len + 1)); //TODO: nest
1355 count = len + 1;
1356 }
1357 break;
1358 }
1359 }
1360 }
1361 }
1362
1363 self->incr_pos = self->incr_need;
1364
1365 if (count > 0)
1366 {
1367 while (!--count)
1368 {
1369 if (!AvFILLp (self->incr_count))
1370 return 1; // done
1371
1372 SvREFCNT_dec_NN (av_pop (self->incr_count));
1373 count = SvIVX (AvARRAY (self->incr_count)[AvFILLp (self->incr_count)]);
1374 }
1375
1376 SvIVX (AvARRAY (self->incr_count)[AvFILLp (self->incr_count)]) = count;
1377 }
1378 }
1379
1380 return 0;
1381 }
1382
1383
1384 /////////////////////////////////////////////////////////////////////////////
1385 // XS interface functions
1386
1387 MODULE = CBOR::XS PACKAGE = CBOR::XS
1388
BOOT:
{
        // stashes of the classes this module works with (created on demand)
        cbor_stash          = gv_stashpv ("CBOR::XS"                  , 1);
        cbor_tagged_stash   = gv_stashpv ("CBOR::XS::Tagged"          , 1);

        types_boolean_stash = gv_stashpv ("Types::Serialiser::Boolean", 1);
        types_error_stash   = gv_stashpv ("Types::Serialiser::Error"  , 1);

        // the special values provided by Types::Serialiser
        types_true          = get_bool ("Types::Serialiser::true" );
        types_false         = get_bool ("Types::Serialiser::false");
        types_error         = get_bool ("Types::Serialiser::error");

        // name of the default filter function
        default_filter      = newSVpv ("CBOR::XS::default_filter", 0);

        // constant "CBOR" string, must never be modified
        sv_cbor             = newSVpv ("CBOR", 0);
        SvREADONLY_on (sv_cbor);

        assert (("STRLEN must be an unsigned type", 0 <= (STRLEN)-1));
}
1408
1409 PROTOTYPES: DISABLE
1410
void CLONE (...)
	CODE:
{
        // perl calls CLONE when an interpreter is cloned: forget all
        // cached stash pointers
        types_boolean_stash = 0;
        types_error_stash   = 0;
        cbor_tagged_stash   = 0;
        cbor_stash          = 0;
}
1417
void new (char *klass)
	PPCODE:
{
        // the CBOR struct is stored inside the string buffer of a scalar
        SV *state_sv = NEWSV (0, sizeof (CBOR));
        HV *stash;

        SvPOK_only (state_sv);
        cbor_init ((CBOR *)SvPVX (state_sv));

        // use the cached stash for the base class, look up any other class
        if (strEQ (klass, "CBOR::XS"))
          stash = CBOR_STASH;
        else
          stash = gv_stashpv (klass, 1);

        // return a blessed reference that owns the scalar
        XPUSHs (sv_2mortal (sv_bless (newRV_noinc (state_sv), stash)));
}
1429
void shrink (CBOR *self, int enable = 1)
	ALIAS:
        shrink          = F_SHRINK
        allow_unknown   = F_ALLOW_UNKNOWN
        allow_sharing   = F_ALLOW_SHARING
        allow_cycles    = F_ALLOW_CYCLES
        pack_strings    = F_PACK_STRINGS
        text_keys       = F_TEXT_KEYS
        text_strings    = F_TEXT_STRINGS
        validate_utf8   = F_VALIDATE_UTF8
	PPCODE:
{
        SV *self_sv = ST (0);

        // ix is the flag bit belonging to the alias that was called
        self->flags = enable
                      ? self->flags |  ix
                      : self->flags & ~ix;

        // the invocant is the return value
        XPUSHs (self_sv);
}
1449
void get_shrink (CBOR *self)
	ALIAS:
        get_shrink          = F_SHRINK
        get_allow_unknown   = F_ALLOW_UNKNOWN
        get_allow_sharing   = F_ALLOW_SHARING
        get_allow_cycles    = F_ALLOW_CYCLES
        get_pack_strings    = F_PACK_STRINGS
        get_text_keys       = F_TEXT_KEYS
        get_text_strings    = F_TEXT_STRINGS
        get_validate_utf8   = F_VALIDATE_UTF8
	PPCODE:
{
        // ix is the flag bit belonging to the alias that was called;
        // return perl's true or false value depending on its state
        XPUSHs ((self->flags & ix) ? &PL_sv_yes : &PL_sv_no);
}
1462
void max_depth (CBOR *self, U32 max_depth = 0x80000000UL)
	PPCODE:
{
        SV *self_sv = ST (0);

        // remember the new limit and return the invocant
        self->max_depth = max_depth;
        XPUSHs (self_sv);
}
1467
U32 get_max_depth (CBOR *self)
	CODE:
{
        // the value stored by max_depth
        RETVAL = self->max_depth;
}
	OUTPUT:
        RETVAL
1473
void max_size (CBOR *self, U32 max_size = 0)
	PPCODE:
{
        SV *self_sv = ST (0);

        // remember the new limit and return the invocant
        self->max_size = max_size;
        XPUSHs (self_sv);
}
1478
U32 get_max_size (CBOR *self)
	CODE:
{
        // the setter accepts a U32, so return the value with the same
        // unsigned type (as get_max_depth does) instead of squeezing it
        // through a signed int
        RETVAL = self->max_size;
}
	OUTPUT:
        RETVAL
1484
void filter (CBOR *self, SV *filter = 0)
	PPCODE:
{
        SV *self_sv = ST (0);

        // copy the new filter before releasing the old one: the argument
        // may be the very SV that is currently stored (e.g. when it was
        // obtained from get_filter), and must not be freed before the copy
        SV *new_filter = filter ? newSVsv (filter) : 0;

        SvREFCNT_dec (self->filter);
        self->filter = new_filter;

        // the invocant is the return value
        XPUSHs (self_sv);
}
1490
SV *get_filter (CBOR *self)
	CODE:
{
        // an SV * RETVAL is made mortal by the generated code, so the
        // stored filter needs an extra reference here - otherwise every
        // call would take one reference away from self->filter.
        // without a filter a fresh undefined scalar is returned.
        RETVAL = self->filter ? SvREFCNT_inc (self->filter) : NEWSV (0, 0);
}
	OUTPUT:
        RETVAL
1496
void encode (CBOR *self, SV *scalar)
	PPCODE:
{
        SV *encoded;

        // publish the stack pointer around the call and re-read it afterwards
        PUTBACK;
        encoded = encode_cbor (scalar, self);
        SPAGAIN;

        XPUSHs (encoded);
}
1501
void decode (CBOR *self, SV *cborstr)
	PPCODE:
{
        SV *decoded;

        // publish the stack pointer around the call and re-read it afterwards
        PUTBACK;
        decoded = decode_cbor (cborstr, self, 0);
        SPAGAIN;

        XPUSHs (decoded);
}
1506
void decode_prefix (CBOR *self, SV *cborstr)
	PPCODE:
{
        SV *value;
        char *end;
        UV consumed;

        PUTBACK;
        value = decode_cbor (cborstr, self, &end);
        SPAGAIN;

        // distance between the start of the string buffer and the
        // position reported back by decode_cbor
        consumed = end - SvPVX (cborstr);

        // two return values: the decoded value and that distance
        EXTEND (SP, 2);
        PUSHs (value);
        PUSHs (sv_2mortal (newSVuv (consumed)));
}
1517
void incr_parse (CBOR *self, SV *cborstr)
	ALIAS:
        incr_parse_multiple = 1
	PPCODE:
{
        // the scanner works on octets, so drop any utf-8 encoding first
        if (SvUTF8 (cborstr))
          sv_utf8_downgrade (cborstr, 0);

        // set up the scanner state on first use (or after incr_reset)
        if (!self->incr_count)
          {
            self->incr_count = newAV ();
            self->incr_pos   = 0;
            self->incr_need  = 1;

            av_push (self->incr_count, newSViv (1));
          }

        // incr_parse returns at most one value, incr_parse_multiple (ix
        // set) keeps going for as long as complete values are found
        for (;;)
          {
            SV *decoded;
            char *end;

            if (!incr_parse (self, cborstr))
              {
                // more data is required - refuse if that exceeds max_size
                if (self->max_size && self->incr_need > self->max_size)
                  croak ("attempted decode of CBOR text of %lu bytes size, but max_size is set to %lu",
                         (unsigned long)self->incr_need, (unsigned long)self->max_size);

                break;
              }

            PUTBACK;
            decoded = decode_cbor (cborstr, self, &end);
            SPAGAIN;
            XPUSHs (decoded);

            // remove everything up to the reported position from the string
            sv_chop (cborstr, end);

            // and restart the scanner at the beginning of what is left
            av_clear (self->incr_count);
            av_push (self->incr_count, newSViv (1));

            self->incr_pos  = 0;
            self->incr_need = 1;

            if (!ix)
              break;
          }
}
1562
void incr_reset (CBOR *self)
	CODE:
{
        // throw away the scanner state; a null incr_count makes the
        // next incr_parse call start from scratch
        AV *old_count = self->incr_count;

        self->incr_count = 0;
        SvREFCNT_dec (old_count);
}
1569
void DESTROY (CBOR *self)
	PPCODE:
{
        // hand the object state over to cbor_free, nothing is returned
        cbor_free (self);
}
1573
1574 PROTOTYPES: ENABLE
1575
void encode_cbor (SV *scalar)
	ALIAS:
        encode_cbor         = 0
        encode_cbor_sharing = F_ALLOW_SHARING
	PPCODE:
{
        // functional interface: encode with a temporary coder state that
        // additionally has the flag bits of the called alias set
        CBOR ctx;
        SV *encoded;

        cbor_init (&ctx);
        ctx.flags |= ix;

        PUTBACK;
        encoded = encode_cbor (scalar, &ctx);
        SPAGAIN;

        XPUSHs (encoded);
}
1588
void decode_cbor (SV *cborstr)
	PPCODE:
{
        // functional interface: decode with a freshly initialised,
        // temporary coder state
        CBOR ctx;
        SV *decoded;

        cbor_init (&ctx);

        PUTBACK;
        decoded = decode_cbor (cborstr, &ctx, 0);
        SPAGAIN;

        XPUSHs (decoded);
}
1597