ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/Convert-UUlib/UUlib.pm
(Generate patch)

Comparing Convert-UUlib/UUlib.pm (file contents):
Revision 1.27 by root, Sat Dec 16 22:53:30 2006 UTC vs.
Revision 1.47 by root, Fri Feb 28 16:57:25 2020 UTC

1package Convert::UUlib; 1package Convert::UUlib;
2
3no warnings;
4use strict;
2 5
3use Carp; 6use Carp;
4 7
5require Exporter; 8require Exporter;
6require DynaLoader; 9require DynaLoader;
7 10
8$VERSION = '1.08'; 11our $VERSION = 1.62;
9 12
10@ISA = qw(Exporter DynaLoader); 13our @ISA = qw(Exporter DynaLoader);
11 14
12@_consts = qw( 15our @_consts = qw(
13 ACT_COPYING ACT_DECODING ACT_ENCODING ACT_IDLE ACT_SCANNING 16 ACT_COPYING ACT_DECODING ACT_ENCODING ACT_IDLE ACT_SCANNING
14 17
15 FILE_DECODED FILE_ERROR FILE_MISPART FILE_NOBEGIN FILE_NODATA 18 FILE_DECODED FILE_ERROR FILE_MISPART FILE_NOBEGIN FILE_NODATA
16 FILE_NOEND FILE_OK FILE_READ FILE_TMPFILE 19 FILE_NOEND FILE_OK FILE_READ FILE_TMPFILE
17 20
19 22
20 OPT_RBUF OPT_WBUF 23 OPT_RBUF OPT_WBUF
21 OPT_BRACKPOL OPT_DEBUG OPT_DESPERATE OPT_DUMBNESS OPT_ENCEXT 24 OPT_BRACKPOL OPT_DEBUG OPT_DESPERATE OPT_DUMBNESS OPT_ENCEXT
22 OPT_ERRNO OPT_FAST OPT_IGNMODE OPT_IGNREPLY OPT_OVERWRITE OPT_PREAMB 25 OPT_ERRNO OPT_FAST OPT_IGNMODE OPT_IGNREPLY OPT_OVERWRITE OPT_PREAMB
23 OPT_PROGRESS OPT_SAVEPATH OPT_TINYB64 OPT_USETEXT OPT_VERBOSE 26 OPT_PROGRESS OPT_SAVEPATH OPT_TINYB64 OPT_USETEXT OPT_VERBOSE
24 OPT_VERSION OPT_REMOVE OPT_MOREMIME OPT_DOTDOT 27 OPT_VERSION OPT_REMOVE OPT_MOREMIME OPT_DOTDOT OPT_AUTOCHECK
25 28
26 RET_CANCEL RET_CONT RET_EXISTS RET_ILLVAL RET_IOERR RET_NODATA 29 RET_CANCEL RET_CONT RET_EXISTS RET_ILLVAL RET_IOERR RET_NODATA
27 RET_NOEND RET_NOMEM RET_OK RET_UNSUP 30 RET_NOEND RET_NOMEM RET_OK RET_UNSUP
28 31
29 B64_ENCODED BH_ENCODED PT_ENCODED QP_ENCODED 32 B64_ENCODED BH_ENCODED PT_ENCODED QP_ENCODED
30 XX_ENCODED UU_ENCODED YENC_ENCODED 33 XX_ENCODED UU_ENCODED YENC_ENCODED
31); 34);
32 35
33@_funcs = qw( 36our @_funcs = qw(
34 Initialize CleanUp GetOption SetOption strerror SetMsgCallback 37 Initialize CleanUp GetOption SetOption strerror SetMsgCallback
35 SetBusyCallback SetFileCallback SetFNameFilter SetFileNameCallback 38 SetBusyCallback SetFileCallback SetFNameFilter SetFileNameCallback
36 FNameFilter LoadFile GetFileListItem RenameFile DecodeToTemp 39 FNameFilter LoadFile GetFileListItem GetFileList RenameFile DecodeToTemp
37 RemoveTemp DecodeFile InfoFile Smerge QuickDecode EncodeMulti 40 RemoveTemp DecodeFile InfoFile Smerge QuickDecode EncodeMulti
38 EncodePartial EncodeToStream EncodeToFile E_PrepSingle 41 EncodePartial EncodeToStream EncodeToFile E_PrepSingle
39 E_PrepPartial 42 E_PrepPartial
40 43
41 straction strencoding strmsglevel 44 straction strencoding strmsglevel
42); 45);
43 46
44@EXPORT = @_consts; 47our @EXPORT = @_consts;
45@EXPORT_OK = @_funcs; 48our @EXPORT_OK = @_funcs;
46%EXPORT_TAGS = (all => [@_consts,@_funcs], constants => \@_consts); 49our %EXPORT_TAGS = (all => [@_consts,@_funcs], constants => \@_consts);
47 50
48bootstrap Convert::UUlib $VERSION; 51bootstrap Convert::UUlib $VERSION;
49 52
50Initialize(); 53Initialize();
51 54
52# not when < 5.005_6x 55# not when < 5.005_6x
53# END { CleanUp() } 56# END { CleanUp() }
54 57
55for (@_consts) { 58for (@_consts) {
56 my $constant = constant($_); 59 my $constant = constant($_);
60 no strict 'refs';
57 *$_ = sub () { $constant }; 61 *$_ = sub () { $constant };
58} 62}
59 63
60# action code -> string mapping 64# action code -> string mapping
61sub straction($) { 65sub straction($) {
101 use Convert::UUlib ':all'; 105 use Convert::UUlib ':all';
102 106
103 # read all the files named on the commandline and decode them 107 # read all the files named on the commandline and decode them
104 # into the CURRENT directory. See below for a longer example. 108 # into the CURRENT directory. See below for a longer example.
105 LoadFile $_ for @ARGV; 109 LoadFile $_ for @ARGV;
106 for (my $i = 0; my $uu = GetFileListItem $i; $i++) { 110 for my $uu (GetFileList) {
107 if ($uu->state & FILE_OK) { 111 if ($uu->state & FILE_OK) {
108 $uu->decode; 112 $uu->decode;
109 print $uu->filename, "\n"; 113 print $uu->filename, "\n";
110 } 114 }
111 } 115 }
155 OPT_TINYB64 detect short B64 outside of Mime 159 OPT_TINYB64 detect short B64 outside of Mime
156 OPT_ENCEXT extension for single-part encoded files 160 OPT_ENCEXT extension for single-part encoded files
157 OPT_REMOVE remove input files after decoding (dangerous) 161 OPT_REMOVE remove input files after decoding (dangerous)
158 OPT_MOREMIME strict MIME adherence 162 OPT_MOREMIME strict MIME adherence
159 OPT_DOTDOT ".."-unescaping has not yet been done on input files 163 OPT_DOTDOT ".."-unescaping has not yet been done on input files
160 OPT_RBUF set default read I/O buffer size in bytes *EXPERIMENTAL* 164 OPT_RBUF set default read I/O buffer size in bytes
161 OPT_WBUF set default write I/O buffer size in bytes *EXPERIMENTAL* 165 OPT_WBUF set default write I/O buffer size in bytes
166 OPT_AUTOCHECK automatically check file list after every loadfile
162 167
163=head2 Result/Error codes 168=head2 Result/Error codes
164 169
165 RET_OK everything went fine 170 RET_OK everything went fine
166 RET_IOERR I/O Error - examine errno 171 RET_IOERR I/O Error - examine errno
209again. 214again.
210 215
211On my machine, a fairly complete decode with DBI backend needs about 10MB 216On my machine, a fairly complete decode with DBI backend needs about 10MB
212RSS to decode 20000 files. 217RSS to decode 20000 files.
213 218
214=over 4 219=over
215 220
216=item Initialize 221=item Initialize
217 222
218Not normally necessary, (re-)initializes the library. 223Not normally necessary, (re-)initializes the library.
219 224
224 229
225=back 230=back
226 231
227=head2 Setting and querying options 232=head2 Setting and querying options
228 233
229=over 4 234=over
230 235
231=item $option = GetOption OPT_xxx 236=item $option = GetOption OPT_xxx
232 237
233=item SetOption OPT_xxx, opt-value 238=item SetOption OPT_xxx, opt-value
234 239
236 241
237See the C<OPT_xxx> constants above to see which options exist. 242See the C<OPT_xxx> constants above to see which options exist.
238 243
239=head2 Setting various callbacks 244=head2 Setting various callbacks
240 245
241=over 4 246=over
242 247
243=item SetMsgCallback [callback-function] 248=item SetMsgCallback [callback-function]
244 249
245=item SetBusyCallback [callback-function] 250=item SetBusyCallback [callback-function]
246 251
250 255
251=back 256=back
252 257
253=head2 Call the currently selected FNameFilter 258=head2 Call the currently selected FNameFilter
254 259
255=over 4 260=over
256 261
257=item $file = FNameFilter $file 262=item $file = FNameFilter $file
258 263
259=back 264=back
260 265
261=head2 Loading sourcefiles, optionally fuzzy merge and start decoding 266=head2 Loading sourcefiles, optionally fuzzy merge and start decoding
262 267
263=over 4 268=over
264 269
265=item ($retval, $count) = LoadFile $fname, [$id, [$delflag, [$partno]]] 270=item ($retval, $count) = LoadFile $fname, [$id, [$delflag, [$partno]]]
266 271
267Load the given file and scan it for encoded contents. Optionally tag it 272Load the given file and scan it for encoded contents. Optionally tag it
268with the given id, and if C<$delflag> is true, delete the file after it 273with the given id, and if C<$delflag> is true, delete the file after it
277If you are desperate, try to call C<Smerge> with increasing C<$pass> 282If you are desperate, try to call C<Smerge> with increasing C<$pass>
278values, beginning at C<0>, to try to merge parts that usually would not 283values, beginning at C<0>, to try to merge parts that usually would not
279have been merged. 284have been merged.
280 285
281Most probably this will result in garbled files, so never do this by 286Most probably this will result in garbled files, so never do this by
282default. 287default, except:
288
289If the C<OPT_AUTOCHECK> option has been disabled (by default it is
290enabled) to speed up file loading, then you I<have> to call C<Smerge -1>
291after loading all files as an additional pre-pass (which is normally done
292by C<LoadFile>).
283 293
284=item $item = GetFileListItem $item_number 294=item $item = GetFileListItem $item_number
285 295
286Return the C<$item> structure for the C<$item_number>'th found file, or 296Return the C<$item> structure for the C<$item_number>'th found file, or
287C<undef> if no file with that number exists. 297C<undef> if no file with that number exists.
288 298
289The first file has number C<0>, and the series has no holes, so you can 299The first file has number C<0>, and the series has no holes, so you can
290iterate over all files by starting with zero and incrementing until you 300iterate over all files by starting with zero and incrementing until you
291hit C<undef>. 301hit C<undef>.
292 302
303This function has to walk the linear list of files on each access, so
304if you want to iterate over all items, it is usually faster to use
305C<GetFileList>.
306
307=item @items = GetFileList
308
309Similar to C<GetFileListItem>, but returns all files in one go.
310
293=back 311=back
294 312
295=head2 Decoding files 313=head2 Decoding files
296 314
297=over 4 315=over
298 316
299=item $retval = $item->rename($newname) 317=item $retval = $item->rename ($newname)
300 318
301Change the ondisk filename where the decoded file will be saved. 319Change the ondisk filename where the decoded file will be saved.
302 320
303=item $retval = $item->decode_temp 321=item $retval = $item->decode_temp
304 322
307 325
308=item $retval = $item->remove_temp 326=item $retval = $item->remove_temp
309 327
310Remove the temporarily decoded file again. 328Remove the temporarily decoded file again.
311 329
312=item $retval = $item->decode([$target_path]) 330=item $retval = $item->decode ([$target_path])
313 331
314Decode the file to it's destination, or the given target path. 332Decode the file to its destination, or the given target path.
315 333
316=item $retval = $item->info(callback-function) 334=item $retval = $item->info (callback-function)
317 335
318=back 336=back
319 337
320=head2 Querying (and setting) item attributes 338=head2 Querying (and setting) item attributes
321 339
322=over 4 340=over
323 341
324=item $state = $item->state 342=item $state = $item->state
325 343
326=item $mode = $item->mode([newmode]) 344=item $mode = $item->mode ([newmode])
327 345
328=item $uudet = $item->uudet 346=item $uudet = $item->uudet
329 347
330=item $size = $item->size 348=item $size = $item->size
331 349
332=item $filename = $item->filename([newfilename]) 350=item $filename = $item->filename ([newfilename])
333 351
334=item $subfname = $item->subfname 352=item $subfname = $item->subfname
335 353
336=item $mimeid = $item->mimeid 354=item $mimeid = $item->mimeid
337 355
341 359
342=back 360=back
343 361
344=head2 Information about source parts 362=head2 Information about source parts
345 363
346=over 4 364=over
347 365
348=item $parts = $item->parts 366=item $parts = $item->parts
349 367
350Return information about all parts (source files) used to decode the file 368Return information about all parts (source files) used to decode the file
351as a list of hashrefs with the following structure: 369as a list of hashrefs with the following structure:
365Usually you are interested mostly in the C<sfname> and possibly the C<partno> 383Usually you are interested mostly in the C<sfname> and possibly the C<partno>
366and C<filename> members. 384and C<filename> members.
367 385
368=back 386=back
369 387
370=head2 Functions below not documented and not very well tested 388=head2 Functions below are not documented and not very well tested - feedback welcome
371 389
372 QuickDecode 390 QuickDecode
373 EncodeMulti 391 EncodeMulti
374 EncodePartial 392 EncodePartial
375 EncodeToStream 393 EncodeToStream
379 397
380=head2 EXTENSION FUNCTIONS 398=head2 EXTENSION FUNCTIONS
381 399
382Functions found in this module but not documented in the uulib documentation: 400Functions found in this module but not documented in the uulib documentation:
383 401
384=over 4 402=over
385 403
386=item $msg = straction ACT_xxx 404=item $msg = straction ACT_xxx
387 405
388Return a human readable string representing the given action code. 406Return a human readable string representing the given action code.
389 407
433=head1 LARGE EXAMPLE DECODER 451=head1 LARGE EXAMPLE DECODER
434 452
435This is the file C<example-decoder> from the distribution, put here 453This is the file C<example-decoder> from the distribution, put here
436instead of more thorough documentation. 454instead of more thorough documentation.
437 455
456 #!/usr/bin/perl
457
438 # decode all the files in the directory uusrc/ and copy 458 # decode all the files in the directory uusrc/ and copy
439 # the resulting files to uudst/ 459 # the resulting files to uudst/
440 460
441 use Convert::UUlib ':all'; 461 use Convert::UUlib ':all';
442 462
443 sub namefilter { 463 sub namefilter {
444 my($path)=@_; 464 my ($path) = @_;
465
445 $path=~s/^.*[\/\\]//; 466 $path=~s/^.*[\/\\]//;
467
446 $path; 468 $path
447 } 469 }
448 470
449 sub busycb { 471 sub busycb {
450 my ($action, $curfile, $partno, $numparts, $percent, $fsize) = @_; 472 my ($action, $curfile, $partno, $numparts, $percent, $fsize) = @_;
451 $_[0]=straction($action); 473 $_[0]=straction($action);
452 print "busy_callback(", (join ",",@_), ")\n"; 474 print "busy_callback(", (join ",",@_), ")\n";
453 0; 475 0
454 } 476 }
455 477
478 SetOption OPT_RBUF, 128*1024;
479 SetOption OPT_WBUF, 1024*1024;
456 SetOption OPT_IGNMODE, 1; 480 SetOption OPT_IGNMODE, 1;
481 SetOption OPT_IGNMODE, 1;
457 SetOption OPT_VERBOSE, 1; 482 SetOption OPT_VERBOSE, 1;
458 483
459 # show the three ways you can set callback functions. I normally 484 # show the three ways you can set callback functions. I normally
460 # prefer the one with the sub inplace. 485 # prefer the one with the sub inplace.
461 SetFNameFilter \&namefilter; 486 SetFNameFilter \&namefilter;
462 487
463 SetBusyCallback "busycb", 333; 488 SetBusyCallback "busycb", 333;
464 489
465 SetMsgCallback sub { 490 SetMsgCallback sub {
466 my ($msg, $level) = @_; 491 my ($msg, $level) = @_;
467 print uc strmsglevel $_[1], ": $msg\n"; 492 print uc strmsglevel $_[1], ": $msg\n";
468 }; 493 };
469 494
470 # the following non-trivial FileNameCallback takes care 495 # the following non-trivial FileNameCallback takes care
471 # of some subject lines not detected properly by uulib: 496 # of some subject lines not detected properly by uulib:
472 SetFileNameCallback sub { 497 SetFileNameCallback sub {
473 return unless $_[1]; # skip "Re:"-plies et al. 498 return unless $_[1]; # skip "Re:"-plies et al.
474 local $_ = $_[0]; 499 local $_ = $_[0];
475 500
476 # the following rules are rather effective on some newsgroups, 501 # the following rules are rather effective on some newsgroups,
477 # like alt.binaries.games.anime, where non-mime, uuencoded data 502 # like alt.binaries.games.anime, where non-mime, uuencoded data
478 # is very common 503 # is very common
479 504
480 # if we find some *.rar, take it as the filename 505 # if we find some *.rar, take it as the filename
481 return $1 if /(\S{3,}\.(?:[rstuvwxyz]\d\d|rar))\s/i; 506 return $1 if /(\S{3,}\.(?:[rstuvwxyz]\d\d|rar))\s/i;
482 507
483 # one common subject format 508 # one common subject format
484 return $1 if /- "(.{2,}?\..+?)" (?:yenc )?\(\d+\/\d+\)/i; 509 return $1 if /- "(.{2,}?\..+?)" (?:yenc )?\(\d+\/\d+\)/i;
485 510
486 # - filename.par (04/55) 511 # - filename.par (04/55)
487 return $1 if /- "?(\S{3,}\.\S+?)"? (?:yenc )?\(\d+\/\d+\)/i; 512 return $1 if /- "?(\S{3,}\.\S+?)"? (?:yenc )?\(\d+\/\d+\)/i;
488 513
489 # - (xxx) No. 1 sayuri81.jpg 756565 bytes 514 # - (xxx) No. 1 sayuri81.jpg 756565 bytes
490 # - (20 files) No.17 Roseanne.jpg [2/2] 515 # - (20 files) No.17 Roseanne.jpg [2/2]
491 return $1 if /No\.[ 0-9]+ (\S+\....) (?:\d+ bytes )?\[/; 516 return $1 if /No\.[ 0-9]+ (\S+\....) (?:\d+ bytes )?\[/;
492 517
518 # try to detect some common forms of filenames
519 return $1 if /([a-z0-9_\-+.]{3,}\.[a-z]{3,4}(?:.\d+))/i;
520
493 # otherwise just pass what we have 521 # otherwise just pass what we have
494 return (); 522 ()
495 }; 523 };
496 524
497 # now read all files in the directory uusrc/* 525 # now read all files in the directory uusrc/*
498 for(<uusrc/*>) { 526 for (<uusrc/*>) {
499 my($retval,$count)=LoadFile ($_, $_, 1); 527 my ($retval, $count) = LoadFile ($_, $_, 1);
500 print "file($_), status(", strerror $retval, ") parts($count)\n"; 528 print "file($_), status(", strerror $retval, ") parts($count)\n";
501 } 529 }
502 530
503 SetOption OPT_SAVEPATH, "uudst/"; 531 SetOption OPT_SAVEPATH, "uudst/";
504 532
505 # now wade through all files and their source parts 533 # now wade through all files and their source parts
506 $i = 0; 534 for my $uu (GetFileList) {
507 while ($uu = GetFileListItem($i)) { 535 print "file ", $uu->filename, "\n";
508 $i++;
509 print "file nr. $i";
510 print " state ", $uu->state; 536 print " state ", $uu->state, "\n";
511 print " mode ", $uu->mode; 537 print " mode ", $uu->mode, "\n";
512 print " uudet ", strencoding $uu->uudet; 538 print " uudet ", strencoding $uu->uudet, "\n";
513 print " size ", $uu->size; 539 print " size ", $uu->size, "\n";
514 print " filename ", $uu->filename;
515 print " subfname ", $uu->subfname; 540 print " subfname ", $uu->subfname, "\n";
516 print " mimeid ", $uu->mimeid; 541 print " mimeid ", $uu->mimeid, "\n";
517 print " mimetype ", $uu->mimetype; 542 print " mimetype ", $uu->mimetype, "\n";
518 print "\n";
519 543
520 # print additional info about all parts 544 # print additional info about all parts
545 print " parts";
521 for ($uu->parts) { 546 for ($uu->parts) {
522 while (my ($k, $v) = each %$_) { 547 for my $k (sort keys %$_) {
523 print "$k > $v, "; 548 print " $k=$_->{$k}";
524 } 549 }
525 print "\n"; 550 print "\n";
526 } 551 }
527 552
528 $uu->decode_temp;
529 print " temporarily decoded to ", $uu->binfile, "\n";
530 $uu->remove_temp; 553 $uu->remove_temp;
531 554
532 print strerror $uu->decode; 555 if (my $err = $uu->decode) {
556 print " ERROR ", strerror $err, "\n";
557 } else {
533 print " saved as uudst/", $uu->filename, "\n"; 558 print " successfully saved as uudst/", $uu->filename, "\n";
534 } 559 }
560 }
535 561
536 print "cleanup...\n"; 562 print "cleanup...\n";
537 563
538 CleanUp(); 564 CleanUp;
565
566=head1 PERLMULTICORE SUPPORT
567
568This module supports the perlmulticore standard (see
569L<http://perlmulticore.schmorp.de/> for more info) for the following
570functions - generally these are functions accessing the disk and/or using
571considerable CPU time:
572
573 LoadFile
574 $item->decode
575 $item->decode_temp
576 $item->remove_temp
577 $item->info
578
579The perl interpreter will be reacquired/released on every callback
580invocation, so for performance reasons, callbacks should be avoided if
581that is costly.
582
583Future versions might enable multicore support for more functions.
584
585=head1 BUGS AND LIMITATIONS
586
587The original uulib library this module uses was written at a time when
588main memory was measured in megabytes and buffer overflows as a security
589thing didn't exist. While a lot of security fixes have been applied over
590the years (including some defense-in-depth mechanisms that can shield
591against a lot of as-of-yet undetected bugs), using this library for
592security purposes requires care.
593
594Likewise, file sizes when the uulib library was written were tiny compared
595to today, so do not expect this library to handle files larger than 2GB.
539 596
540=head1 AUTHOR 597=head1 AUTHOR
541 598
542Marc Lehmann <schmorp@schmorp.de>, the original uulib library was written 599Marc Lehmann <schmorp@schmorp.de>, the original uulib library was written
543by Frank Pilhofer <fp@informatik.uni-frankfurt.de>, and later heavily 600by Frank Pilhofer <fp@informatik.uni-frankfurt.de>, and later heavily
544bugfixed by Marc Lehmann. 601bugfixed by Marc Lehmann.
545 602
546=head1 SEE ALSO 603=head1 SEE ALSO
547 604
548perl(1), uudeview homepage at http://www.uni-frankfurt.de/~fp/uudeview/. 605perl(1), uudeview homepage at L<http://www.fpx.de/fp/Software/UUDeview/>.
549 606
550=cut 607=cut
608

Diff Legend

Removed lines
+ Added lines
< Changed lines
> Changed lines