1package IO::Compress::Bzip2 ;
2
3use strict ;
4use warnings;
5use bytes;
6require Exporter ;
7
8use IO::Compress::Base 2.106 ;
9
10use IO::Compress::Base::Common  2.106 qw();
11use IO::Compress::Adapter::Bzip2 2.106 ;
12
13
14
# Package-level state.  $Bzip2Error is the error variable whose reference
# is handed to createSelfTiedObject by new() and bzip2() below.
our $VERSION    = '2.106';
our $Bzip2Error = '';

# Inheritance and the symbols callers may import on request.
our @ISA       = qw(IO::Compress::Base Exporter);
our @EXPORT_OK = qw( $Bzip2Error bzip2 ) ;

# Begin with a copy of the base class's tag table, append this module's
# exportable symbols to the ':all' tag, then register that tag's members
# with Exporter.
our %EXPORT_TAGS = %IO::Compress::Base::EXPORT_TAGS ;
push @{ $EXPORT_TAGS{all} }, @EXPORT_OK ;
Exporter::export_ok_tags('all');
25
26
27
# Constructor: IO::Compress::Bzip2->new( $output [, OPTS] ).
#
# Obtains an object from createSelfTiedObject (bound to $Bzip2Error) and
# returns whatever its _create method returns.
sub new
{
    my $class = shift ;

    # The caller's remaining arguments are forwarded through @_ itself,
    # not through a copy, preceded by an explicit undef.
    return IO::Compress::Base::Common::createSelfTiedObject($class, \$Bzip2Error)
               ->_create(undef, @_);
}
35
# Functional ("one-shot") interface: bzip2 $input => $output [, OPTS].
#
# Creates a class-less object via createSelfTiedObject (bound to
# $Bzip2Error) and returns the result of its _def method, which receives
# the caller's argument list unchanged.
sub bzip2
{
    my $worker = IO::Compress::Base::Common::createSelfTiedObject(undef, \$Bzip2Error);

    return $worker->_def(@_);
}
41
42
# Header hook: this class contributes no header bytes of its own, so the
# result is always the empty string.
sub mkHeader
{
    my ($self) = @_ ;

    return q{} ;
}
49
# Describes the bzip2-specific constructor options.
#
# Returns a flat key => [ parse-type, default ] list:
#   blocksize100k  unsigned, default 1
#   workfactor     unsigned, default 0
#   verbosity      boolean,  default 0
sub getExtraParams
{
    my ($self) = @_ ;

    # 'use' is processed at compile time even though it is written here.
    use IO::Compress::Base::Common  2.106 qw(:Parse);

    my $unsigned = IO::Compress::Base::Common::Parse_unsigned() ;
    my $boolean  = IO::Compress::Base::Common::Parse_boolean() ;

    # Returned as a literal list so the result in every calling context
    # is the same as a plain comma-separated list.
    return (
            'blocksize100k' => [$unsigned, 1],
            'workfactor'    => [$unsigned, 0],
            'verbosity'     => [$boolean,  0],
        );
}
62
63
64
# Validates the bzip2-specific options after parsing.
#
# Parameters:
#   $self - the compressor object; must provide saveErrorString().
#   $got  - the parsed-options object; must provide parsed() and getValue().
#
# Returns 1 when every explicitly supplied option is within range.
# Otherwise returns the result of saveErrorString(undef, MESSAGE), where
# MESSAGE names the offending option and the value received.
#
# Only options the caller actually supplied (parsed() is true) are
# checked.  An undefined value is treated as out of range for both
# options and is reported as "undef" rather than being interpolated.
sub ckParams
{
    my $self = shift ;
    my $got = shift;

    # [ parser key, name used in the message, lowest, highest ]
    my @ranges = (
        [ 'blocksize100k', 'BlockSize100K', 1, 9   ],
        [ 'workfactor',    'WorkFactor',    0, 250 ],
    );

    for my $range (@ranges) {
        my ($key, $name, $min, $max) = @$range;

        next unless $got->parsed($key);

        my $value = $got->getValue($key);
        next if defined $value && $value >= $min && $value <= $max;

        # Avoid an "uninitialized value" warning while building the message.
        my $shown = defined $value ? $value : 'undef';
        return $self->saveErrorString(undef,
            "Parameter '$name' not between $min and $max, got $shown");
    }

    return 1 ;
}
87
88
# Builds the low-level compression object for this stream.
#
# Parameters:
#   $self - the compressor object; must provide saveErrorString().
#   $got  - the parsed-options object; must provide getValue().
#
# Returns the object produced by
# IO::Compress::Adapter::Bzip2::mkCompObject.  When that call yields an
# undefined object, its error string and error number are passed to
# saveErrorString(undef, ...) and that call's result is returned instead.
sub mkComp
{
    my ($self, $got) = @_ ;

    # Each option is fetched in scalar context, in the order the adapter
    # takes them: block size, work factor, verbosity.
    my ($blockSize, $workFactor, $verbosity) =
        map { scalar $got->getValue($_) } qw(blocksize100k workfactor verbosity) ;

    my ($compressor, $message, $code) =
        IO::Compress::Adapter::Bzip2::mkCompObject($blockSize, $workFactor, $verbosity) ;

    unless (defined $compressor) {
        return $self->saveErrorString(undef, $message, $code) ;
    }

    return $compressor ;
}
107
108
# Trailer hook: this class appends no trailer bytes of its own, so the
# result is always the empty string.
sub mkTrailer
{
    my ($self) = @_ ;

    return q{} ;
}
114
# Final-trailer hook: always the empty string; any arguments are ignored.
sub mkFinalTrailer
{
    return q{} ;
}
119
120#sub newHeader
121#{
122#    my $self = shift ;
123#    return '';
124#}
125
# Returns the name of the class that reads what this class writes.
sub getInverseClass
{
    return 'IO::Uncompress::Bunzip2' ;
}
130
# File-information hook.  The arguments are unpacked but nothing is
# recorded from them (mkHeader in this class emits an empty header).
#
# Parameters:
#   $self   - the compressor object (unused).
#   $params - the option set (unused).
#   $file   - the input file (unused beyond being the result).
#
# The result is the third argument, or undef when it is absent.
sub getFileInfo
{
    my $self   = shift ;
    my $params = shift ;

    my $file = shift ;
    return $file ;
}
138
1391;
140
141__END__
142
143=head1 NAME
144
145IO::Compress::Bzip2 - Write bzip2 files/buffers
146
147=head1 SYNOPSIS
148
149    use IO::Compress::Bzip2 qw(bzip2 $Bzip2Error) ;
150
151    my $status = bzip2 $input => $output [,OPTS]
152        or die "bzip2 failed: $Bzip2Error\n";
153
154    my $z = IO::Compress::Bzip2->new( $output [,OPTS] )
155        or die "bzip2 failed: $Bzip2Error\n";
156
157    $z->print($string);
158    $z->printf($format, $string);
159    $z->write($string);
160    $z->syswrite($string [, $length, $offset]);
161    $z->flush();
162    $z->tell();
163    $z->eof();
164    $z->seek($position, $whence);
165    $z->binmode();
166    $z->fileno();
167    $z->opened();
168    $z->autoflush();
169    $z->input_line_number();
170    $z->newStream( [OPTS] );
171
172    $z->close() ;
173
174    $Bzip2Error ;
175
176    # IO::File mode
177
178    print $z $string;
179    printf $z $format, $string;
180    tell $z
181    eof $z
182    seek $z, $position, $whence
183    binmode $z
184    fileno $z
185    close $z ;
186
187=head1 DESCRIPTION
188
189This module provides a Perl interface that allows writing bzip2
compressed data to files or buffers.
191
192For reading bzip2 files/buffers, see the companion module
193L<IO::Uncompress::Bunzip2|IO::Uncompress::Bunzip2>.
194
195=head1 Functional Interface
196
197A top-level function, C<bzip2>, is provided to carry out
198"one-shot" compression between buffers and/or files. For finer
199control over the compression process, see the L</"OO Interface">
200section.
201
202    use IO::Compress::Bzip2 qw(bzip2 $Bzip2Error) ;
203
204    bzip2 $input_filename_or_reference => $output_filename_or_reference [,OPTS]
205        or die "bzip2 failed: $Bzip2Error\n";
206
207The functional interface needs Perl5.005 or better.
208
209=head2 bzip2 $input_filename_or_reference => $output_filename_or_reference [, OPTS]
210
211C<bzip2> expects at least two parameters,
212C<$input_filename_or_reference> and C<$output_filename_or_reference>
213and zero or more optional parameters (see L</Optional Parameters>)
214
215=head3 The C<$input_filename_or_reference> parameter
216
217The parameter, C<$input_filename_or_reference>, is used to define the
218source of the uncompressed data.
219
220It can take one of the following forms:
221
222=over 5
223
224=item A filename
225
226If the C<$input_filename_or_reference> parameter is a simple scalar, it is
227assumed to be a filename. This file will be opened for reading and the
228input data will be read from it.
229
230=item A filehandle
231
232If the C<$input_filename_or_reference> parameter is a filehandle, the input
233data will be read from it.  The string '-' can be used as an alias for
234standard input.
235
236=item A scalar reference
237
238If C<$input_filename_or_reference> is a scalar reference, the input data
239will be read from C<$$input_filename_or_reference>.
240
241=item An array reference
242
243If C<$input_filename_or_reference> is an array reference, each element in
244the array must be a filename.
245
246The input data will be read from each file in turn.
247
248The complete array will be walked to ensure that it only
249contains valid filenames before any data is compressed.
250
251=item An Input FileGlob string
252
253If C<$input_filename_or_reference> is a string that is delimited by the
254characters "<" and ">" C<bzip2> will assume that it is an
255I<input fileglob string>. The input is the list of files that match the
256fileglob.
257
258See L<File::GlobMapper|File::GlobMapper> for more details.
259
260=back
261
262If the C<$input_filename_or_reference> parameter is any other type,
263C<undef> will be returned.
264
265=head3 The C<$output_filename_or_reference> parameter
266
267The parameter C<$output_filename_or_reference> is used to control the
268destination of the compressed data. This parameter can take one of
269these forms.
270
271=over 5
272
273=item A filename
274
275If the C<$output_filename_or_reference> parameter is a simple scalar, it is
276assumed to be a filename.  This file will be opened for writing and the
277compressed data will be written to it.
278
279=item A filehandle
280
281If the C<$output_filename_or_reference> parameter is a filehandle, the
282compressed data will be written to it.  The string '-' can be used as
283an alias for standard output.
284
285=item A scalar reference
286
287If C<$output_filename_or_reference> is a scalar reference, the
288compressed data will be stored in C<$$output_filename_or_reference>.
289
290=item An Array Reference
291
292If C<$output_filename_or_reference> is an array reference,
293the compressed data will be pushed onto the array.
294
295=item An Output FileGlob
296
297If C<$output_filename_or_reference> is a string that is delimited by the
298characters "<" and ">" C<bzip2> will assume that it is an
299I<output fileglob string>. The output is the list of files that match the
300fileglob.
301
When C<$output_filename_or_reference> is a fileglob string,
303C<$input_filename_or_reference> must also be a fileglob string. Anything
304else is an error.
305
306See L<File::GlobMapper|File::GlobMapper> for more details.
307
308=back
309
310If the C<$output_filename_or_reference> parameter is any other type,
311C<undef> will be returned.
312
313=head2 Notes
314
315When C<$input_filename_or_reference> maps to multiple files/buffers and
316C<$output_filename_or_reference> is a single
317file/buffer the input files/buffers will be stored
318in C<$output_filename_or_reference> as a concatenated series of compressed data streams.
319
320=head2 Optional Parameters
321
322The optional parameters for the one-shot function C<bzip2>
323are (for the most part) identical to those used with the OO interface defined in the
324L</"Constructor Options"> section. The exceptions are listed below
325
326=over 5
327
328=item C<< AutoClose => 0|1 >>
329
330This option applies to any input or output data streams to
331C<bzip2> that are filehandles.
332
333If C<AutoClose> is specified, and the value is true, it will result in all
334input and/or output filehandles being closed once C<bzip2> has
335completed.
336
337This parameter defaults to 0.
338
339=item C<< BinModeIn => 0|1 >>
340
341This option is now a no-op. All files will be read in binmode.
342
343=item C<< Append => 0|1 >>
344
345The behaviour of this option is dependent on the type of output data
346stream.
347
348=over 5
349
350=item * A Buffer
351
If C<Append> is enabled, all compressed data will be appended to the end of
353the output buffer. Otherwise the output buffer will be cleared before any
354compressed data is written to it.
355
356=item * A Filename
357
358If C<Append> is enabled, the file will be opened in append mode. Otherwise
359the contents of the file, if any, will be truncated before any compressed
360data is written to it.
361
362=item * A Filehandle
363
364If C<Append> is enabled, the filehandle will be positioned to the end of
365the file via a call to C<seek> before any compressed data is
366written to it.  Otherwise the file pointer will not be moved.
367
368=back
369
370When C<Append> is specified, and set to true, it will I<append> all compressed
371data to the output data stream.
372
373So when the output is a filehandle it will carry out a seek to the eof
374before writing any compressed data. If the output is a filename, it will be opened for
375appending. If the output is a buffer, all compressed data will be
376appended to the existing buffer.
377
378Conversely when C<Append> is not specified, or it is present and is set to
379false, it will operate as follows.
380
381When the output is a filename, it will truncate the contents of the file
382before writing any compressed data. If the output is a filehandle
383its position will not be changed. If the output is a buffer, it will be
384wiped before any compressed data is output.
385
386Defaults to 0.
387
388=back
389
390=head2 Examples
391
Here are a few examples that show the capabilities of the module.
393
394=head3 Streaming
395
396This very simple command line example demonstrates the streaming capabilities of the module.
397The code reads data from STDIN, compresses it, and writes the compressed data to STDOUT.
398
399    $ echo hello world | perl -MIO::Compress::Bzip2=bzip2 -e 'bzip2 \*STDIN => \*STDOUT' >output.bz2
400
The special filename "-" can be used as a stand-in for both C<\*STDIN> and C<\*STDOUT>,
402so the above can be rewritten as
403
404    $ echo hello world | perl -MIO::Compress::Bzip2=bzip2 -e 'bzip2 "-" => "-"' >output.bz2
405
406=head3 Compressing a file from the filesystem
407
408To read the contents of the file C<file1.txt> and write the compressed
409data to the file C<file1.txt.bz2>.
410
411    use strict ;
412    use warnings ;
413    use IO::Compress::Bzip2 qw(bzip2 $Bzip2Error) ;
414
415    my $input = "file1.txt";
416    bzip2 $input => "$input.bz2"
417        or die "bzip2 failed: $Bzip2Error\n";
418
419=head3 Reading from a Filehandle and writing to an in-memory buffer
420
421To read from an existing Perl filehandle, C<$input>, and write the
422compressed data to a buffer, C<$buffer>.
423
424    use strict ;
425    use warnings ;
426    use IO::Compress::Bzip2 qw(bzip2 $Bzip2Error) ;
427    use IO::File ;
428
429    my $input = IO::File->new( "<file1.txt" )
430        or die "Cannot open 'file1.txt': $!\n" ;
431    my $buffer ;
432    bzip2 $input => \$buffer
433        or die "bzip2 failed: $Bzip2Error\n";
434
435=head3 Compressing multiple files
436
437To compress all files in the directory "/my/home" that match "*.txt"
438and store the compressed data in the same directory
439
440    use strict ;
441    use warnings ;
442    use IO::Compress::Bzip2 qw(bzip2 $Bzip2Error) ;
443
444    bzip2 '</my/home/*.txt>' => '<*.bz2>'
445        or die "bzip2 failed: $Bzip2Error\n";
446
447and if you want to compress each file one at a time, this will do the trick
448
449    use strict ;
450    use warnings ;
451    use IO::Compress::Bzip2 qw(bzip2 $Bzip2Error) ;
452
453    for my $input ( glob "/my/home/*.txt" )
454    {
455        my $output = "$input.bz2" ;
456        bzip2 $input => $output
457            or die "Error compressing '$input': $Bzip2Error\n";
458    }
459
460=head1 OO Interface
461
462=head2 Constructor
463
464The format of the constructor for C<IO::Compress::Bzip2> is shown below
465
466    my $z = IO::Compress::Bzip2->new( $output [,OPTS] )
467        or die "IO::Compress::Bzip2 failed: $Bzip2Error\n";
468
469It returns an C<IO::Compress::Bzip2> object on success and undef on failure.
470The variable C<$Bzip2Error> will contain an error message on failure.
471
472If you are running Perl 5.005 or better the object, C<$z>, returned from
473IO::Compress::Bzip2 can be used exactly like an L<IO::File|IO::File> filehandle.
474This means that all normal output file operations can be carried out
475with C<$z>.
476For example, to write to a compressed file/buffer you can use either of
477these forms
478
479    $z->print("hello world\n");
480    print $z "hello world\n";
481
482The mandatory parameter C<$output> is used to control the destination
483of the compressed data. This parameter can take one of these forms.
484
485=over 5
486
487=item A filename
488
489If the C<$output> parameter is a simple scalar, it is assumed to be a
490filename. This file will be opened for writing and the compressed data
491will be written to it.
492
493=item A filehandle
494
495If the C<$output> parameter is a filehandle, the compressed data will be
496written to it.
497The string '-' can be used as an alias for standard output.
498
499=item A scalar reference
500
501If C<$output> is a scalar reference, the compressed data will be stored
502in C<$$output>.
503
504=back
505
506If the C<$output> parameter is any other type, C<IO::Compress::Bzip2>::new will
507return undef.
508
509=head2 Constructor Options
510
C<OPTS> is any combination of zero or more of the following options:
512
513=over 5
514
515=item C<< AutoClose => 0|1 >>
516
517This option is only valid when the C<$output> parameter is a filehandle. If
518specified, and the value is true, it will result in the C<$output> being
519closed once either the C<close> method is called or the C<IO::Compress::Bzip2>
520object is destroyed.
521
522This parameter defaults to 0.
523
524=item C<< Append => 0|1 >>
525
526Opens C<$output> in append mode.
527
528The behaviour of this option is dependent on the type of C<$output>.
529
530=over 5
531
532=item * A Buffer
533
534If C<$output> is a buffer and C<Append> is enabled, all compressed data
will be appended to the end of C<$output>. Otherwise C<$output> will be
536cleared before any data is written to it.
537
538=item * A Filename
539
540If C<$output> is a filename and C<Append> is enabled, the file will be
541opened in append mode. Otherwise the contents of the file, if any, will be
542truncated before any compressed data is written to it.
543
544=item * A Filehandle
545
If C<$output> is a filehandle and C<Append> is enabled, the file pointer
will be positioned to the end of the file via a call to C<seek> before any
compressed data is written to it.  Otherwise the file pointer will not be moved.
549
550=back
551
552This parameter defaults to 0.
553
554=item C<< BlockSize100K => number >>
555
556Specify the number of 100K blocks bzip2 uses during compression.
557
558Valid values are from 1 to 9, where 9 is best compression.
559
560The default is 1.
561
562=item C<< WorkFactor => number >>
563
564Specifies how much effort bzip2 should take before resorting to a slower
565fallback compression algorithm.
566
567Valid values range from 0 to 250, where 0 means use the default value 30.
568
569The default is 0.
570
571=item C<< Strict => 0|1 >>
572
573This is a placeholder option.
574
575=back
576
577=head2 Examples
578
579TODO
580
581=head1 Methods
582
583=head2 print
584
585Usage is
586
587    $z->print($data)
588    print $z $data
589
590Compresses and outputs the contents of the C<$data> parameter. This
591has the same behaviour as the C<print> built-in.
592
593Returns true if successful.
594
595=head2 printf
596
597Usage is
598
599    $z->printf($format, $data)
600    printf $z $format, $data
601
602Compresses and outputs the contents of the C<$data> parameter.
603
604Returns true if successful.
605
606=head2 syswrite
607
608Usage is
609
    $z->syswrite($data)
    $z->syswrite($data, $length)
    $z->syswrite($data, $length, $offset)
613
614Compresses and outputs the contents of the C<$data> parameter.
615
616Returns the number of uncompressed bytes written, or C<undef> if
617unsuccessful.
618
619=head2 write
620
621Usage is
622
    $z->write($data)
    $z->write($data, $length)
    $z->write($data, $length, $offset)
626
627Compresses and outputs the contents of the C<$data> parameter.
628
629Returns the number of uncompressed bytes written, or C<undef> if
630unsuccessful.
631
632=head2 flush
633
634Usage is
635
636    $z->flush;
637
638Flushes any pending compressed data to the output file/buffer.
639
640TODO
641
642Returns true on success.
643
644=head2 tell
645
646Usage is
647
648    $z->tell()
649    tell $z
650
651Returns the uncompressed file offset.
652
653=head2 eof
654
655Usage is
656
657    $z->eof();
658    eof($z);
659
660Returns true if the C<close> method has been called.
661
662=head2 seek
663
664    $z->seek($position, $whence);
665    seek($z, $position, $whence);
666
667Provides a sub-set of the C<seek> functionality, with the restriction
668that it is only legal to seek forward in the output file/buffer.
669It is a fatal error to attempt to seek backward.
670
671Empty parts of the file/buffer will have NULL (0x00) bytes written to them.
672
The C<$whence> parameter takes one of the usual values, namely SEEK_SET,
674SEEK_CUR or SEEK_END.
675
676Returns 1 on success, 0 on failure.
677
678=head2 binmode
679
680Usage is
681
682    $z->binmode
683    binmode $z ;
684
This is a no-op provided for completeness.
686
687=head2 opened
688
689    $z->opened()
690
Returns true if the object currently refers to an open file/buffer.
692
693=head2 autoflush
694
695    my $prev = $z->autoflush()
696    my $prev = $z->autoflush(EXPR)
697
698If the C<$z> object is associated with a file or a filehandle, this method
699returns the current autoflush setting for the underlying filehandle. If
700C<EXPR> is present, and is non-zero, it will enable flushing after every
701write/print operation.
702
703If C<$z> is associated with a buffer, this method has no effect and always
704returns C<undef>.
705
706B<Note> that the special variable C<$|> B<cannot> be used to set or
707retrieve the autoflush setting.
708
709=head2 input_line_number
710
711    $z->input_line_number()
712    $z->input_line_number(EXPR)
713
714This method always returns C<undef> when compressing.
715
716=head2 fileno
717
718    $z->fileno()
719    fileno($z)
720
721If the C<$z> object is associated with a file or a filehandle, C<fileno>
722will return the underlying file descriptor. Once the C<close> method is
723called C<fileno> will return C<undef>.
724
725If the C<$z> object is associated with a buffer, this method will return
726C<undef>.
727
728=head2 close
729
730    $z->close() ;
731    close $z ;
732
733Flushes any pending compressed data and then closes the output file/buffer.
734
735For most versions of Perl this method will be automatically invoked if
736the IO::Compress::Bzip2 object is destroyed (either explicitly or by the
737variable with the reference to the object going out of scope). The
738exceptions are Perl versions 5.005 through 5.00504 and 5.8.0. In
739these cases, the C<close> method will be called automatically, but
740not until global destruction of all live objects when the program is
741terminating.
742
743Therefore, if you want your scripts to be able to run on all versions
744of Perl, you should call C<close> explicitly and not rely on automatic
745closing.
746
747Returns true on success, otherwise 0.
748
749If the C<AutoClose> option has been enabled when the IO::Compress::Bzip2
750object was created, and the object is associated with a file, the
751underlying file will also be closed.
752
753=head2 newStream([OPTS])
754
755Usage is
756
757    $z->newStream( [OPTS] )
758
759Closes the current compressed data stream and starts a new one.
760
761OPTS consists of any of the options that are available when creating
762the C<$z> object.
763
764See the L</"Constructor Options"> section for more details.
765
766=head1 Importing
767
768No symbolic constants are required by IO::Compress::Bzip2 at present.
769
770=over 5
771
772=item :all
773
774Imports C<bzip2> and C<$Bzip2Error>.
775Same as doing this
776
777    use IO::Compress::Bzip2 qw(bzip2 $Bzip2Error) ;
778
779=back
780
781=head1 EXAMPLES
782
783=head2 Apache::GZip Revisited
784
785See L<IO::Compress::FAQ|IO::Compress::FAQ/"Apache::GZip Revisited">
786
787=head2 Working with Net::FTP
788
789See L<IO::Compress::FAQ|IO::Compress::FAQ/"Compressed files and Net::FTP">
790
791=head1 SUPPORT
792
793General feedback/questions/bug reports should be sent to
794L<https://github.com/pmqs/IO-Compress/issues> (preferred) or
795L<https://rt.cpan.org/Public/Dist/Display.html?Name=IO-Compress>.
796
797=head1 SEE ALSO
798
799L<Compress::Zlib>, L<IO::Compress::Gzip>, L<IO::Uncompress::Gunzip>, L<IO::Compress::Deflate>, L<IO::Uncompress::Inflate>, L<IO::Compress::RawDeflate>, L<IO::Uncompress::RawInflate>, L<IO::Uncompress::Bunzip2>, L<IO::Compress::Lzma>, L<IO::Uncompress::UnLzma>, L<IO::Compress::Xz>, L<IO::Uncompress::UnXz>, L<IO::Compress::Lzip>, L<IO::Uncompress::UnLzip>, L<IO::Compress::Lzop>, L<IO::Uncompress::UnLzop>, L<IO::Compress::Lzf>, L<IO::Uncompress::UnLzf>, L<IO::Compress::Zstd>, L<IO::Uncompress::UnZstd>, L<IO::Uncompress::AnyInflate>, L<IO::Uncompress::AnyUncompress>
800
801L<IO::Compress::FAQ|IO::Compress::FAQ>
802
803L<File::GlobMapper|File::GlobMapper>, L<Archive::Zip|Archive::Zip>,
804L<Archive::Tar|Archive::Tar>,
805L<IO::Zlib|IO::Zlib>
806
807The primary site for the bzip2 program is L<https://sourceware.org/bzip2/>.
808
809See the module L<Compress::Bzip2|Compress::Bzip2>
810
811=head1 AUTHOR
812
813This module was written by Paul Marquess, C<pmqs@cpan.org>.
814
815=head1 MODIFICATION HISTORY
816
817See the Changes file.
818
819=head1 COPYRIGHT AND LICENSE
820
821Copyright (c) 2005-2022 Paul Marquess. All rights reserved.
822
823This program is free software; you can redistribute it and/or
824modify it under the same terms as Perl itself.
825