
package IO::Compress::Gzip ;

# Writer for RFC 1952 (gzip) streams.  This package supplies the
# gzip-specific option table, the option validation and the header/trailer
# layout; the remaining behaviour comes from the classes listed in @ISA.

require 5.004 ;

use strict ;
use warnings;
use bytes;


use IO::Compress::RawDeflate 2.024 ;

use Compress::Raw::Zlib 2.024 ;
use IO::Compress::Base::Common 2.024 qw(:Status :Parse createSelfTiedObject);
use IO::Compress::Gzip::Constants 2.024 ;
use IO::Compress::Zlib::Extra 2.024 ;

BEGIN
{
    # noUTF8() is utf8::downgrade when this perl defines it, and a no-op
    # otherwise.
    if (defined &utf8::downgrade )
      { *noUTF8 = \&utf8::downgrade }
    else
      { *noUTF8 = sub {} }
}

require Exporter ;

our ($VERSION, @ISA, @EXPORT_OK, %EXPORT_TAGS, $GzipError);

$VERSION = '2.024';
$GzipError = '' ;

@ISA = qw(Exporter IO::Compress::RawDeflate);
@EXPORT_OK = qw( $GzipError gzip ) ;

# Start from the export tags published by RawDeflate, then make gzip() and
# $GzipError part of ':all'.
%EXPORT_TAGS = %IO::Compress::RawDeflate::DEFLATE_CONSTANTS ;
push @{ $EXPORT_TAGS{all} }, @EXPORT_OK ;
Exporter::export_ok_tags('all');

# Constructor:  IO::Compress::Gzip->new($output [, OPTS])
#
# Builds the tied object (wired to report errors through $GzipError) and
# returns whatever the inherited _create() returns for the caller's
# arguments.
sub new
{
    my $class = shift ;

    my $obj = createSelfTiedObject($class, \$GzipError);

    return $obj->_create(undef, @_);
}


# Functional interface:  gzip $input => $output [, OPTS]
#
# Uses a throw-away object and returns the result of the inherited _def().
sub gzip
{
    my $obj = createSelfTiedObject(undef, \$GzipError);
    return $obj->_def(@_);
}

#sub newHeader
#{
#    my $self = shift ;
#    #return GZIP_MINIMUM_HEADER ;
#    return $self->mkHeader(*$self->{Got});
#}

# Returns the option specification list for this class: the zlib options
# from getZlibParams() followed by one entry per gzip header field.
# NOTE(review): the layout of each four-element spec is defined by the
# option parser in IO::Compress::Base::Common (not visible here); the last
# element looks like the default value -- confirm before relying on it.
sub getExtraParams
{
    my $self = shift ;

    return (
            # zlib behaviour
            $self->getZlibParams(),

            # Gzip header fields
            'Minimal'   => [0, 1, Parse_boolean,   0],
            'Comment'   => [0, 1, Parse_any,       undef],
            'Name'      => [0, 1, Parse_any,       undef],
            'Time'      => [0, 1, Parse_any,       undef],
            'TextFlag'  => [0, 1, Parse_boolean,   0],
            'HeaderCRC' => [0, 1, Parse_boolean,   0],
            'OS_Code'   => [0, 1, Parse_unsigned,  $Compress::Raw::Zlib::gzip_os_code],
            'ExtraField'=> [0, 1, Parse_any,       undef],
            'ExtraFlags'=> [0, 1, Parse_any,       undef],

        );
}


# Validates and normalises the parsed options in $got.
#
# Returns 1 on success.  On a validation failure it returns the result of
# saveErrorString(undef, $message, ...), i.e. the error text is recorded
# and the caller sees the first argument passed to saveErrorString.
#
# Side effects on $got: CRC32 is always switched on; unless Merge is set,
# Time defaults to the current time, Method is forced to Z_DEFLATED,
# ExtraFlags gets a Level-derived default and ExtraField is replaced by
# the value left in $data after parseExtraField() has processed it.
sub ckParams
{
    my $self = shift ;
    my $got = shift ;

    # gzip always needs crc32
    $got->value('CRC32' => 1);

    # When merging, none of the header options below are examined.
    return 1
        if $got->value('Merge') ;

    my $strict = $got->value('Strict') ;

    if (! $got->parsed('Time') ) {
        # Modification time defaults to now.
        $got->value('Time' => time) ;
    }

    # Check that the Name & Comment don't have embedded NULLs
    # Also check that they only contain ISO 8859-1 chars.
    # Both checks are only enforced when Strict is on.
    if ($got->parsed('Name') && defined $got->value('Name')) {
        my $name = $got->value('Name');

        return $self->saveErrorString(undef, "Null Character found in Name",
                                      Z_DATA_ERROR)
            if $strict && $name =~ /\x00/ ;

        return $self->saveErrorString(undef, "Non ISO 8859-1 Character found in Name",
                                      Z_DATA_ERROR)
            if $strict && $name =~ /$GZIP_FNAME_INVALID_CHAR_RE/o ;
    }

    if ($got->parsed('Comment') && defined $got->value('Comment')) {
        my $comment = $got->value('Comment');

        return $self->saveErrorString(undef, "Null Character found in Comment",
                                      Z_DATA_ERROR)
            if $strict && $comment =~ /\x00/ ;

        return $self->saveErrorString(undef, "Non ISO 8859-1 Character found in Comment",
                                      Z_DATA_ERROR)
            if $strict && $comment =~ /$GZIP_FCOMMENT_INVALID_CHAR_RE/o;
    }

    # The OS field is a single byte in the packed header (see mkHeader).
    if ($got->parsed('OS_Code') ) {
        my $value = $got->value('OS_Code');

        return $self->saveErrorString(undef, "OS_Code must be between 0 and 255, got '$value'")
            if $value < 0 || $value > 255 ;
    }

    # gzip only supports Deflate at present
    $got->value('Method' => Z_DEFLATED) ;

    # Default XFL from the compression level.  RFC 1952 assigns
    # XFL = 2 to "maximum compression, slowest algorithm" and
    # XFL = 4 to "fastest algorithm"; the two values used to be swapped
    # here.
    # NOTE: the ExtraFlags entry in this module's POD still lists the old
    # (swapped) pairing and needs the matching correction.
    if ( ! $got->parsed('ExtraFlags')) {
        $got->value('ExtraFlags' => 2)
            if $got->value('Level') == Z_BEST_COMPRESSION ;
        $got->value('ExtraFlags' => 4)
            if $got->value('Level') == Z_BEST_SPEED ;
    }

    my $data = $got->value('ExtraField') ;
    if (defined $data) {
        # parseExtraField() returns an error description on failure; on
        # success the (possibly rewritten) $data is stored back.
        my $bad = IO::Compress::Zlib::Extra::parseExtraField($data, $strict, 1) ;
        return $self->saveErrorString(undef, "Error with ExtraField Parameter: $bad", Z_DATA_ERROR)
            if $bad ;

        $got->value('ExtraField', $data) ;
    }

    return 1;
}

# Returns the 8-byte gzip trailer: two little-endian 32-bit values, the
# CRC32 reported by the compressor object followed by the 32-bit
# uncompressed-size counter.
sub mkTrailer
{
    my $self = shift ;
    return pack("V V", *$self->{Compress}->crc32(),
                       *$self->{UnCompSize}->get32bit());
}

# Returns the name of the matching decompression class and a reference to
# that class's error variable.
sub getInverseClass
{
    return ('IO::Uncompress::Gunzip',
                \$IO::Uncompress::Gunzip::GunzipError);
}

# Fills in Name and Time from an input file when the caller did not supply
# them: Name becomes $filename, Time becomes the file's mtime (element 9
# of stat).  $params is the parsed-options object; nothing useful is
# returned.
sub getFileInfo
{
    my $self = shift ;
    my $params = shift;
    my $filename = shift ;

    my $defaultTime = (stat($filename))[9] ;

    $params->value('Name' => $filename)
        if ! $params->parsed('Name') ;

    $params->value('Time' => $defaultTime)
        if ! $params->parsed('Time') ;
}


# Builds and returns the gzip header as a byte string.
#
# $param is the parsed-options object.  When Minimal is set the constant
# GZIP_MINIMUM_HEADER is returned untouched.  Otherwise the fixed 10-byte
# part is packed first and the optional EXTRA, NAME, COMMENT and header
# CRC fields are appended in that order.
sub mkHeader
{
    my $self = shift ;
    my $param = shift ;

    # short-circuit if a minimal header is requested.
    return GZIP_MINIMUM_HEADER if $param->value('Minimal') ;

    # NAME and COMMENT are stored as NUL-terminated strings, so nothing
    # from the first embedded NUL onwards can be represented.  The /s
    # modifier and \z make the truncation work even when newlines follow
    # the NUL; without them such a value kept its NUL and corrupted the
    # header.  The terminator is then always appended exactly once.
    my $asCString = sub {
        my $text = shift ;
        $text =~ s/\x00.*\z//s ;
        return $text . GZIP_NULL_BYTE ;
    };

    # METHOD
    my $method = $param->valueOrDefault('Method', GZIP_CM_DEFLATED) ;

    # FLAGS
    my $flags       = GZIP_FLG_DEFAULT ;
    $flags |= GZIP_FLG_FTEXT    if $param->value('TextFlag') ;
    $flags |= GZIP_FLG_FHCRC    if $param->value('HeaderCRC') ;
    $flags |= GZIP_FLG_FEXTRA   if $param->wantValue('ExtraField') ;
    $flags |= GZIP_FLG_FNAME    if $param->wantValue('Name') ;
    $flags |= GZIP_FLG_FCOMMENT if $param->wantValue('Comment') ;

    # MTIME
    my $time = $param->valueOrDefault('Time', GZIP_MTIME_DEFAULT) ;

    # EXTRA FLAGS
    my $extra_flags = $param->valueOrDefault('ExtraFlags', GZIP_XFL_DEFAULT);

    # OS CODE
    my $os_code = $param->valueOrDefault('OS_Code', GZIP_OS_DEFAULT) ;


    # Fixed part: four single bytes, a little-endian 32-bit mtime, then
    # two more single bytes.
    my $out = pack("C4 V C C",
            GZIP_ID1,       # ID1
            GZIP_ID2,       # ID2
            $method,        # Compression Method
            $flags,         # Flags
            $time,          # Modification Time
            $extra_flags,   # Extra Flags
            $os_code,       # Operating System Code
            ) ;

    # EXTRA -- little-endian 16-bit length followed by the raw data
    if ($flags & GZIP_FLG_FEXTRA) {
        my $extra = $param->value('ExtraField') ;
        $out .= pack("v", length $extra) . $extra ;
    }

    # NAME
    $out .= $asCString->( $param->value('Name') )
        if $flags & GZIP_FLG_FNAME ;

    # COMMENT
    $out .= $asCString->( $param->value('Comment') )
        if $flags & GZIP_FLG_FCOMMENT ;

    # HEADER CRC
    # NOTE(review): RFC 1952 defines CRC16 as the two least-significant
    # bytes of the CRC32 of the header, which would be a 0xFFFF mask; this
    # mask keeps only the low byte.  Left unchanged here because the
    # reader's check lives outside this file -- confirm how
    # IO::Uncompress::Gunzip validates the field and change both together.
    $out .= pack("v", crc32($out) & 0x00FF ) if $param->value('HeaderCRC') ;

    noUTF8($out);

    return $out ;
}

# gzip has nothing to write after the per-stream trailer.
sub mkFinalTrailer
{
    return '';
}

1;

__END__

=head1 NAME

IO::Compress::Gzip - Write RFC 1952 files/buffers



=head1 SYNOPSIS

    use IO::Compress::Gzip qw(gzip $GzipError) ;

    my $status = gzip $input => $output [,OPTS]
        or die "gzip failed: $GzipError\n";

    my $z = new IO::Compress::Gzip $output [,OPTS]
        or die "gzip failed: $GzipError\n";

    $z->print($string);
    $z->printf($format, $string);
    $z->write($string);
    $z->syswrite($string [, $length, $offset]);
    $z->flush();
    $z->tell();
    $z->eof();
    $z->seek($position, $whence);
    $z->binmode();
    $z->fileno();
    $z->opened();
    $z->autoflush();
    $z->input_line_number();
    $z->newStream( [OPTS] );

    $z->deflateParams();

    $z->close() ;

    $GzipError ;

    # IO::File mode

    print $z $string;
    printf $z $format, $string;
    tell $z
    eof $z
    seek $z, $position, $whence
    binmode $z
    fileno $z
    close $z ;


=head1 DESCRIPTION

This module provides a Perl interface that allows writing compressed
data to files or buffer as defined in RFC 1952.

All the gzip headers defined in RFC 1952 can be created using
this module.

For reading RFC 1952 files/buffers, see the companion module
L<IO::Uncompress::Gunzip|IO::Uncompress::Gunzip>.

=head1 Functional Interface

A top-level function, C<gzip>, is provided to carry out
"one-shot" compression between buffers and/or files. For finer
control over the compression process, see the L</"OO Interface">
section.
341 342 use IO::Compress::Gzip qw(gzip $GzipError) ; 343 344 gzip $input => $output [,OPTS] 345 or die "gzip failed: $GzipError\n"; 346 347The functional interface needs Perl5.005 or better. 348 349=head2 gzip $input => $output [, OPTS] 350 351C<gzip> expects at least two parameters, C<$input> and C<$output>. 352 353=head3 The C<$input> parameter 354 355The parameter, C<$input>, is used to define the source of 356the uncompressed data. 357 358It can take one of the following forms: 359 360=over 5 361 362=item A filename 363 364If the C<$input> parameter is a simple scalar, it is assumed to be a 365filename. This file will be opened for reading and the input data 366will be read from it. 367 368=item A filehandle 369 370If the C<$input> parameter is a filehandle, the input data will be 371read from it. 372The string '-' can be used as an alias for standard input. 373 374=item A scalar reference 375 376If C<$input> is a scalar reference, the input data will be read 377from C<$$input>. 378 379=item An array reference 380 381If C<$input> is an array reference, each element in the array must be a 382filename. 383 384The input data will be read from each file in turn. 385 386The complete array will be walked to ensure that it only 387contains valid filenames before any data is compressed. 388 389=item An Input FileGlob string 390 391If C<$input> is a string that is delimited by the characters "<" and ">" 392C<gzip> will assume that it is an I<input fileglob string>. The 393input is the list of files that match the fileglob. 394 395If the fileglob does not match any files ... 396 397See L<File::GlobMapper|File::GlobMapper> for more details. 398 399=back 400 401If the C<$input> parameter is any other type, C<undef> will be returned. 402 403In addition, if C<$input> is a simple filename, the default values for 404the C<Name> and C<Time> options will be sourced from that file. 
405 406If you do not want to use these defaults they can be overridden by 407explicitly setting the C<Name> and C<Time> options or by setting the 408C<Minimal> parameter. 409 410=head3 The C<$output> parameter 411 412The parameter C<$output> is used to control the destination of the 413compressed data. This parameter can take one of these forms. 414 415=over 5 416 417=item A filename 418 419If the C<$output> parameter is a simple scalar, it is assumed to be a 420filename. This file will be opened for writing and the compressed 421data will be written to it. 422 423=item A filehandle 424 425If the C<$output> parameter is a filehandle, the compressed data 426will be written to it. 427The string '-' can be used as an alias for standard output. 428 429=item A scalar reference 430 431If C<$output> is a scalar reference, the compressed data will be 432stored in C<$$output>. 433 434=item An Array Reference 435 436If C<$output> is an array reference, the compressed data will be 437pushed onto the array. 438 439=item An Output FileGlob 440 441If C<$output> is a string that is delimited by the characters "<" and ">" 442C<gzip> will assume that it is an I<output fileglob string>. The 443output is the list of files that match the fileglob. 444 445When C<$output> is an fileglob string, C<$input> must also be a fileglob 446string. Anything else is an error. 447 448=back 449 450If the C<$output> parameter is any other type, C<undef> will be returned. 451 452=head2 Notes 453 454When C<$input> maps to multiple files/buffers and C<$output> is a single 455file/buffer the input files/buffers will be stored 456in C<$output> as a concatenated series of compressed data streams. 457 458=head2 Optional Parameters 459 460Unless specified below, the optional parameters for C<gzip>, 461C<OPTS>, are the same as those used with the OO interface defined in the 462L</"Constructor Options"> section below. 
463 464=over 5 465 466=item C<< AutoClose => 0|1 >> 467 468This option applies to any input or output data streams to 469C<gzip> that are filehandles. 470 471If C<AutoClose> is specified, and the value is true, it will result in all 472input and/or output filehandles being closed once C<gzip> has 473completed. 474 475This parameter defaults to 0. 476 477=item C<< BinModeIn => 0|1 >> 478 479When reading from a file or filehandle, set C<binmode> before reading. 480 481Defaults to 0. 482 483=item C<< Append => 0|1 >> 484 485The behaviour of this option is dependent on the type of output data 486stream. 487 488=over 5 489 490=item * A Buffer 491 492If C<Append> is enabled, all compressed data will be appended to the end of 493the output buffer. Otherwise the output buffer will be cleared before any 494compressed data is written to it. 495 496=item * A Filename 497 498If C<Append> is enabled, the file will be opened in append mode. Otherwise 499the contents of the file, if any, will be truncated before any compressed 500data is written to it. 501 502=item * A Filehandle 503 504If C<Append> is enabled, the filehandle will be positioned to the end of 505the file via a call to C<seek> before any compressed data is 506written to it. Otherwise the file pointer will not be moved. 507 508=back 509 510When C<Append> is specified, and set to true, it will I<append> all compressed 511data to the output data stream. 512 513So when the output is a filehandle it will carry out a seek to the eof 514before writing any compressed data. If the output is a filename, it will be opened for 515appending. If the output is a buffer, all compressed data will be appended to 516the existing buffer. 517 518Conversely when C<Append> is not specified, or it is present and is set to 519false, it will operate as follows. 520 521When the output is a filename, it will truncate the contents of the file 522before writing any compressed data. If the output is a filehandle 523its position will not be changed. 
If the output is a buffer, it will be 524wiped before any compressed data is output. 525 526Defaults to 0. 527 528=back 529 530=head2 Examples 531 532To read the contents of the file C<file1.txt> and write the compressed 533data to the file C<file1.txt.gz>. 534 535 use strict ; 536 use warnings ; 537 use IO::Compress::Gzip qw(gzip $GzipError) ; 538 539 my $input = "file1.txt"; 540 gzip $input => "$input.gz" 541 or die "gzip failed: $GzipError\n"; 542 543To read from an existing Perl filehandle, C<$input>, and write the 544compressed data to a buffer, C<$buffer>. 545 546 use strict ; 547 use warnings ; 548 use IO::Compress::Gzip qw(gzip $GzipError) ; 549 use IO::File ; 550 551 my $input = new IO::File "<file1.txt" 552 or die "Cannot open 'file1.txt': $!\n" ; 553 my $buffer ; 554 gzip $input => \$buffer 555 or die "gzip failed: $GzipError\n"; 556 557To compress all files in the directory "/my/home" that match "*.txt" 558and store the compressed data in the same directory 559 560 use strict ; 561 use warnings ; 562 use IO::Compress::Gzip qw(gzip $GzipError) ; 563 564 gzip '</my/home/*.txt>' => '<*.gz>' 565 or die "gzip failed: $GzipError\n"; 566 567and if you want to compress each file one at a time, this will do the trick 568 569 use strict ; 570 use warnings ; 571 use IO::Compress::Gzip qw(gzip $GzipError) ; 572 573 for my $input ( glob "/my/home/*.txt" ) 574 { 575 my $output = "$input.gz" ; 576 gzip $input => $output 577 or die "Error compressing '$input': $GzipError\n"; 578 } 579 580=head1 OO Interface 581 582=head2 Constructor 583 584The format of the constructor for C<IO::Compress::Gzip> is shown below 585 586 my $z = new IO::Compress::Gzip $output [,OPTS] 587 or die "IO::Compress::Gzip failed: $GzipError\n"; 588 589It returns an C<IO::Compress::Gzip> object on success and undef on failure. 590The variable C<$GzipError> will contain an error message on failure. 
591 592If you are running Perl 5.005 or better the object, C<$z>, returned from 593IO::Compress::Gzip can be used exactly like an L<IO::File|IO::File> filehandle. 594This means that all normal output file operations can be carried out 595with C<$z>. 596For example, to write to a compressed file/buffer you can use either of 597these forms 598 599 $z->print("hello world\n"); 600 print $z "hello world\n"; 601 602The mandatory parameter C<$output> is used to control the destination 603of the compressed data. This parameter can take one of these forms. 604 605=over 5 606 607=item A filename 608 609If the C<$output> parameter is a simple scalar, it is assumed to be a 610filename. This file will be opened for writing and the compressed data 611will be written to it. 612 613=item A filehandle 614 615If the C<$output> parameter is a filehandle, the compressed data will be 616written to it. 617The string '-' can be used as an alias for standard output. 618 619=item A scalar reference 620 621If C<$output> is a scalar reference, the compressed data will be stored 622in C<$$output>. 623 624=back 625 626If the C<$output> parameter is any other type, C<IO::Compress::Gzip>::new will 627return undef. 628 629=head2 Constructor Options 630 631C<OPTS> is any combination of the following options: 632 633=over 5 634 635=item C<< AutoClose => 0|1 >> 636 637This option is only valid when the C<$output> parameter is a filehandle. If 638specified, and the value is true, it will result in the C<$output> being 639closed once either the C<close> method is called or the C<IO::Compress::Gzip> 640object is destroyed. 641 642This parameter defaults to 0. 643 644=item C<< Append => 0|1 >> 645 646Opens C<$output> in append mode. 647 648The behaviour of this option is dependent on the type of C<$output>. 649 650=over 5 651 652=item * A Buffer 653 654If C<$output> is a buffer and C<Append> is enabled, all compressed data 655will be append to the end of C<$output>. 
Otherwise C<$output> will be 656cleared before any data is written to it. 657 658=item * A Filename 659 660If C<$output> is a filename and C<Append> is enabled, the file will be 661opened in append mode. Otherwise the contents of the file, if any, will be 662truncated before any compressed data is written to it. 663 664=item * A Filehandle 665 666If C<$output> is a filehandle, the file pointer will be positioned to the 667end of the file via a call to C<seek> before any compressed data is written 668to it. Otherwise the file pointer will not be moved. 669 670=back 671 672This parameter defaults to 0. 673 674=item C<< Merge => 0|1 >> 675 676This option is used to compress input data and append it to an existing 677compressed data stream in C<$output>. The end result is a single compressed 678data stream stored in C<$output>. 679 680It is a fatal error to attempt to use this option when C<$output> is not an 681RFC 1952 data stream. 682 683There are a number of other limitations with the C<Merge> option: 684 685=over 5 686 687=item 1 688 689This module needs to have been built with zlib 1.2.1 or better to work. A 690fatal error will be thrown if C<Merge> is used with an older version of 691zlib. 692 693=item 2 694 695If C<$output> is a file or a filehandle, it must be seekable. 696 697=back 698 699This parameter defaults to 0. 700 701=item -Level 702 703Defines the compression level used by zlib. The value should either be 704a number between 0 and 9 (0 means no compression and 9 is maximum 705compression), or one of the symbolic constants defined below. 706 707 Z_NO_COMPRESSION 708 Z_BEST_SPEED 709 Z_BEST_COMPRESSION 710 Z_DEFAULT_COMPRESSION 711 712The default is Z_DEFAULT_COMPRESSION. 713 714Note, these constants are not imported by C<IO::Compress::Gzip> by default. 
715 716 use IO::Compress::Gzip qw(:strategy); 717 use IO::Compress::Gzip qw(:constants); 718 use IO::Compress::Gzip qw(:all); 719 720=item -Strategy 721 722Defines the strategy used to tune the compression. Use one of the symbolic 723constants defined below. 724 725 Z_FILTERED 726 Z_HUFFMAN_ONLY 727 Z_RLE 728 Z_FIXED 729 Z_DEFAULT_STRATEGY 730 731The default is Z_DEFAULT_STRATEGY. 732 733=item C<< Minimal => 0|1 >> 734 735If specified, this option will force the creation of the smallest possible 736compliant gzip header (which is exactly 10 bytes long) as defined in 737RFC 1952. 738 739See the section titled "Compliance" in RFC 1952 for a definition 740of the values used for the fields in the gzip header. 741 742All other parameters that control the content of the gzip header will 743be ignored if this parameter is set to 1. 744 745This parameter defaults to 0. 746 747=item C<< Comment => $comment >> 748 749Stores the contents of C<$comment> in the COMMENT field in 750the gzip header. 751By default, no comment field is written to the gzip file. 752 753If the C<-Strict> option is enabled, the comment can only consist of ISO 7548859-1 characters plus line feed. 755 756If the C<-Strict> option is disabled, the comment field can contain any 757character except NULL. If any null characters are present, the field 758will be truncated at the first NULL. 759 760=item C<< Name => $string >> 761 762Stores the contents of C<$string> in the gzip NAME header field. If 763C<Name> is not specified, no gzip NAME field will be created. 764 765If the C<-Strict> option is enabled, C<$string> can only consist of ISO 7668859-1 characters. 767 768If C<-Strict> is disabled, then C<$string> can contain any character 769except NULL. If any null characters are present, the field will be 770truncated at the first NULL. 771 772=item C<< Time => $number >> 773 774Sets the MTIME field in the gzip header to $number. 
775 776This field defaults to the time the C<IO::Compress::Gzip> object was created 777if this option is not specified. 778 779=item C<< TextFlag => 0|1 >> 780 781This parameter controls the setting of the FLG.FTEXT bit in the gzip 782header. It is used to signal that the data stored in the gzip file/buffer 783is probably text. 784 785The default is 0. 786 787=item C<< HeaderCRC => 0|1 >> 788 789When true this parameter will set the FLG.FHCRC bit to 1 in the gzip header 790and set the CRC16 header field to the CRC of the complete gzip header 791except the CRC16 field itself. 792 793B<Note> that gzip files created with the C<HeaderCRC> flag set to 1 cannot 794be read by most, if not all, of the standard gunzip utilities, most 795notably gzip version 1.2.4. You should therefore avoid using this option if 796you want to maximize the portability of your gzip files. 797 798This parameter defaults to 0. 799 800=item C<< OS_Code => $value >> 801 802Stores C<$value> in the gzip OS header field. A number between 0 and 255 is 803valid. 804 805If not specified, this parameter defaults to the OS code of the Operating 806System this module was built on. The value 3 is used as a catch-all for all 807Unix variants and unknown Operating Systems. 808 809=item C<< ExtraField => $data >> 810 811This parameter allows additional metadata to be stored in the ExtraField in 812the gzip header. An RFC 1952 compliant ExtraField consists of zero or more 813subfields. Each subfield consists of a two byte header followed by the 814subfield data. 815 816The list of subfields can be supplied in any of the following formats 817 818 -ExtraField => [$id1, $data1, 819 $id2, $data2, 820 ... 821 ] 822 -ExtraField => [ [$id1 => $data1], 823 [$id2 => $data2], 824 ... 825 ] 826 -ExtraField => { $id1 => $data1, 827 $id2 => $data2, 828 ... 829 } 830 831Where C<$id1>, C<$id2> are two byte subfield ID's. The second byte of 832the ID cannot be 0, unless the C<Strict> option has been disabled. 
833 834If you use the hash syntax, you have no control over the order in which 835the ExtraSubFields are stored, plus you cannot have SubFields with 836duplicate ID. 837 838Alternatively the list of subfields can be supplied as a scalar, thus 839 840 -ExtraField => $rawdata 841 842If you use the raw format, and the C<Strict> option is enabled, 843C<IO::Compress::Gzip> will check that C<$rawdata> consists of zero or more 844conformant sub-fields. When C<Strict> is disabled, C<$rawdata> can 845consist of any arbitrary byte stream. 846 847The maximum size of the Extra Field is 65535 bytes. 848 849=item C<< ExtraFlags => $value >> 850 851Sets the XFL byte in the gzip header to C<$value>. 852 853If this option is not present, the value stored in XFL field will be 854determined by the setting of the C<Level> option. 855 856If C<< Level => Z_BEST_SPEED >> has been specified then XFL is set to 2. 857If C<< Level => Z_BEST_COMPRESSION >> has been specified then XFL is set to 4. 858Otherwise XFL is set to 0. 859 860=item C<< Strict => 0|1 >> 861 862C<Strict> will optionally police the values supplied with other options 863to ensure they are compliant with RFC1952. 864 865This option is enabled by default. 866 867If C<Strict> is enabled the following behaviour will be policed: 868 869=over 5 870 871=item * 872 873The value supplied with the C<Name> option can only contain ISO 8859-1 874characters. 875 876=item * 877 878The value supplied with the C<Comment> option can only contain ISO 8859-1 879characters plus line-feed. 880 881=item * 882 883The values supplied with the C<-Name> and C<-Comment> options cannot 884contain multiple embedded nulls. 885 886=item * 887 888If an C<ExtraField> option is specified and it is a simple scalar, 889it must conform to the sub-field structure as defined in RFC 1952. 
890 891=item * 892 893If an C<ExtraField> option is specified the second byte of the ID will be 894checked in each subfield to ensure that it does not contain the reserved 895value 0x00. 896 897=back 898 899When C<Strict> is disabled the following behaviour will be policed: 900 901=over 5 902 903=item * 904 905The value supplied with C<-Name> option can contain 906any character except NULL. 907 908=item * 909 910The value supplied with C<-Comment> option can contain any character 911except NULL. 912 913=item * 914 915The values supplied with the C<-Name> and C<-Comment> options can contain 916multiple embedded nulls. The string written to the gzip header will 917consist of the characters up to, but not including, the first embedded 918NULL. 919 920=item * 921 922If an C<ExtraField> option is specified and it is a simple scalar, the 923structure will not be checked. The only error is if the length is too big. 924 925=item * 926 927The ID header in an C<ExtraField> sub-field can consist of any two bytes. 928 929=back 930 931=back 932 933=head2 Examples 934 935TODO 936 937=head1 Methods 938 939=head2 print 940 941Usage is 942 943 $z->print($data) 944 print $z $data 945 946Compresses and outputs the contents of the C<$data> parameter. This 947has the same behaviour as the C<print> built-in. 948 949Returns true if successful. 950 951=head2 printf 952 953Usage is 954 955 $z->printf($format, $data) 956 printf $z $format, $data 957 958Compresses and outputs the contents of the C<$data> parameter. 959 960Returns true if successful. 961 962=head2 syswrite 963 964Usage is 965 966 $z->syswrite $data 967 $z->syswrite $data, $length 968 $z->syswrite $data, $length, $offset 969 970Compresses and outputs the contents of the C<$data> parameter. 971 972Returns the number of uncompressed bytes written, or C<undef> if 973unsuccessful. 
974 975=head2 write 976 977Usage is 978 979 $z->write $data 980 $z->write $data, $length 981 $z->write $data, $length, $offset 982 983Compresses and outputs the contents of the C<$data> parameter. 984 985Returns the number of uncompressed bytes written, or C<undef> if 986unsuccessful. 987 988=head2 flush 989 990Usage is 991 992 $z->flush; 993 $z->flush($flush_type); 994 995Flushes any pending compressed data to the output file/buffer. 996 997This method takes an optional parameter, C<$flush_type>, that controls 998how the flushing will be carried out. By default the C<$flush_type> 999used is C<Z_FINISH>. Other valid values for C<$flush_type> are 1000C<Z_NO_FLUSH>, C<Z_SYNC_FLUSH>, C<Z_FULL_FLUSH> and C<Z_BLOCK>. It is 1001strongly recommended that you only set the C<flush_type> parameter if 1002you fully understand the implications of what it does - overuse of C<flush> 1003can seriously degrade the level of compression achieved. See the C<zlib> 1004documentation for details. 1005 1006Returns true on success. 1007 1008=head2 tell 1009 1010Usage is 1011 1012 $z->tell() 1013 tell $z 1014 1015Returns the uncompressed file offset. 1016 1017=head2 eof 1018 1019Usage is 1020 1021 $z->eof(); 1022 eof($z); 1023 1024Returns true if the C<close> method has been called. 1025 1026=head2 seek 1027 1028 $z->seek($position, $whence); 1029 seek($z, $position, $whence); 1030 1031Provides a sub-set of the C<seek> functionality, with the restriction 1032that it is only legal to seek forward in the output file/buffer. 1033It is a fatal error to attempt to seek backward. 1034 1035Empty parts of the file/buffer will have NULL (0x00) bytes written to them. 1036 1037The C<$whence> parameter takes one of the usual values, namely SEEK_SET, 1038SEEK_CUR or SEEK_END. 1039 1040Returns 1 on success, 0 on failure. 1041 1042=head2 binmode 1043 1044Usage is 1045 1046 $z->binmode 1047 binmode $z ; 1048 1049This is a noop provided for completeness. 
1050 1051=head2 opened 1052 1053 $z->opened() 1054 1055Returns true if the object currently refers to an opened file/buffer. 1056 1057=head2 autoflush 1058 1059 my $prev = $z->autoflush() 1060 my $prev = $z->autoflush(EXPR) 1061 1062If the C<$z> object is associated with a file or a filehandle, this method 1063returns the current autoflush setting for the underlying filehandle. If 1064C<EXPR> is present, and is non-zero, it will enable flushing after every 1065write/print operation. 1066 1067If C<$z> is associated with a buffer, this method has no effect and always 1068returns C<undef>. 1069 1070B<Note> that the special variable C<$|> B<cannot> be used to set or 1071retrieve the autoflush setting. 1072 1073=head2 input_line_number 1074 1075 $z->input_line_number() 1076 $z->input_line_number(EXPR) 1077 1078This method always returns C<undef> when compressing. 1079 1080=head2 fileno 1081 1082 $z->fileno() 1083 fileno($z) 1084 1085If the C<$z> object is associated with a file or a filehandle, C<fileno> 1086will return the underlying file descriptor. Once the C<close> method is 1087called C<fileno> will return C<undef>. 1088 1089If the C<$z> object is associated with a buffer, this method will return 1090C<undef>. 1091 1092=head2 close 1093 1094 $z->close() ; 1095 close $z ; 1096 1097Flushes any pending compressed data and then closes the output file/buffer. 1098 1099For most versions of Perl this method will be automatically invoked if 1100the IO::Compress::Gzip object is destroyed (either explicitly or by the 1101variable with the reference to the object going out of scope). The 1102exceptions are Perl versions 5.005 through 5.00504 and 5.8.0. In 1103these cases, the C<close> method will be called automatically, but 1104not until global destruction of all live objects when the program is 1105terminating. 
1106 1107Therefore, if you want your scripts to be able to run on all versions 1108of Perl, you should call C<close> explicitly and not rely on automatic 1109closing. 1110 1111Returns true on success, otherwise 0. 1112 1113If the C<AutoClose> option has been enabled when the IO::Compress::Gzip 1114object was created, and the object is associated with a file, the 1115underlying file will also be closed. 1116 1117=head2 newStream([OPTS]) 1118 1119Usage is 1120 1121 $z->newStream( [OPTS] ) 1122 1123Closes the current compressed data stream and starts a new one. 1124 1125OPTS consists of any of the options that are available when creating 1126the C<$z> object. 1127 1128See the L</"Constructor Options"> section for more details. 1129 1130=head2 deflateParams 1131 1132Usage is 1133 1134 $z->deflateParams 1135 1136TODO 1137 1138=head1 Importing 1139 1140A number of symbolic constants are required by some methods in 1141C<IO::Compress::Gzip>. None are imported by default. 1142 1143=over 5 1144 1145=item :all 1146 1147Imports C<gzip>, C<$GzipError> and all symbolic 1148constants that can be used by C<IO::Compress::Gzip>. Same as doing this 1149 1150 use IO::Compress::Gzip qw(gzip $GzipError :constants) ; 1151 1152=item :constants 1153 1154Import all symbolic constants. Same as doing this 1155 1156 use IO::Compress::Gzip qw(:flush :level :strategy) ; 1157 1158=item :flush 1159 1160These symbolic constants are used by the C<flush> method. 1161 1162 Z_NO_FLUSH 1163 Z_PARTIAL_FLUSH 1164 Z_SYNC_FLUSH 1165 Z_FULL_FLUSH 1166 Z_FINISH 1167 Z_BLOCK 1168 1169=item :level 1170 1171These symbolic constants are used by the C<Level> option in the constructor. 1172 1173 Z_NO_COMPRESSION 1174 Z_BEST_SPEED 1175 Z_BEST_COMPRESSION 1176 Z_DEFAULT_COMPRESSION 1177 1178=item :strategy 1179 1180These symbolic constants are used by the C<Strategy> option in the constructor. 
1181 1182 Z_FILTERED 1183 Z_HUFFMAN_ONLY 1184 Z_RLE 1185 Z_FIXED 1186 Z_DEFAULT_STRATEGY 1187 1188 1189 1190 1191=back 1192 1193=head1 EXAMPLES 1194 1195=head2 Apache::GZip Revisited 1196 1197See L<IO::Compress::FAQ|IO::Compress::FAQ/"Apache::GZip Revisited"> 1198 1199 1200 1201=head2 Working with Net::FTP 1202 1203See L<IO::Compress::FAQ|IO::Compress::FAQ/"Compressed files and Net::FTP"> 1204 1205=head1 SEE ALSO 1206 1207L<Compress::Zlib>, L<IO::Uncompress::Gunzip>, L<IO::Compress::Deflate>, L<IO::Uncompress::Inflate>, L<IO::Compress::RawDeflate>, L<IO::Uncompress::RawInflate>, L<IO::Compress::Bzip2>, L<IO::Uncompress::Bunzip2>, L<IO::Compress::Lzma>, L<IO::Uncompress::UnLzma>, L<IO::Compress::Xz>, L<IO::Uncompress::UnXz>, L<IO::Compress::Lzop>, L<IO::Uncompress::UnLzop>, L<IO::Compress::Lzf>, L<IO::Uncompress::UnLzf>, L<IO::Uncompress::AnyInflate>, L<IO::Uncompress::AnyUncompress> 1208 1209L<Compress::Zlib::FAQ|Compress::Zlib::FAQ> 1210 1211L<File::GlobMapper|File::GlobMapper>, L<Archive::Zip|Archive::Zip>, 1212L<Archive::Tar|Archive::Tar>, 1213L<IO::Zlib|IO::Zlib> 1214 1215For RFC 1950, 1951 and 1952 see 1216F<http://www.faqs.org/rfcs/rfc1950.html>, 1217F<http://www.faqs.org/rfcs/rfc1951.html> and 1218F<http://www.faqs.org/rfcs/rfc1952.html> 1219 1220The I<zlib> compression library was written by Jean-loup Gailly 1221F<gzip@prep.ai.mit.edu> and Mark Adler F<madler@alumni.caltech.edu>. 1222 1223The primary site for the I<zlib> compression library is 1224F<http://www.zlib.org>. 1225 1226The primary site for gzip is F<http://www.gzip.org>. 1227 1228=head1 AUTHOR 1229 1230This module was written by Paul Marquess, F<pmqs@cpan.org>. 1231 1232=head1 MODIFICATION HISTORY 1233 1234See the Changes file. 1235 1236=head1 COPYRIGHT AND LICENSE 1237 1238Copyright (c) 2005-2010 Paul Marquess. All rights reserved. 1239 1240This program is free software; you can redistribute it and/or 1241modify it under the same terms as Perl itself. 1242 1243