1# 2# Data/Dumper.pm 3# 4# convert perl data structures into perl syntax suitable for both printing 5# and eval 6# 7# Documentation at the __END__ 8# 9 10package Data::Dumper; 11 12$VERSION = '2.125'; # Don't forget to set version and release date in POD! 13 14#$| = 1; 15 16use 5.006_001; 17require Exporter; 18require overload; 19 20use Carp; 21 22BEGIN { 23 @ISA = qw(Exporter); 24 @EXPORT = qw(Dumper); 25 @EXPORT_OK = qw(DumperX); 26 27 # if run under miniperl, or otherwise lacking dynamic loading, 28 # XSLoader should be attempted to load, or the pure perl flag 29 # toggled on load failure. 30 eval { 31 require XSLoader; 32 }; 33 $Useperl = 1 if $@; 34} 35 36XSLoader::load( 'Data::Dumper' ) unless $Useperl; 37 38# module vars and their defaults 39$Indent = 2 unless defined $Indent; 40$Purity = 0 unless defined $Purity; 41$Pad = "" unless defined $Pad; 42$Varname = "VAR" unless defined $Varname; 43$Useqq = 0 unless defined $Useqq; 44$Terse = 0 unless defined $Terse; 45$Freezer = "" unless defined $Freezer; 46$Toaster = "" unless defined $Toaster; 47$Deepcopy = 0 unless defined $Deepcopy; 48$Quotekeys = 1 unless defined $Quotekeys; 49$Bless = "bless" unless defined $Bless; 50#$Expdepth = 0 unless defined $Expdepth; 51$Maxdepth = 0 unless defined $Maxdepth; 52$Pair = ' => ' unless defined $Pair; 53$Useperl = 0 unless defined $Useperl; 54$Sortkeys = 0 unless defined $Sortkeys; 55$Deparse = 0 unless defined $Deparse; 56 57# 58# expects an arrayref of values to be dumped. 59# can optionally pass an arrayref of names for the values. 60# names must have leading $ sign stripped. begin the name with * 61# to cause output of arrays and hashes rather than refs. 62# 63sub new { 64 my($c, $v, $n) = @_; 65 66 croak "Usage: PACKAGE->new(ARRAYREF, [ARRAYREF])" 67 unless (defined($v) && (ref($v) eq 'ARRAY')); 68 $n = [] unless (defined($n) && (ref($n) eq 'ARRAY')); 69 70 my($s) = { 71 level => 0, # current recursive depth 72 indent => $Indent, # various styles of indenting 73 pad => $Pad, # all lines prefixed by this string 74 xpad => "", # padding-per-level 75 apad => "", # added padding for hash keys n such 76 sep => "", # list separator 77 pair => $Pair, # hash key/value separator: defaults to ' => ' 78 seen => {}, # local (nested) refs (id => [name, val]) 79 todump => $v, # values to dump [] 80 names => $n, # optional names for values [] 81 varname => $Varname, # prefix to use for tagging nameless ones 82 purity => $Purity, # degree to which output is evalable 83 useqq => $Useqq, # use "" for strings (backslashitis ensues) 84 terse => $Terse, # avoid name output (where feasible) 85 freezer => $Freezer, # name of Freezer method for objects 86 toaster => $Toaster, # name of method to revive objects 87 deepcopy => $Deepcopy, # dont cross-ref, except to stop recursion 88 quotekeys => $Quotekeys, # quote hash keys 89 'bless' => $Bless, # keyword to use for "bless" 90# expdepth => $Expdepth, # cutoff depth for explicit dumping 91 maxdepth => $Maxdepth, # depth beyond which we give up 92 useperl => $Useperl, # use the pure Perl implementation 93 sortkeys => $Sortkeys, # flag or filter for sorting hash keys 94 deparse => $Deparse, # use B::Deparse for coderefs 95 }; 96 97 if ($Indent > 0) { 98 $s->{xpad} = " "; 99 $s->{sep} = "\n"; 100 } 101 return bless($s, $c); 102} 103 104if ($] >= 5.008) { 105 # Packed numeric addresses take less memory. Plus pack is faster than sprintf 106 *init_refaddr_format = sub {}; 107 108 *format_refaddr = sub { 109 require Scalar::Util; 110 pack "J", Scalar::Util::refaddr(shift); 111 }; 112} else { 113 *init_refaddr_format = sub { 114 require Config; 115 my $f = $Config::Config{uvxformat}; 116 $f =~ tr/"//d; 117 our $refaddr_format = "0x%" . $f; 118 }; 119 120 *format_refaddr = sub { 121 require Scalar::Util; 122 sprintf our $refaddr_format, Scalar::Util::refaddr(shift); 123 } 124} 125 126# 127# add-to or query the table of already seen references 128# 129sub Seen { 130 my($s, $g) = @_; 131 if (defined($g) && (ref($g) eq 'HASH')) { 132 init_refaddr_format(); 133 my($k, $v, $id); 134 while (($k, $v) = each %$g) { 135 if (defined $v and ref $v) { 136 $id = format_refaddr($v); 137 if ($k =~ /^[*](.*)$/) { 138 $k = (ref $v eq 'ARRAY') ? ( "\\\@" . $1 ) : 139 (ref $v eq 'HASH') ? ( "\\\%" . $1 ) : 140 (ref $v eq 'CODE') ? ( "\\\&" . $1 ) : 141 ( "\$" . $1 ) ; 142 } 143 elsif ($k !~ /^\$/) { 144 $k = "\$" . $k; 145 } 146 $s->{seen}{$id} = [$k, $v]; 147 } 148 else { 149 carp "Only refs supported, ignoring non-ref item \$$k"; 150 } 151 } 152 return $s; 153 } 154 else { 155 return map { @$_ } values %{$s->{seen}}; 156 } 157} 158 159# 160# set or query the values to be dumped 161# 162sub Values { 163 my($s, $v) = @_; 164 if (defined($v) && (ref($v) eq 'ARRAY')) { 165 $s->{todump} = [@$v]; # make a copy 166 return $s; 167 } 168 else { 169 return @{$s->{todump}}; 170 } 171} 172 173# 174# set or query the names of the values to be dumped 175# 176sub Names { 177 my($s, $n) = @_; 178 if (defined($n) && (ref($n) eq 'ARRAY')) { 179 $s->{names} = [@$n]; # make a copy 180 return $s; 181 } 182 else { 183 return @{$s->{names}}; 184 } 185} 186 187sub DESTROY {} 188 189sub Dump { 190 return &Dumpxs 191 unless $Data::Dumper::Useperl || (ref($_[0]) && $_[0]->{useperl}) || 192 $Data::Dumper::Useqq || (ref($_[0]) && $_[0]->{useqq}) || 193 $Data::Dumper::Deparse || (ref($_[0]) && $_[0]->{deparse}); 194 return &Dumpperl; 195} 196 197# 198# dump the refs in the current dumper object. 199# expects same args as new() if called via package name. 200# 201sub Dumpperl { 202 my($s) = shift; 203 my(@out, $val, $name); 204 my($i) = 0; 205 local(@post); 206 init_refaddr_format(); 207 208 $s = $s->new(@_) unless ref $s; 209 210 for $val (@{$s->{todump}}) { 211 my $out = ""; 212 @post = (); 213 $name = $s->{names}[$i++]; 214 if (defined $name) { 215 if ($name =~ /^[*](.*)$/) { 216 if (defined $val) { 217 $name = (ref $val eq 'ARRAY') ? ( "\@" . $1 ) : 218 (ref $val eq 'HASH') ? ( "\%" . $1 ) : 219 (ref $val eq 'CODE') ? ( "\*" . $1 ) : 220 ( "\$" . $1 ) ; 221 } 222 else { 223 $name = "\$" . $1; 224 } 225 } 226 elsif ($name !~ /^\$/) { 227 $name = "\$" . $name; 228 } 229 } 230 else { 231 $name = "\$" . $s->{varname} . $i; 232 } 233 234 my $valstr; 235 { 236 local($s->{apad}) = $s->{apad}; 237 $s->{apad} .= ' ' x (length($name) + 3) if $s->{indent} >= 2; 238 $valstr = $s->_dump($val, $name); 239 } 240 241 $valstr = "$name = " . $valstr . ';' if @post or !$s->{terse}; 242 $out .= $s->{pad} . $valstr . $s->{sep}; 243 $out .= $s->{pad} . join(';' . $s->{sep} . $s->{pad}, @post) 244 . ';' . $s->{sep} if @post; 245 246 push @out, $out; 247 } 248 return wantarray ? @out : join('', @out); 249} 250 251# wrap string in single quotes (escaping if needed) 252sub _quote { 253 my $val = shift; 254 $val =~ s/([\\\'])/\\$1/g; 255 return "'" . $val . "'"; 256} 257 258# 259# twist, toil and turn; 260# and recurse, of course. 261# sometimes sordidly; 262# and curse if no recourse. 263# 264sub _dump { 265 my($s, $val, $name) = @_; 266 my($sname); 267 my($out, $realpack, $realtype, $type, $ipad, $id, $blesspad); 268 269 $type = ref $val; 270 $out = ""; 271 272 if ($type) { 273 274 # Call the freezer method if it's specified and the object has the 275 # method. Trap errors and warn() instead of die()ing, like the XS 276 # implementation. 277 my $freezer = $s->{freezer}; 278 if ($freezer and UNIVERSAL::can($val, $freezer)) { 279 eval { $val->$freezer() }; 280 warn "WARNING(Freezer method call failed): $@" if $@; 281 } 282 283 require Scalar::Util; 284 $realpack = Scalar::Util::blessed($val); 285 $realtype = $realpack ? Scalar::Util::reftype($val) : ref $val; 286 $id = format_refaddr($val); 287 288 # if it has a name, we need to either look it up, or keep a tab 289 # on it so we know when we hit it later 290 if (defined($name) and length($name)) { 291 # keep a tab on it so that we dont fall into recursive pit 292 if (exists $s->{seen}{$id}) { 293# if ($s->{expdepth} < $s->{level}) { 294 if ($s->{purity} and $s->{level} > 0) { 295 $out = ($realtype eq 'HASH') ? '{}' : 296 ($realtype eq 'ARRAY') ? '[]' : 297 'do{my $o}' ; 298 push @post, $name . " = " . $s->{seen}{$id}[0]; 299 } 300 else { 301 $out = $s->{seen}{$id}[0]; 302 if ($name =~ /^([\@\%])/) { 303 my $start = $1; 304 if ($out =~ /^\\$start/) { 305 $out = substr($out, 1); 306 } 307 else { 308 $out = $start . '{' . $out . '}'; 309 } 310 } 311 } 312 return $out; 313# } 314 } 315 else { 316 # store our name 317 $s->{seen}{$id} = [ (($name =~ /^[@%]/) ? ('\\' . $name ) : 318 ($realtype eq 'CODE' and 319 $name =~ /^[*](.*)$/) ? ('\\&' . $1 ) : 320 $name ), 321 $val ]; 322 } 323 } 324 my $no_bless = 0; 325 my $is_regex = 0; 326 if ( $realpack and ($] >= 5.009005 ? re::is_regexp($val) : $realpack eq 'Regexp') ) { 327 $is_regex = 1; 328 $no_bless = $realpack eq 'Regexp'; 329 } 330 331 # If purity is not set and maxdepth is set, then check depth: 332 # if we have reached maximum depth, return the string 333 # representation of the thing we are currently examining 334 # at this depth (i.e., 'Foo=ARRAY(0xdeadbeef)'). 335 if (!$s->{purity} 336 and $s->{maxdepth} > 0 337 and $s->{level} >= $s->{maxdepth}) 338 { 339 return qq['$val']; 340 } 341 342 # we have a blessed ref 343 if ($realpack and !$no_bless) { 344 $out = $s->{'bless'} . '( '; 345 $blesspad = $s->{apad}; 346 $s->{apad} .= ' ' if ($s->{indent} >= 2); 347 } 348 349 $s->{level}++; 350 $ipad = $s->{xpad} x $s->{level}; 351 352 if ($is_regex) { 353 my $pat; 354 # This really sucks, re:regexp_pattern is in ext/re/re.xs and not in 355 # universal.c, and even worse we cant just require that re to be loaded 356 # we *have* to use() it. 357 # We should probably move it to universal.c for 5.10.1 and fix this. 358 # Currently we only use re::regexp_pattern when the re is blessed into another 359 # package. This has the disadvantage of meaning that a DD dump won't round trip 360 # as the pattern will be repeatedly wrapped with the same modifiers. 361 # This is an aesthetic issue so we will leave it for now, but we could use 362 # regexp_pattern() in list context to get the modifiers separately. 363 # But since this means loading the full debugging engine in process we wont 364 # bother unless its necessary for accuracy. 365 if (($realpack ne 'Regexp') && defined(*re::regexp_pattern{CODE})) { 366 $pat = re::regexp_pattern($val); 367 } else { 368 $pat = "$val"; 369 } 370 $pat =~ s,/,\\/,g; 371 $out .= "qr/$pat/"; 372 } 373 elsif ($realtype eq 'SCALAR' || $realtype eq 'REF') { 374 if ($realpack) { 375 $out .= 'do{\\(my $o = ' . $s->_dump($$val, "\${$name}") . ')}'; 376 } 377 else { 378 $out .= '\\' . $s->_dump($$val, "\${$name}"); 379 } 380 } 381 elsif ($realtype eq 'GLOB') { 382 $out .= '\\' . $s->_dump($$val, "*{$name}"); 383 } 384 elsif ($realtype eq 'ARRAY') { 385 my($pad, $mname); 386 my($i) = 0; 387 $out .= ($name =~ /^\@/) ? '(' : '['; 388 $pad = $s->{sep} . $s->{pad} . $s->{apad}; 389 ($name =~ /^\@(.*)$/) ? ($mname = "\$" . $1) : 390 # omit -> if $foo->[0]->{bar}, but not ${$foo->[0]}->{bar} 391 ($name =~ /^\\?[\%\@\*\$][^{].*[]}]$/) ? ($mname = $name) : 392 ($mname = $name . '->'); 393 $mname .= '->' if $mname =~ /^\*.+\{[A-Z]+\}$/; 394 for my $v (@$val) { 395 $sname = $mname . '[' . $i . ']'; 396 $out .= $pad . $ipad . '#' . $i if $s->{indent} >= 3; 397 $out .= $pad . $ipad . $s->_dump($v, $sname); 398 $out .= "," if $i++ < $#$val; 399 } 400 $out .= $pad . ($s->{xpad} x ($s->{level} - 1)) if $i; 401 $out .= ($name =~ /^\@/) ? ')' : ']'; 402 } 403 elsif ($realtype eq 'HASH') { 404 my($k, $v, $pad, $lpad, $mname, $pair); 405 $out .= ($name =~ /^\%/) ? '(' : '{'; 406 $pad = $s->{sep} . $s->{pad} . $s->{apad}; 407 $lpad = $s->{apad}; 408 $pair = $s->{pair}; 409 ($name =~ /^\%(.*)$/) ? ($mname = "\$" . $1) : 410 # omit -> if $foo->[0]->{bar}, but not ${$foo->[0]}->{bar} 411 ($name =~ /^\\?[\%\@\*\$][^{].*[]}]$/) ? ($mname = $name) : 412 ($mname = $name . '->'); 413 $mname .= '->' if $mname =~ /^\*.+\{[A-Z]+\}$/; 414 my ($sortkeys, $keys, $key) = ("$s->{sortkeys}"); 415 if ($sortkeys) { 416 if (ref($s->{sortkeys}) eq 'CODE') { 417 $keys = $s->{sortkeys}($val); 418 unless (ref($keys) eq 'ARRAY') { 419 carp "Sortkeys subroutine did not return ARRAYREF"; 420 $keys = []; 421 } 422 } 423 else { 424 $keys = [ sort keys %$val ]; 425 } 426 } 427 428 # Ensure hash iterator is reset 429 keys(%$val); 430 431 while (($k, $v) = ! $sortkeys ? (each %$val) : 432 @$keys ? ($key = shift(@$keys), $val->{$key}) : 433 () ) 434 { 435 my $nk = $s->_dump($k, ""); 436 $nk = $1 if !$s->{quotekeys} and $nk =~ /^[\"\']([A-Za-z_]\w*)[\"\']$/; 437 $sname = $mname . '{' . $nk . '}'; 438 $out .= $pad . $ipad . $nk . $pair; 439 440 # temporarily alter apad 441 $s->{apad} .= (" " x (length($nk) + 4)) if $s->{indent} >= 2; 442 $out .= $s->_dump($val->{$k}, $sname) . ","; 443 $s->{apad} = $lpad if $s->{indent} >= 2; 444 } 445 if (substr($out, -1) eq ',') { 446 chop $out; 447 $out .= $pad . ($s->{xpad} x ($s->{level} - 1)); 448 } 449 $out .= ($name =~ /^\%/) ? ')' : '}'; 450 } 451 elsif ($realtype eq 'CODE') { 452 if ($s->{deparse}) { 453 require B::Deparse; 454 my $sub = 'sub ' . (B::Deparse->new)->coderef2text($val); 455 $pad = $s->{sep} . $s->{pad} . $s->{apad} . $s->{xpad} x ($s->{level} - 1); 456 $sub =~ s/\n/$pad/gse; 457 $out .= $sub; 458 } else { 459 $out .= 'sub { "DUMMY" }'; 460 carp "Encountered CODE ref, using dummy placeholder" if $s->{purity}; 461 } 462 } 463 else { 464 croak "Can\'t handle $realtype type."; 465 } 466 467 if ($realpack and !$no_bless) { # we have a blessed ref 468 $out .= ', ' . _quote($realpack) . ' )'; 469 $out .= '->' . $s->{toaster} . '()' if $s->{toaster} ne ''; 470 $s->{apad} = $blesspad; 471 } 472 $s->{level}--; 473 474 } 475 else { # simple scalar 476 477 my $ref = \$_[1]; 478 # first, catalog the scalar 479 if ($name ne '') { 480 $id = format_refaddr($ref); 481 if (exists $s->{seen}{$id}) { 482 if ($s->{seen}{$id}[2]) { 483 $out = $s->{seen}{$id}[0]; 484 #warn "[<$out]\n"; 485 return "\${$out}"; 486 } 487 } 488 else { 489 #warn "[>\\$name]\n"; 490 $s->{seen}{$id} = ["\\$name", $ref]; 491 } 492 } 493 if (ref($ref) eq 'GLOB' or "$ref" =~ /=GLOB\([^()]+\)$/) { # glob 494 my $name = substr($val, 1); 495 if ($name =~ /^[A-Za-z_][\w:]*$/) { 496 $name =~ s/^main::/::/; 497 $sname = $name; 498 } 499 else { 500 $sname = $s->_dump($name, ""); 501 $sname = '{' . $sname . '}'; 502 } 503 if ($s->{purity}) { 504 my $k; 505 local ($s->{level}) = 0; 506 for $k (qw(SCALAR ARRAY HASH)) { 507 my $gval = *$val{$k}; 508 next unless defined $gval; 509 next if $k eq "SCALAR" && ! defined $$gval; # always there 510 511 # _dump can push into @post, so we hold our place using $postlen 512 my $postlen = scalar @post; 513 $post[$postlen] = "\*$sname = "; 514 local ($s->{apad}) = " " x length($post[$postlen]) if $s->{indent} >= 2; 515 $post[$postlen] .= $s->_dump($gval, "\*$sname\{$k\}"); 516 } 517 } 518 $out .= '*' . $sname; 519 } 520 elsif (!defined($val)) { 521 $out .= "undef"; 522 } 523 elsif ($val =~ /^(?:0|-?[1-9]\d{0,8})\z/) { # safe decimal number 524 $out .= $val; 525 } 526 else { # string 527 if ($s->{useqq} or $val =~ tr/\0-\377//c) { 528 # Fall back to qq if there's Unicode 529 $out .= qquote($val, $s->{useqq}); 530 } 531 else { 532 $out .= _quote($val); 533 } 534 } 535 } 536 if ($id) { 537 # if we made it this far, $id was added to seen list at current 538 # level, so remove it to get deep copies 539 if ($s->{deepcopy}) { 540 delete($s->{seen}{$id}); 541 } 542 elsif ($name) { 543 $s->{seen}{$id}[2] = 1; 544 } 545 } 546 return $out; 547} 548 549# 550# non-OO style of earlier version 551# 552sub Dumper { 553 return Data::Dumper->Dump([@_]); 554} 555 556# compat stub 557sub DumperX { 558 return Data::Dumper->Dumpxs([@_], []); 559} 560 561sub Dumpf { return Data::Dumper->Dump(@_) } 562 563sub Dumpp { print Data::Dumper->Dump(@_) } 564 565# 566# reset the "seen" cache 567# 568sub Reset { 569 my($s) = shift; 570 $s->{seen} = {}; 571 return $s; 572} 573 574sub Indent { 575 my($s, $v) = @_; 576 if (defined($v)) { 577 if ($v == 0) { 578 $s->{xpad} = ""; 579 $s->{sep} = ""; 580 } 581 else { 582 $s->{xpad} = " "; 583 $s->{sep} = "\n"; 584 } 585 $s->{indent} = $v; 586 return $s; 587 } 588 else { 589 return $s->{indent}; 590 } 591} 592 593sub Pair { 594 my($s, $v) = @_; 595 defined($v) ? (($s->{pair} = $v), return $s) : $s->{pair}; 596} 597 598sub Pad { 599 my($s, $v) = @_; 600 defined($v) ? (($s->{pad} = $v), return $s) : $s->{pad}; 601} 602 603sub Varname { 604 my($s, $v) = @_; 605 defined($v) ? (($s->{varname} = $v), return $s) : $s->{varname}; 606} 607 608sub Purity { 609 my($s, $v) = @_; 610 defined($v) ? (($s->{purity} = $v), return $s) : $s->{purity}; 611} 612 613sub Useqq { 614 my($s, $v) = @_; 615 defined($v) ? (($s->{useqq} = $v), return $s) : $s->{useqq}; 616} 617 618sub Terse { 619 my($s, $v) = @_; 620 defined($v) ? (($s->{terse} = $v), return $s) : $s->{terse}; 621} 622 623sub Freezer { 624 my($s, $v) = @_; 625 defined($v) ? (($s->{freezer} = $v), return $s) : $s->{freezer}; 626} 627 628sub Toaster { 629 my($s, $v) = @_; 630 defined($v) ? (($s->{toaster} = $v), return $s) : $s->{toaster}; 631} 632 633sub Deepcopy { 634 my($s, $v) = @_; 635 defined($v) ? (($s->{deepcopy} = $v), return $s) : $s->{deepcopy}; 636} 637 638sub Quotekeys { 639 my($s, $v) = @_; 640 defined($v) ? (($s->{quotekeys} = $v), return $s) : $s->{quotekeys}; 641} 642 643sub Bless { 644 my($s, $v) = @_; 645 defined($v) ? (($s->{'bless'} = $v), return $s) : $s->{'bless'}; 646} 647 648sub Maxdepth { 649 my($s, $v) = @_; 650 defined($v) ? (($s->{'maxdepth'} = $v), return $s) : $s->{'maxdepth'}; 651} 652 653sub Useperl { 654 my($s, $v) = @_; 655 defined($v) ? (($s->{'useperl'} = $v), return $s) : $s->{'useperl'}; 656} 657 658sub Sortkeys { 659 my($s, $v) = @_; 660 defined($v) ? (($s->{'sortkeys'} = $v), return $s) : $s->{'sortkeys'}; 661} 662 663sub Deparse { 664 my($s, $v) = @_; 665 defined($v) ? (($s->{'deparse'} = $v), return $s) : $s->{'deparse'}; 666} 667 668# used by qquote below 669my %esc = ( 670 "\a" => "\\a", 671 "\b" => "\\b", 672 "\t" => "\\t", 673 "\n" => "\\n", 674 "\f" => "\\f", 675 "\r" => "\\r", 676 "\e" => "\\e", 677); 678 679# put a string value in double quotes 680sub qquote { 681 local($_) = shift; 682 s/([\\\"\@\$])/\\$1/g; 683 my $bytes; { use bytes; $bytes = length } 684 s/([^\x00-\x7f])/'\x{'.sprintf("%x",ord($1)).'}'/ge if $bytes > length; 685 return qq("$_") unless 686 /[^ !"\#\$%&'()*+,\-.\/0-9:;<=>?\@A-Z[\\\]^_`a-z{|}~]/; # fast exit 687 688 my $high = shift || ""; 689 s/([\a\b\t\n\f\r\e])/$esc{$1}/g; 690 691 if (ord('^')==94) { # ascii 692 # no need for 3 digits in escape for these 693 s/([\0-\037])(?!\d)/'\\'.sprintf('%o',ord($1))/eg; 694 s/([\0-\037\177])/'\\'.sprintf('%03o',ord($1))/eg; 695 # all but last branch below not supported --BEHAVIOR SUBJECT TO CHANGE-- 696 if ($high eq "iso8859") { 697 s/([\200-\240])/'\\'.sprintf('%o',ord($1))/eg; 698 } elsif ($high eq "utf8") { 699# use utf8; 700# $str =~ s/([^\040-\176])/sprintf "\\x{%04x}", ord($1)/ge; 701 } elsif ($high eq "8bit") { 702 # leave it as it is 703 } else { 704 s/([\200-\377])/'\\'.sprintf('%03o',ord($1))/eg; 705 s/([^\040-\176])/sprintf "\\x{%04x}", ord($1)/ge; 706 } 707 } 708 else { # ebcdic 709 s{([^ !"\#\$%&'()*+,\-.\/0-9:;<=>?\@A-Z[\\\]^_`a-z{|}~])(?!\d)} 710 {my $v = ord($1); '\\'.sprintf(($v <= 037 ? '%o' : '%03o'), $v)}eg; 711 s{([^ !"\#\$%&'()*+,\-.\/0-9:;<=>?\@A-Z[\\\]^_`a-z{|}~])} 712 {'\\'.sprintf('%03o',ord($1))}eg; 713 } 714 715 return qq("$_"); 716} 717 718# helper sub to sort hash keys in Perl < 5.8.0 where we don't have 719# access to sortsv() from XS 720sub _sortkeys { [ sort keys %{$_[0]} ] } 721 7221; 723__END__ 724 725=head1 NAME 726 727Data::Dumper - stringified perl data structures, suitable for both printing and C<eval> 728 729=head1 SYNOPSIS 730 731 use Data::Dumper; 732 733 # simple procedural interface 734 print Dumper($foo, $bar); 735 736 # extended usage with names 737 print Data::Dumper->Dump([$foo, $bar], [qw(foo *ary)]); 738 739 # configuration variables 740 { 741 local $Data::Dumper::Purity = 1; 742 eval Data::Dumper->Dump([$foo, $bar], [qw(foo *ary)]); 743 } 744 745 # OO usage 746 $d = Data::Dumper->new([$foo, $bar], [qw(foo *ary)]); 747 ... 748 print $d->Dump; 749 ... 750 $d->Purity(1)->Terse(1)->Deepcopy(1); 751 eval $d->Dump; 752 753 754=head1 DESCRIPTION 755 756Given a list of scalars or reference variables, writes out their contents in 757perl syntax. The references can also be objects. The content of each 758variable is output in a single Perl statement. Handles self-referential 759structures correctly. 760 761The return value can be C<eval>ed to get back an identical copy of the 762original reference structure. 763 764Any references that are the same as one of those passed in will be named 765C<$VAR>I<n> (where I<n> is a numeric suffix), and other duplicate references 766to substructures within C<$VAR>I<n> will be appropriately labeled using arrow 767notation. You can specify names for individual values to be dumped if you 768use the C<Dump()> method, or you can change the default C<$VAR> prefix to 769something else. See C<$Data::Dumper::Varname> and C<$Data::Dumper::Terse> 770below. 771 772The default output of self-referential structures can be C<eval>ed, but the 773nested references to C<$VAR>I<n> will be undefined, since a recursive 774structure cannot be constructed using one Perl statement. You should set the 775C<Purity> flag to 1 to get additional statements that will correctly fill in 776these references. Moreover, if C<eval>ed when strictures are in effect, 777you need to ensure that any variables it accesses are previously declared. 778 779In the extended usage form, the references to be dumped can be given 780user-specified names. If a name begins with a C<*>, the output will 781describe the dereferenced type of the supplied reference for hashes and 782arrays, and coderefs. Output of names will be avoided where possible if 783the C<Terse> flag is set. 784 785In many cases, methods that are used to set the internal state of the 786object will return the object itself, so method calls can be conveniently 787chained together. 788 789Several styles of output are possible, all controlled by setting 790the C<Indent> flag. See L<Configuration Variables or Methods> below 791for details. 792 793 794=head2 Methods 795 796=over 4 797 798=item I<PACKAGE>->new(I<ARRAYREF [>, I<ARRAYREF]>) 799 800Returns a newly created C<Data::Dumper> object. The first argument is an 801anonymous array of values to be dumped. The optional second argument is an 802anonymous array of names for the values. The names need not have a leading 803C<$> sign, and must be comprised of alphanumeric characters. You can begin 804a name with a C<*> to specify that the dereferenced type must be dumped 805instead of the reference itself, for ARRAY and HASH references. 806 807The prefix specified by C<$Data::Dumper::Varname> will be used with a 808numeric suffix if the name for a value is undefined. 809 810Data::Dumper will catalog all references encountered while dumping the 811values. Cross-references (in the form of names of substructures in perl 812syntax) will be inserted at all possible points, preserving any structural 813interdependencies in the original set of values. Structure traversal is 814depth-first, and proceeds in order from the first supplied value to 815the last. 816 817=item I<$OBJ>->Dump I<or> I<PACKAGE>->Dump(I<ARRAYREF [>, I<ARRAYREF]>) 818 819Returns the stringified form of the values stored in the object (preserving 820the order in which they were supplied to C<new>), subject to the 821configuration options below. In a list context, it returns a list 822of strings corresponding to the supplied values. 823 824The second form, for convenience, simply calls the C<new> method on its 825arguments before dumping the object immediately. 826 827=item I<$OBJ>->Seen(I<[HASHREF]>) 828 829Queries or adds to the internal table of already encountered references. 830You must use C<Reset> to explicitly clear the table if needed. Such 831references are not dumped; instead, their names are inserted wherever they 832are encountered subsequently. This is useful especially for properly 833dumping subroutine references. 834 835Expects an anonymous hash of name => value pairs. Same rules apply for names 836as in C<new>. If no argument is supplied, will return the "seen" list of 837name => value pairs, in a list context. Otherwise, returns the object 838itself. 839 840=item I<$OBJ>->Values(I<[ARRAYREF]>) 841 842Queries or replaces the internal array of values that will be dumped. 843When called without arguments, returns the values. Otherwise, returns the 844object itself. 845 846=item I<$OBJ>->Names(I<[ARRAYREF]>) 847 848Queries or replaces the internal array of user supplied names for the values 849that will be dumped. When called without arguments, returns the names. 850Otherwise, returns the object itself. 851 852=item I<$OBJ>->Reset 853 854Clears the internal table of "seen" references and returns the object 855itself. 856 857=back 858 859=head2 Functions 860 861=over 4 862 863=item Dumper(I<LIST>) 864 865Returns the stringified form of the values in the list, subject to the 866configuration options below. The values will be named C<$VAR>I<n> in the 867output, where I<n> is a numeric suffix. Will return a list of strings 868in a list context. 869 870=back 871 872=head2 Configuration Variables or Methods 873 874Several configuration variables can be used to control the kind of output 875generated when using the procedural interface. These variables are usually 876C<local>ized in a block so that other parts of the code are not affected by 877the change. 878 879These variables determine the default state of the object created by calling 880the C<new> method, but cannot be used to alter the state of the object 881thereafter. The equivalent method names should be used instead to query 882or set the internal state of the object. 883 884The method forms return the object itself when called with arguments, 885so that they can be chained together nicely. 886 887=over 4 888 889=item * 890 891$Data::Dumper::Indent I<or> I<$OBJ>->Indent(I<[NEWVAL]>) 892 893Controls the style of indentation. It can be set to 0, 1, 2 or 3. Style 0 894spews output without any newlines, indentation, or spaces between list 895items. It is the most compact format possible that can still be called 896valid perl. Style 1 outputs a readable form with newlines but no fancy 897indentation (each level in the structure is simply indented by a fixed 898amount of whitespace). Style 2 (the default) outputs a very readable form 899which takes into account the length of hash keys (so the hash value lines 900up). Style 3 is like style 2, but also annotates the elements of arrays 901with their index (but the comment is on its own line, so array output 902consumes twice the number of lines). Style 2 is the default. 903 904=item * 905 906$Data::Dumper::Purity I<or> I<$OBJ>->Purity(I<[NEWVAL]>) 907 908Controls the degree to which the output can be C<eval>ed to recreate the 909supplied reference structures. Setting it to 1 will output additional perl 910statements that will correctly recreate nested references. The default is 9110. 912 913=item * 914 915$Data::Dumper::Pad I<or> I<$OBJ>->Pad(I<[NEWVAL]>) 916 917Specifies the string that will be prefixed to every line of the output. 918Empty string by default. 919 920=item * 921 922$Data::Dumper::Varname I<or> I<$OBJ>->Varname(I<[NEWVAL]>) 923 924Contains the prefix to use for tagging variable names in the output. The 925default is "VAR". 926 927=item * 928 929$Data::Dumper::Useqq I<or> I<$OBJ>->Useqq(I<[NEWVAL]>) 930 931When set, enables the use of double quotes for representing string values. 932Whitespace other than space will be represented as C<[\n\t\r]>, "unsafe" 933characters will be backslashed, and unprintable characters will be output as 934quoted octal integers. Since setting this variable imposes a performance 935penalty, the default is 0. C<Dump()> will run slower if this flag is set, 936since the fast XSUB implementation doesn't support it yet. 937 938=item * 939 940$Data::Dumper::Terse I<or> I<$OBJ>->Terse(I<[NEWVAL]>) 941 942When set, Data::Dumper will emit single, non-self-referential values as 943atoms/terms rather than statements. This means that the C<$VAR>I<n> names 944will be avoided where possible, but be advised that such output may not 945always be parseable by C<eval>. 946 947=item * 948 949$Data::Dumper::Freezer I<or> $I<OBJ>->Freezer(I<[NEWVAL]>) 950 951Can be set to a method name, or to an empty string to disable the feature. 952Data::Dumper will invoke that method via the object before attempting to 953stringify it. This method can alter the contents of the object (if, for 954instance, it contains data allocated from C), and even rebless it in a 955different package. The client is responsible for making sure the specified 956method can be called via the object, and that the object ends up containing 957only perl data types after the method has been called. Defaults to an empty 958string. 959 960If an object does not support the method specified (determined using 961UNIVERSAL::can()) then the call will be skipped. If the method dies a 962warning will be generated. 963 964=item * 965 966$Data::Dumper::Toaster I<or> $I<OBJ>->Toaster(I<[NEWVAL]>) 967 968Can be set to a method name, or to an empty string to disable the feature. 969Data::Dumper will emit a method call for any objects that are to be dumped 970using the syntax C<bless(DATA, CLASS)-E<gt>METHOD()>. Note that this means that 971the method specified will have to perform any modifications required on the 972object (like creating new state within it, and/or reblessing it in a 973different package) and then return it. The client is responsible for making 974sure the method can be called via the object, and that it returns a valid 975object. Defaults to an empty string. 976 977=item * 978 979$Data::Dumper::Deepcopy I<or> $I<OBJ>->Deepcopy(I<[NEWVAL]>) 980 981Can be set to a boolean value to enable deep copies of structures. 982Cross-referencing will then only be done when absolutely essential 983(i.e., to break reference cycles). Default is 0. 984 985=item * 986 987$Data::Dumper::Quotekeys I<or> $I<OBJ>->Quotekeys(I<[NEWVAL]>) 988 989Can be set to a boolean value to control whether hash keys are quoted. 990A false value will avoid quoting hash keys when it looks like a simple 991string. Default is 1, which will always enclose hash keys in quotes. 992 993=item * 994 995$Data::Dumper::Bless I<or> $I<OBJ>->Bless(I<[NEWVAL]>) 996 997Can be set to a string that specifies an alternative to the C<bless> 998builtin operator used to create objects. A function with the specified 999name should exist, and should accept the same arguments as the builtin. 1000Default is C<bless>. 1001 1002=item * 1003 1004$Data::Dumper::Pair I<or> $I<OBJ>->Pair(I<[NEWVAL]>) 1005 1006Can be set to a string that specifies the separator between hash keys 1007and values. To dump nested hash, array and scalar values to JavaScript, 1008use: C<$Data::Dumper::Pair = ' : ';>. Implementing C<bless> in JavaScript 1009is left as an exercise for the reader. 1010A function with the specified name exists, and accepts the same arguments 1011as the builtin. 1012 1013Default is: C< =E<gt> >. 1014 1015=item * 1016 1017$Data::Dumper::Maxdepth I<or> $I<OBJ>->Maxdepth(I<[NEWVAL]>) 1018 1019Can be set to a positive integer that specifies the depth beyond which 1020we don't venture into a structure. Has no effect when 1021C<Data::Dumper::Purity> is set. (Useful in debugger when we often don't 1022want to see more than enough). Default is 0, which means there is 1023no maximum depth. 1024 1025=item * 1026 1027$Data::Dumper::Useperl I<or> $I<OBJ>->Useperl(I<[NEWVAL]>) 1028 1029Can be set to a boolean value which controls whether the pure Perl 1030implementation of C<Data::Dumper> is used. The C<Data::Dumper> module is 1031a dual implementation, with almost all functionality written in both 1032pure Perl and also in XS ('C'). Since the XS version is much faster, it 1033will always be used if possible. This option lets you override the 1034default behavior, usually for testing purposes only. Default is 0, which 1035means the XS implementation will be used if possible. 1036 1037=item * 1038 1039$Data::Dumper::Sortkeys I<or> $I<OBJ>->Sortkeys(I<[NEWVAL]>) 1040 1041Can be set to a boolean value to control whether hash keys are dumped in 1042sorted order. A true value will cause the keys of all hashes to be 1043dumped in Perl's default sort order. Can also be set to a subroutine 1044reference which will be called for each hash that is dumped. In this 1045case C<Data::Dumper> will call the subroutine once for each hash, 1046passing it the reference of the hash. The purpose of the subroutine is 1047to return a reference to an array of the keys that will be dumped, in 1048the order that they should be dumped. Using this feature, you can 1049control both the order of the keys, and which keys are actually used. In 1050other words, this subroutine acts as a filter by which you can exclude 1051certain keys from being dumped. Default is 0, which means that hash keys 1052are not sorted. 1053 1054=item * 1055 1056$Data::Dumper::Deparse I<or> $I<OBJ>->Deparse(I<[NEWVAL]>) 1057 1058Can be set to a boolean value to control whether code references are 1059turned into perl source code. If set to a true value, C<B::Deparse> 1060will be used to get the source of the code reference. Using this option 1061will force using the Perl implementation of the dumper, since the fast 1062XSUB implementation doesn't support it. 1063 1064Caution : use this option only if you know that your coderefs will be 1065properly reconstructed by C<B::Deparse>. 1066 1067=back 1068 1069=head2 Exports 1070 1071=over 4 1072 1073=item Dumper 1074 1075=back 1076 1077=head1 EXAMPLES 1078 1079Run these code snippets to get a quick feel for the behavior of this 1080module. When you are through with these examples, you may want to 1081add or change the various configuration variables described above, 1082to see their behavior. (See the testsuite in the Data::Dumper 1083distribution for more examples.) 1084 1085 1086 use Data::Dumper; 1087 1088 package Foo; 1089 sub new {bless {'a' => 1, 'b' => sub { return "foo" }}, $_[0]}; 1090 1091 package Fuz; # a weird REF-REF-SCALAR object 1092 sub new {bless \($_ = \ 'fu\'z'), $_[0]}; 1093 1094 package main; 1095 $foo = Foo->new; 1096 $fuz = Fuz->new; 1097 $boo = [ 1, [], "abcd", \*foo, 1098 {1 => 'a', 023 => 'b', 0x45 => 'c'}, 1099 \\"p\q\'r", $foo, $fuz]; 1100 1101 ######## 1102 # simple usage 1103 ######## 1104 1105 $bar = eval(Dumper($boo)); 1106 print($@) if $@; 1107 print Dumper($boo), Dumper($bar); # pretty print (no array indices) 1108 1109 $Data::Dumper::Terse = 1; # don't output names where feasible 1110 $Data::Dumper::Indent = 0; # turn off all pretty print 1111 print Dumper($boo), "\n"; 1112 1113 $Data::Dumper::Indent = 1; # mild pretty print 1114 print Dumper($boo); 1115 1116 $Data::Dumper::Indent = 3; # pretty print with array indices 1117 print Dumper($boo); 1118 1119 $Data::Dumper::Useqq = 1; # print strings in double quotes 1120 print Dumper($boo); 1121 1122 $Data::Dumper::Pair = " : "; # specify hash key/value separator 1123 print Dumper($boo); 1124 1125 1126 ######## 1127 # recursive structures 1128 ######## 1129 1130 @c = ('c'); 1131 $c = \@c; 1132 $b = {}; 1133 $a = [1, $b, $c]; 1134 $b->{a} = $a; 1135 $b->{b} = $a->[1]; 1136 $b->{c} = $a->[2]; 1137 print Data::Dumper->Dump([$a,$b,$c], [qw(a b c)]); 1138 1139 1140 $Data::Dumper::Purity = 1; # fill in the holes for eval 1141 print Data::Dumper->Dump([$a, $b], [qw(*a b)]); # print as @a 1142 print Data::Dumper->Dump([$b, $a], [qw(*b a)]); # print as %b 1143 1144 1145 $Data::Dumper::Deepcopy = 1; # avoid cross-refs 1146 print Data::Dumper->Dump([$b, $a], [qw(*b a)]); 1147 1148 1149 $Data::Dumper::Purity = 0; # avoid cross-refs 1150 print Data::Dumper->Dump([$b, $a], [qw(*b a)]); 1151 1152 ######## 1153 # deep structures 1154 ######## 1155 1156 $a = "pearl"; 1157 $b = [ $a ]; 1158 $c = { 'b' => $b }; 1159 $d = [ $c ]; 1160 $e = { 'd' => $d }; 1161 $f = { 'e' => $e }; 1162 print Data::Dumper->Dump([$f], [qw(f)]); 1163 1164 $Data::Dumper::Maxdepth = 3; # no deeper than 3 refs down 1165 print Data::Dumper->Dump([$f], [qw(f)]); 1166 1167 1168 ######## 1169 # object-oriented usage 1170 ######## 1171 1172 $d = Data::Dumper->new([$a,$b], [qw(a b)]); 1173 $d->Seen({'*c' => $c}); # stash a ref without printing it 1174 $d->Indent(3); 1175 print $d->Dump; 1176 $d->Reset->Purity(0); # empty the seen cache 1177 print join "----\n", $d->Dump; 1178 1179 1180 ######## 1181 # persistence 1182 ######## 1183 1184 package Foo; 1185 sub new { bless { state => 'awake' }, shift } 1186 sub Freeze { 1187 my $s = shift; 1188 print STDERR "preparing to sleep\n"; 1189 $s->{state} = 'asleep'; 1190 return bless $s, 'Foo::ZZZ'; 1191 } 1192 1193 package Foo::ZZZ; 1194 sub Thaw { 1195 my $s = shift; 1196 print STDERR "waking up\n"; 1197 $s->{state} = 'awake'; 1198 return bless $s, 'Foo'; 1199 } 1200 1201 package Foo; 1202 use Data::Dumper; 1203 $a = Foo->new; 1204 $b = Data::Dumper->new([$a], ['c']); 1205 $b->Freezer('Freeze'); 1206 $b->Toaster('Thaw'); 1207 $c = $b->Dump; 1208 print $c; 1209 $d = eval $c; 1210 print Data::Dumper->Dump([$d], ['d']); 1211 1212 1213 ######## 1214 # symbol substitution (useful for recreating CODE refs) 1215 ######## 1216 1217 sub foo { print "foo speaking\n" } 1218 *other = \&foo; 1219 $bar = [ \&other ]; 1220 $d = Data::Dumper->new([\&other,$bar],['*other','bar']); 1221 $d->Seen({ '*foo' => \&foo }); 1222 print $d->Dump; 1223 1224 1225 ######## 1226 # sorting and filtering hash keys 1227 ######## 1228 1229 $Data::Dumper::Sortkeys = \&my_filter; 1230 my $foo = { map { (ord, "$_$_$_") } 'I'..'Q' }; 1231 my $bar = { %$foo }; 1232 my $baz = { reverse %$foo }; 1233 print Dumper [ $foo, $bar, $baz ]; 1234 1235 sub my_filter { 1236 my ($hash) = @_; 1237 # return an array ref containing the hash keys to dump 1238 # in the order that you want them to be dumped 1239 return [ 1240 # Sort the keys of %$foo in reverse numeric order 1241 $hash eq $foo ? (sort {$b <=> $a} keys %$hash) : 1242 # Only dump the odd number keys of %$bar 1243 $hash eq $bar ? (grep {$_ % 2} keys %$hash) : 1244 # Sort keys in default order for all other hashes 1245 (sort keys %$hash) 1246 ]; 1247 } 1248 1249=head1 BUGS 1250 1251Due to limitations of Perl subroutine call semantics, you cannot pass an 1252array or hash. Prepend it with a C<\> to pass its reference instead. This 1253will be remedied in time, now that Perl has subroutine prototypes. 1254For now, you need to use the extended usage form, and prepend the 1255name with a C<*> to output it as a hash or array. 1256 1257C<Data::Dumper> cheats with CODE references. If a code reference is 1258encountered in the structure being processed (and if you haven't set 1259the C<Deparse> flag), an anonymous subroutine that 1260contains the string '"DUMMY"' will be inserted in its place, and a warning 1261will be printed if C<Purity> is set. You can C<eval> the result, but bear 1262in mind that the anonymous sub that gets created is just a placeholder. 1263Someday, perl will have a switch to cache-on-demand the string 1264representation of a compiled piece of code, I hope. If you have prior 1265knowledge of all the code refs that your data structures are likely 1266to have, you can use the C<Seen> method to pre-seed the internal reference 1267table and make the dumped output point to them, instead. See L</EXAMPLES> 1268above. 1269 1270The C<Useqq> and C<Deparse> flags makes Dump() run slower, since the 1271XSUB implementation does not support them. 1272 1273SCALAR objects have the weirdest looking C<bless> workaround. 1274 1275Pure Perl version of C<Data::Dumper> escapes UTF-8 strings correctly 1276only in Perl 5.8.0 and later. 1277 1278=head2 NOTE 1279 1280Starting from Perl 5.8.1 different runs of Perl will have different 1281ordering of hash keys. The change was done for greater security, 1282see L<perlsec/"Algorithmic Complexity Attacks">. This means that 1283different runs of Perl will have different Data::Dumper outputs if 1284the data contains hashes. If you need to have identical Data::Dumper 1285outputs from different runs of Perl, use the environment variable 1286PERL_HASH_SEED, see L<perlrun/PERL_HASH_SEED>. Using this restores 1287the old (platform-specific) ordering: an even prettier solution might 1288be to use the C<Sortkeys> filter of Data::Dumper. 1289 1290=head1 AUTHOR 1291 1292Gurusamy Sarathy gsar@activestate.com 1293 1294Copyright (c) 1996-98 Gurusamy Sarathy. All rights reserved. 1295This program is free software; you can redistribute it and/or 1296modify it under the same terms as Perl itself. 1297 1298=head1 VERSION 1299 1300Version 2.125 (Aug 8 2009) 1301 1302=head1 SEE ALSO 1303 1304perl(1) 1305 1306=cut 1307