commit for archiving

2025-08-27 09:03:01 +02:00
commit a163c80769
140 changed files with 49745 additions and 0 deletions
@@ -0,0 +1,497 @@
+package Data::Dump;
+
+use strict;
+use vars qw(@EXPORT_OK $VERSION $DEBUG);
+
+require Exporter;
+*import = \&Exporter::import;
+@EXPORT_OK=qw(dump pp);
+
+$VERSION = "1.08";  # $Date: 2006/11/29 10:47:17 $
+$DEBUG = 0;
+
+use overload ();
+use vars qw(%seen %refcnt @dump @fixup %require $TRY_BASE64);
+
+$TRY_BASE64 = 50 unless defined $TRY_BASE64;
+
+my %is_perl_keyword = map { $_ => 1 }
+qw( __FILE__ __LINE__ __PACKAGE__ __DATA__ __END__ AUTOLOAD BEGIN CORE
+DESTROY END EQ GE GT INIT LE LT NE abs accept alarm and atan2 bind
+binmode bless caller chdir chmod chomp chop chown chr chroot close
+closedir cmp connect continue cos crypt dbmclose dbmopen defined
+delete die do dump each else elsif endgrent endhostent endnetent
+endprotoent endpwent endservent eof eq eval exec exists exit exp fcntl
+fileno flock for foreach fork format formline ge getc getgrent
+getgrgid getgrnam gethostbyaddr gethostbyname gethostent getlogin
+getnetbyaddr getnetbyname getnetent getpeername getpgrp getppid
+getpriority getprotobyname getprotobynumber getprotoent getpwent
+getpwnam getpwuid getservbyname getservbyport getservent getsockname
+getsockopt glob gmtime goto grep gt hex if index int ioctl join keys
+kill last lc lcfirst le length link listen local localtime lock log
+lstat lt m map mkdir msgctl msgget msgrcv msgsnd my ne next no not oct
+open opendir or ord pack package pipe pop pos print printf prototype
+push q qq qr quotemeta qw qx rand read readdir readline readlink
+readpipe recv redo ref rename require reset return reverse rewinddir
+rindex rmdir s scalar seek seekdir select semctl semget semop send
+setgrent sethostent setnetent setpgrp setpriority setprotoent setpwent
+setservent setsockopt shift shmctl shmget shmread shmwrite shutdown
+sin sleep socket socketpair sort splice split sprintf sqrt srand stat
+study sub substr symlink syscall sysopen sysread sysseek system
+syswrite tell telldir tie tied time times tr truncate uc ucfirst umask
+undef unless unlink unpack unshift untie until use utime values vec
+wait waitpid wantarray warn while write x xor y);
+
+
+sub dump
+{
+    local %seen;
+    local %refcnt;
+    local %require;
+    local @fixup;
+
+    my $name = "a";
+    my @dump;
+
+    for my $v (@_) {
+	my $val = _dump($v, $name, [], tied($v));
+	push(@dump, [$name, $val]);
+    } continue {
+	$name++;
+    }
+
+    my $out = "";
+    if (%require) {
+	for (sort keys %require) {
+	    $out .= "require $_;\n";
+	}
+    }
+    if (%refcnt) {
+	# output all those with refcounts first
+	for (@dump) {
+	    my $name = $_->[0];
+	    if ($refcnt{$name}) {
+		$out .= "my \$$name = $_->[1];\n";
+		undef $_->[1];
+	    }
+	}
+	for (@fixup) {
+	    $out .= "$_;\n";
+	}
+    }
+
+    my $paren = (@dump != 1);
+    $out .= "(" if $paren;
+    $out .= format_list($paren, undef,
+			map {defined($_->[1]) ? $_->[1] : "\$".$_->[0]}
+			    @dump
+		       );
+    $out .= ")" if $paren;
+
+    if (%refcnt || %require) {
+	$out .= ";\n";
+	$out =~ s/^/  /gm;  # indent
+	$out = "do {\n$out}";
+    }
+
+    #use Data::Dumper;   print Dumper(\%refcnt);
+    #use Data::Dumper;   print Dumper(\%seen);
+
+    print STDERR "$out\n" unless defined wantarray;
+    $out;
+}
+
+*pp = \&dump;
+
+sub _dump
+{
+    my $ref  = ref $_[0];
+    my $rval = $ref ? $_[0] : \$_[0];
+    shift;
+
+    my($name, $idx, $dont_remember) = @_;
+
+    my($class, $type, $id);
+    if (overload::StrVal($rval) =~ /^(?:([^=]+)=)?([A-Z]+)\(0x([^\)]+)\)$/) {
+	$class = $1;
+	$type  = $2;
+	$id    = $3;
+    } else {
+	die "Can't parse " . overload::StrVal($rval);
+    }
+    if ($] < 5.008 && $type eq "SCALAR") {
+	$type = "REF" if $ref eq "REF";
+    }
+    warn "\$$name(@$idx) $class $type $id ($ref)" if $DEBUG;
+
+    unless ($dont_remember) {
+	if (my $s = $seen{$id}) {
+	    my($sname, $sidx) = @$s;
+	    $refcnt{$sname}++;
+	    my $sref = fullname($sname, $sidx,
+				($ref && $type eq "SCALAR"));
+	    warn "SEEN: [\$$name(@$idx)] => [\$$sname(@$sidx)] ($ref,$sref)" if $DEBUG;
+	    return $sref unless $sname eq $name;
+	    $refcnt{$name}++;
+	    push(@fixup, fullname($name,$idx)." = $sref");
+	    return "do{my \$fix}" if @$idx && $idx->[-1] eq '$';
+	    return "'fix'";
+	}
+	$seen{$id} = [$name, $idx];
+    }
+
+    my $out;
+    if ($type eq "SCALAR" || $type eq "REF") {
+	if ($ref) {
+	    if ($class && $class eq "Regexp") {
+		my $v = "$rval";
+
+		my $mod = "";
+		if ($v =~ /^\(\?([msix-]+):([\x00-\xFF]*)\)\z/) {
+		    $mod = $1;
+		    $v = $2;
+		    $mod =~ s/-.*//;
+		}
+
+		my $sep = '/';
+		my $sep_count = ($v =~ tr/\///);
+		if ($sep_count) {
+		    # see if we can find a better one
+		    for ('|', ',', ':', '#') {
+			my $c = eval "\$v =~ tr/\Q$_\E//";
+			#print "SEP $_ $c $sep_count\n";
+			if ($c < $sep_count) {
+			    $sep = $_;
+			    $sep_count = $c;
+			    last if $sep_count == 0;
+			}
+		    }
+		}
+		$v =~ s/\Q$sep\E/\\$sep/g;
+
+		$out = "qr$sep$v$sep$mod";
+		undef($class);
+	    }
+	    else {
+		delete $seen{$id} if $type eq "SCALAR";  # will be seen again shortly
+		my $val = _dump($$rval, $name, [@$idx, "\$"]);
+		$out = $class ? "do{\\(my \$o = $val)}" : "\\$val";
+	    }
+	} else {
+	    if (!defined $$rval) {
+		$out = "undef";
+	    }
+	    elsif ($$rval =~ /^-?[1-9]\d{0,9}$/ || $$rval eq "0") {
+		$out = $$rval;
+	    }
+	    else {
+		$out = quote($$rval);
+	    }
+	    if ($class && !@$idx) {
+		# Top is an object, not a reference to one as perl needs
+		$refcnt{$name}++;
+		my $obj = fullname($name, $idx);
+		my $cl  = quote($class);
+		push(@fixup, "bless \\$obj, $cl");
+	    }
+	}
+    }
+    elsif ($type eq "GLOB") {
+	if ($ref) {
+	    delete $seen{$id};
+	    my $val = _dump($$rval, $name, [@$idx, "*"]);
+	    $out = "\\$val";
+	    if ($out =~ /^\\\*Symbol::/) {
+		$require{Symbol}++;
+		$out = "Symbol::gensym()";
+	    }
+	} else {
+	    my $val = "$$rval";
+	    $out = "$$rval";
+
+	    for my $k (qw(SCALAR ARRAY HASH)) {
+		my $gval = *$$rval{$k};
+		next unless defined $gval;
+		next if $k eq "SCALAR" && ! defined $$gval;  # always there
+		my $f = scalar @fixup;
+		push(@fixup, "RESERVED");  # overwritten after _dump() below
+		$gval = _dump($gval, $name, [@$idx, "*{$k}"]);
+		$refcnt{$name}++;
+		my $gname = fullname($name, $idx);
+		$fixup[$f] = "$gname = $gval";  #XXX indent $gval
+	    }
+	}
+    }
+    elsif ($type eq "ARRAY") {
+	my @vals;
+	my $tied = tied_str(tied(@$rval));
+	my $i = 0;
+	for my $v (@$rval) {
+	    push(@vals, _dump($v, $name, [@$idx, "[$i]"], $tied));
+	    $i++;
+	}
+	$out = "[" . format_list(1, $tied, @vals) . "]";
+    }
+    elsif ($type eq "HASH") {
+	my(@keys, @vals);
+	my $tied = tied_str(tied(%$rval));
+
+	# statistics to determine variation in key lengths
+	my $kstat_max = 0;
+	my $kstat_sum = 0;
+	my $kstat_sum2 = 0;
+
+	my @orig_keys = keys %$rval;
+	my $text_keys = 0;
+	for (@orig_keys) {
+	    $text_keys++, last unless $_ eq "0" || /^[-+]?[1-9]\d*(?:.\d+)?\z/;
+	}
+
+	if ($text_keys) {
+	    @orig_keys = sort @orig_keys;
+	}
+	else {
+	    @orig_keys = sort { $a <=> $b } @orig_keys;
+	}
+
+	for my $key (@orig_keys) {
+	    my $val = \$rval->{$key};
+	    $key = quote($key) if $is_perl_keyword{$key} ||
+		                  !($key =~ /^[a-zA-Z_]\w{0,19}\z/ ||
+				    $key =~ /^-?[1-9]\d{0,8}\z/
+				    );
+
+	    $kstat_max = length($key) if length($key) > $kstat_max;
+	    $kstat_sum += length($key);
+	    $kstat_sum2 += length($key)*length($key);
+
+	    push(@keys, $key);
+	    push(@vals, _dump($$val, $name, [@$idx, "{$key}"], $tied));
+	}
+	my $nl = "";
+	my $klen_pad = 0;
+	my $tmp = "@keys @vals";
+	if (length($tmp) > 60 || $tmp =~ /\n/ || $tied) {
+	    $nl = "\n";
+
+	    # Determine what padding to add
+	    if ($kstat_max < 4) {
+		$klen_pad = $kstat_max;
+	    }
+	    elsif (@keys >= 2) {
+		my $n = @keys;
+		my $avg = $kstat_sum/$n;
+		my $stddev = sqrt(($kstat_sum2 - $n * $avg * $avg) / ($n - 1));
+
+		# I am not actually very happy with this heuristics
+		if ($stddev / $kstat_max < 0.25) {
+		    $klen_pad = $kstat_max;
+		}
+		if ($DEBUG) {
+		    push(@keys, "__S");
+		    push(@vals, sprintf("%.2f (%d/%.1f/%.1f)",
+					$stddev / $kstat_max,
+					$kstat_max, $avg, $stddev));
+		}
+	    }
+	}
+	$out = "{$nl";
+	$out .= "  # $tied$nl" if $tied;
+	while (@keys) {
+	    my $key = shift @keys;
+	    my $val = shift @vals;
+	    my $pad = " " x ($klen_pad + 6);
+	    $val =~ s/\n/\n$pad/gm;
+	    $key = " $key" . " " x ($klen_pad - length($key)) if $nl;
+	    $out .= " $key => $val,$nl";
+	}
+	$out =~ s/,$/ / unless $nl;
+	$out .= "}";
+    }
+    elsif ($type eq "CODE") {
+	$out = 'sub { "???" }';
+    }
+    else {
+	warn "Can't handle $type data";
+	$out = "'#$type#'";
+    }
+
+    if ($class && $ref) {
+	$out = "bless($out, " . quote($class) . ")";
+    }
+    return $out;
+}
+
+sub tied_str {
+    my $tied = shift;
+    if ($tied) {
+	if (my $tied_ref = ref($tied)) {
+	    $tied = "tied $tied_ref";
+	}
+	else {
+	    $tied = "tied";
+	}
+    }
+    return $tied;
+}
+
+sub fullname
+{
+    my($name, $idx, $ref) = @_;
+    substr($name, 0, 0) = "\$";
+
+    my @i = @$idx;  # need copy in order to not modify @$idx
+    if ($ref && @i && $i[0] eq "\$") {
+	shift(@i);  # remove one deref
+	$ref = 0;
+    }
+    while (@i && $i[0] eq "\$") {
+	shift @i;
+	$name = "\$$name";
+    }
+
+    my $last_was_index;
+    for my $i (@i) {
+	if ($i eq "*" || $i eq "\$") {
+	    $last_was_index = 0;
+	    $name = "$i\{$name}";
+	} elsif ($i =~ s/^\*//) {
+	    $name .= $i;
+	    $last_was_index++;
+	} else {
+	    $name .= "->" unless $last_was_index++;
+	    $name .= $i;
+	}
+    }
+    $name = "\\$name" if $ref;
+    $name;
+}
+
+sub format_list
+{
+    my $paren = shift;
+    my $comment = shift;
+    my $indent_lim = $paren ? 0 : 1;
+    my $tmp = "@_";
+    if ($comment || (@_ > $indent_lim && (length($tmp) > 60 || $tmp =~ /\n/))) {
+	my @elem = @_;
+	for (@elem) { s/^/  /gm; }   # indent
+	return "\n" . ($comment ? "  # $comment\n" : "") .
+               join(",\n", @elem, "");
+    } else {
+	return join(", ", @_);
+    }
+}
+
+my %esc = (
+    "\a" => "\\a",
+    "\b" => "\\b",
+    "\t" => "\\t",
+    "\n" => "\\n",
+    "\f" => "\\f",
+    "\r" => "\\r",
+    "\e" => "\\e",
+);
+
+# put a string value in double quotes
+sub quote {
+  local($_) = $_[0];
+  if (length($_) > 20) {
+      # Check for repeated string
+      if (/^(.{1,5}?)(\1*)$/s) {
+	  my $base   = quote($1);
+	  my $repeat = length($2)/length($1) + 1;
+	  return "($base x $repeat)";
+      }
+  }
+  # If there are many '"' we might want to use qq() instead
+  s/([\\\"\@\$])/\\$1/g;
+  return qq("$_") unless /[^\040-\176]/;  # fast exit
+
+  s/([\a\b\t\n\f\r\e])/$esc{$1}/g;
+
+  # no need for 3 digits in escape for these
+  s/([\0-\037])(?!\d)/sprintf('\\%o',ord($1))/eg;
+
+  s/([\0-\037\177-\377])/sprintf('\\x%02X',ord($1))/eg;
+  s/([^\040-\176])/sprintf('\\x{%X}',ord($1))/eg;
+
+  if (length($_) > 40  && !/\\x\{/ && length($_) > (length($_[0]) * 2)) {
+      # too much binary data, better to represent as a hex/base64 string
+
+      # Base64 is more compact than hex when string is longer than
+      # 17 bytes (not counting any require statement needed).
+      # But on the other hand, hex is much more readable.
+      if ($TRY_BASE64 && length($_[0]) > $TRY_BASE64 &&
+	  eval { require MIME::Base64 })
+      {
+	  $require{"MIME::Base64"}++;
+	  return "MIME::Base64::decode(\"" .
+	             MIME::Base64::encode($_[0],"") .
+		 "\")";
+      }
+      return "pack(\"H*\",\"" . unpack("H*", $_[0]) . "\")";
+  }
+
+  return qq("$_");
+}
+
+1;
+
+__END__
+
+=head1 NAME
+
+Data::Dump - Pretty printing of data structures
+
+=head1 SYNOPSIS
+
+ use Data::Dump qw(dump);
+
+ $str = dump(@list)
+ @copy_of_list = eval $str;
+
+=head1 DESCRIPTION
+
+This module provides a single function called dump() that takes a list
+of values as its argument and produces a string as its result.  The string
+contains Perl code that, when C<eval>ed, produces a deep copy of the
+original arguments.  The string is formatted for easy reading.
+
+If dump() is called in a void context, then the dump is printed on
+STDERR instead of being returned.
+
+If you don't like importing a function that overrides Perl's
+not-so-useful builtin, then you can also import the same function as
+pp(), mnemonic for "pretty-print".
+
+=head1 HISTORY
+
+The C<Data::Dump> module grew out of frustration with Sarathy's
+in-most-cases-excellent C<Data::Dumper>.  Basic ideas and some code are shared
+with Sarathy's module.
+
+The C<Data::Dump> module provides a much simpler interface than
+C<Data::Dumper>.  No OO interface is available and there are no
+configuration options to worry about (yet :-).  The other benefit is
+that the dump produced does not try to set any variables.  It only
+returns what is needed to produce a copy of the arguments.  This means
+that C<dump("foo")> simply returns C<"foo">, and C<dump(1..5)> simply
+returns C<(1, 2, 3, 4, 5)>.
+
+=head1 SEE ALSO
+
+L<Data::Dumper>, L<Storable>
+
+=head1 AUTHORS
+
+The C<Data::Dump> module is written by Gisle Aas <gisle@aas.no>, based
+on C<Data::Dumper> by Gurusamy Sarathy <gsar@umich.edu>.
+
+ Copyright 1998-2000,2003-2004 Gisle Aas.
+ Copyright 1996-1998 Gurusamy Sarathy.
+
+This library is free software; you can redistribute it and/or
+modify it under the same terms as Perl itself.
+
+=cut