Data-Dmap/lib/Data/Dmap.pm
package Data::Dmap;
use warnings;
use strict;
require v5.10;
use feature 'switch';
use Exporter 'import';
our @EXPORT = qw{ dmap };
our @EXPORT_OK = qw{ cut };
use Carp 'croak';
use Scalar::Util qw{ reftype refaddr };
use Try::Tiny;
=head1 NAME
Data::Dmap - just like map, but on deep data structures
=head1 VERSION
Version 0.08.
=cut
our $VERSION = '0.08';
=head1 SYNOPSIS
This module provides the single function C<dmap> which carries out a
C<map>-like operation on deep data structures.
use Data::Dmap;
my $foo = {
cars => [ 'ford', 'opel', 'BMW' ],
birds => [ 'cuckatoo', 'ostrich', 'frigate' ],
handler => sub { print "barf\n" }
};
# This removes all keys named 'cars'
my($bar) = dmap { delete $_->{cars} if ref eq 'HASH'; $_ } $foo;
# This replaces arrays with the number of elements they contains
my($other) = dmap { $_ = scalar @$_ if ref eq 'ARRAY'; $_ } $foo;
use Data::Dumper;
print Dumper $other;
#
# Prints
# {
# birds => 3,
# handler => sub { "DUMMY" }
# }
# (Data::Dumper doesn't dump subs)
$other->{handler}->();
# Prints
# barf
=head1 EXPORTS
=over
=item C<dmap> (always exported) - the dmap function that does deep in-place mapping
=item C<cut> (optional) - a function for stopping recursion.
=back
=head1 SUBROUTINES
=head2 C<dmap>
This function works like C<map> - it takes an expression followed by a list,
evaluates the expression on each member of the list and returns the result.
The only difference is that any references returned by the expression will
also be traversed and passed to the expression once again, thus making it
possible to make deep traversal of any data structure.
Objects (references blessed to something) are just traversed as if they
weren't blessed.
=head3 Examples
Delete all hash references
use Data::Dmap;
use Data::Dump 'pp';
pp dmap { return $_ unless ref eq 'HASH'; return; } 1, 'foo', [ { a => 1 }, 2];
# Prints:
# (1, "foo", [2])
Delete every odd number
use Data::Dmap;
use Data::Dump 'pp';
pp dmap { return if $_ % 2; $_ } [ 1 .. 10 ];
# Prints:
# [2, 4, 6, 8, 10]
Replace all hash refs with some C<$object> of class C<thingy>.
use Data::Dmap;
use Data::Dump 'pp';
pp dmap { return bless $_, 'thingy' if ref eq 'HASH'; $_ } [ 1, "hello", { a => 1 } ];
# Prints:
# [1, "hello", bless({ a => 1 }, "thingy")]
C<dmap> understands what you want, if you return nothing (as opposed to C<undef>) when
evaluating the expression for a hash key:
use Data::Dmap;
use Data::Dump 'pp;
my $characters = { main => 'pooh', secondary => 'piglet' };
pp dmap { return if $_ eq "piglet"; $_ } $characters;
# Prints:
# { main => "pooh" }
Because the output from the expression is being traversed, you can use C<dmap> to generate
data structures:
use Data::Dmap;
use Data::Dump 'pp';
my $height = 3;
pp dmap { if(ref eq 'HASH' and $height--) { $_->{a} = {height => $height} } $_ } {};
# Prints:
# {
# a => {
# a => {
# a => {
# height => 0
# },
# height => 1
# },
# height => 2
# }
# }
# (My own formatting above.)
=head2 C<cut>
The C<cut> routine stops recursion at any point and returns any data as it is
in place of the current node.
=head3 Examples
use Data::Dmap 'cut';
use Data::Dump 'pp';
my $deep = {
level => 1,
data => {
level => 2,
data => {
level => 3
}
}
};
pp dmap { cut('stop') if ref eq 'HASH' and $_->{level} == 2} $deep;
# Prints:
#
# { data => { data => "stop", level => 2 }, level => 1 }
=cut
sub _store_cache {
my $cache = shift;
my $ref = shift;
$cache->{refaddr($ref)} = [@_];
}
sub _get_cache {
my $cache = shift;
my $ref = shift;
@{$cache->{refaddr($ref)}};
}
sub _has_cache {
my $cache = shift;
my $ref = shift;
exists $cache->{refaddr($ref)};
}
sub _dmap {
my $cache = shift;
my $callback = shift;
map {
my @result;
if(ref) {
my $orig_ref = $_;
if(not _has_cache($cache, $orig_ref)) {
my $recurse = 1;
my @mapped;
try {
@mapped = $callback->($orig_ref);
} catch {
if(ref eq 'Data::Dmap::Cut') {
$recurse = 0;
@result = @$_;
} else {
die $_
}
};
if($recurse) {
foreach my $val (@mapped) {
given(reftype $val) {
when('HASH') {
for(keys %$val) {
my @res = _dmap($cache, $callback, $val->{$_});
croak 'Multi value return in hash value assignment'
if @res > 1;
if(@res) {
$val->{$_} = $res[0];
} else {
delete $val->{$_};
}
}
push @result, $val;
}
when('ARRAY') {
my $i = 0;
while($i <= $#$val) {
if(exists $val->[$i]) {
# TODO Use splice to allow multi-value returns
my @res = _dmap($cache, $callback, $val->[$i]);
croak 'Multi value return in array single value assignment'
if @res > 1;
if(@res) {
$val->[$i] = $res[0];
} else {
splice @$val, $i, 1;
}
}
$i++;
}
push @result, $val;
}
when('SCALAR') {
my @res = _dmap($cache, $callback, $$val);
croak 'Multi value return in single value assignment'
if @res > 1;
$$val = $res[0] if @res and $$val ne $res[0];
push @result, $val;
}
default {
push @result, $val;
}
}
}
}
_store_cache($cache, $orig_ref, @result);
} else {
push @result, _get_cache($cache, $_);
}
} else {
@result = $callback->($_);
}
@result;
} @_
}
sub cut { die bless [@_], 'Data::Dmap::Cut' }
# Stub that inserts empty map cache
sub dmap(&@) { _dmap({}, @_) }
=head1 AUTHOR
Michael Zedeler, C<< <michael@zedeler.dk> >>
=head1 BUGS
If you find a bug, please consider helping to fix the bug by doing this:
=over
=item * Fork C<Data::Dmap> from L<http://github.com/mzedeler/Data-Dmap>
=item * Write a test case in the C<t> directory, commit and push it.
=item * Fix the bug or (if you don't know how to fix it), report the bug
=back
Bugs and feature requests can be reported through the web interface at
L<http://github.com/mzedeler/Data-Dmap/issues>. I may not be notified, so send
me a mail too.
=head1 SUPPORT
You can find documentation for this module with the perldoc command.
perldoc Data::Dmap
You can also look for information at:
=over 4
=item * The github issue tracker
L<http://github.com/mzedeler/Data-Dmap/issues>
=item * AnnoCPAN: Annotated CPAN documentation
L<http://annocpan.org/dist/Data-Dmap>
=item * CPAN Ratings
L<http://cpanratings.perl.org/d/Data-Dmap>
=item * Search CPAN
L<http://search.cpan.org/dist/Data-Dmap/>
=back
=head1 SEE ALSO
L<Data::Rmap>, L<Data::Visitor>, L<Data::Transformer>, L<Data::Visitor>, L<Data::Walk>.
=head1 TODO
=over
=item Some kind of option making it possible to traverse objects with L<Class::MOP>
metaclasses, so we can avoid breaking encapsulation.
=item Options to provide more information about the current node to the
callback handler, such as path, depth and data types. Should not affect
performance if not used.
=back
=head1 LICENSE AND COPYRIGHT
Copyright 2010 Michael Zedeler.
This program is free software; you can redistribute it and/or modify it
under the terms of either: the GNU General Public License as published
by the Free Software Foundation; or the Artistic License.
See http://dev.perl.org/licenses/ for more information.
=cut
1; # End of Data::Dmap