Group
Extension

OrePAN2-Indexer-Tiny/lib/OrePAN2/Indexer/Tiny.pm

package OrePAN2::Indexer::Tiny;
use strict;
use warnings;
use utf8;

use Archive::Extract ();
use CPAN::Meta;
use Carp ();
use File::Basename ();
use File::Find qw(find);
use File::Spec ();
use File::Temp qw(tempdir);
use File::pushd qw(pushd);
use IO::Uncompress::Gunzip ('$GunzipError');
use IO::Zlib;
use Parse::LocalDistribution;

our $VERSION = "0.03";

sub new {
    my ($class, %args) = @_;
    unless ( defined $args{directory} ) {
        Carp::croak('Missing mandatory parameter: directory');
    }
    bless {
        index => {},
        %args,
    }, $class;
}

sub add_index {
    my ( $self, $archive_file ) = @_;

    my $archive = Archive::Extract->new( archive => $archive_file );
    my $tmpdir = tempdir( 'orepan2.XXXXXX', TMPDIR => 1, CLEANUP => 1 );
    $archive->extract( to => $tmpdir );

    my $provides = $self->scan_provides( $tmpdir, $archive_file );
    my $path = $self->_orepan_archive_path($archive_file);

    for my $package ( sort keys %{$provides} ) {
        $self->_add_index(
            $package,
            $provides->{$package}->{version},
            $path,
        );
    }
}

# Order of preference is last updated. So if some modules maintain the same
# version number across multiple uploads, we'll point to the module in the
# latest archive.

sub _add_index {
    my ( $self, $package, $version, $archive_file ) = @_;

    if ( $self->{index}{$package} ) {
        my ($orig_ver) = @{ $self->{index}{$package} };

        if ( version->parse($orig_ver) > version->parse($version) ) {
            $version //= 'undef';
            print STDERR "[INFO] Not adding $package in $archive_file\n";
            print STDERR
                "[INFO] Existing version $orig_ver is greater than $version\n";
            return;
        }
    }
    $self->{index}->{$package} = [ $version, $archive_file ];
}

sub _orepan_archive_path {
    my ( $self, $archive_file ) = @_;
    my $path         = File::Spec->abs2rel(
        $archive_file,
        File::Spec->catfile( $self->{directory}, 'authors', 'id' )
    );
    $path =~ s!\\!/!g;
    return $path;
}

sub scan_provides {
    my ( $self, $dir, $archive_file ) = @_;

    my $guard = pushd( glob("$dir/*") );
    for my $mfile ( 'META.json', 'META.yml', 'META.yaml' ) {
        next unless -f $mfile;
        my $meta = eval { CPAN::Meta->load_file($mfile) };
        return $meta->{provides} if $meta && $meta->{provides};

        if ($@) {
            print STDERR "[WARN] Error using '$mfile' from '$archive_file'\n";
            print STDERR "[WARN] $@\n";
            print STDERR "[WARN] Attempting to continue...\n";
        }
    }

    print STDERR
        "[INFO] Found META file in '$archive_file' but it does not contain 'provides'\n";
    print STDERR "[INFO] Scanning for provided modules...\n";

    my $provides = eval { $self->_scan_provides('.') };
    return $provides if $provides;

    print STDERR "[WARN] Error scanning: $@\n";

    # Return empty provides.
    return {};
}

sub _scan_provides {
    my ( $self, $dir, $meta ) = @_;

    my $provides = Parse::LocalDistribution->new( { ALLOW_DEV_VERSION => 1 } )
        ->parse($dir);
    return $provides;
}

sub write_index {
    my ( $self ) = @_;

    my $pkgfname = $self->_package_file();
    mkdir( File::Basename::dirname($pkgfname) );
    my $fh = IO::Zlib->new( $pkgfname, 'w' )
        or die "Cannot open $pkgfname for writing: $!\n";
    print $fh $self->_as_string();
    close $fh;
}

sub _as_string {
    my ( $self ) = @_;

    my @buf;

    push @buf, <<"...";
File:         02packages.details.txt
URL:          http://www.perl.com/CPAN/modules/02packages.details.txt
Description:  DarkPAN
Columns:      package name, version, path
Intended-For: Automated fetch routines, namespace documentation.
Written-By:   OrePAN2::Indexer::Tiny $OrePAN2::Indexer::Tiny::VERSION
Line-Count:   @{[ scalar(keys %{$self->{index}}) ]}
Last-Updated: @{[ scalar localtime ]}
...

    for my $pkg ( sort { lc $a cmp lc $b } keys %{ $self->{index} } ) {
        my $entry = $self->{index}{$pkg};

        # package name, version, path
        push @buf, sprintf '%-22s %-22s %s', $pkg, $entry->[0] || 'undef',
            $entry->[1];
    }
    return join( "\n", @buf ) . "\n";
}

sub load_index {
    my ( $self ) = @_;

    return unless -e $self->_package_file;

    my $fh = IO::Uncompress::Gunzip->new($self->_package_file)
        or die "gzip failed: $GunzipError\n";

    # skip headers
    while (<$fh>) {
        last unless /\S/;
    }

    while (<$fh>) {
        if (/^(\S+)\s+(\S+)\s+(.*)$/) {
            $self->_add_index( $1, $2 eq 'undef' ? undef : $2, $3 );
        }
    }

    close $fh;
}

sub _package_file {
    my ( $self ) = @_;

    return File::Spec->catfile(
        $self->{directory},
        'modules',
        '02packages.details.txt.gz'
    );
}

sub list_archive_files {
    my ( $self ) = @_;

    my $authors_dir = File::Spec->catfile( $self->{directory}, 'authors' );
    return () unless -d $authors_dir;

    my @files;
    find(
        {
            wanted => sub {
                return unless /
                    (?:
                        \.tar\.gz
                        | \.tgz
                        | \.zip
                        )
                        \z/x;
                push @files, $_;
            },
            no_chdir => 1,
        },
        $authors_dir
    );

    # Sort files by modication time so that we can index distributions from
    # earliest to latest version.

    return sort { -M $b <=> -M $a } @files;
}

1;
__END__

=encoding utf-8

=head1 NAME

OrePAN2::Indexer::Tiny - Minimal DarkPAN indexer

=head1 SYNOPSIS

    use OrePAN2::Indexer::Tiny;

    my $orepan = OrePAN2::Indexer::Tiny->new(
        directory => $directory,
    );
    $orepan->load_index();
    for my $archive_file ($self->list_archive_files()) {
        $self->add_index( $archive_file );
    }
    $self->write_index();

=head1 DESCRIPTION

OrePAN2::Indexer::Tiny is minimal L<OrePAN2> indexer which have less dependencies.

Original code is taken from L<OrePAN2>.

=head1 SEE ALSO

L<OrePAN2>

=head1 LICENSE

Copyright (C) Takumi Akiyama.

This library is free software; you can redistribute it and/or modify
it under the same terms as Perl itself.

=head1 AUTHOR

Takumi Akiyama E<lt>t.akiym@gmail.comE<gt>

=cut


Powered by Groonga
Maintained by Kenichi Ishigaki <ishigaki@cpan.org>. If you find anything, submit it on GitHub.