Bio-MUST-Apps-FortyTwo/bin/forty-two.pl
#!/usr/bin/env perl
# PODNAME: forty-two.pl
# ABSTRACT: The Answer to the Ultimate Question of Phylogenomics
# CONTRIBUTOR: Mick VAN VLIERBERGHE <mvanvlierberghe@doct.uliege.be>
use Modern::Perl '2011';
use Getopt::Euclid qw(:vars);
## no critic (RequireLocalizedPunctuationVars)
BEGIN{
$ENV{Smart_Comments} = $ARGV_verbosity
? join q{ }, map { '#' x (2 + $_) } 1..$ARGV_verbosity
: q{}
;
}
## use critic
use Smart::Comments -ENV;
use Config::Any;
use aliased 'Bio::MUST::Apps::FortyTwo';
# read configuration file
my $config = Config::Any->load_files( {
files => [ $ARGV_config ],
flatten_to_hash => 1,
use_ext => 1,
} );
# build ft object
# Note: default args are propagated to all orgs
my $ft = FortyTwo->new(
config => $config->{$ARGV_config},
infiles => \@ARGV_infiles,
);
# use ft as factory for run_proc object
# Note: CLI parameters are introduced here
my %args;
$args{debug_mode} = $ARGV_verbosity > 5 ? 1 : 0;
$args{out_dir} = $ARGV_outdir if $ARGV_outdir;
$args{threads} = $ARGV_threads;
my $rp = $ft->run_proc(\%args);
__END__
=pod
=head1 NAME
forty-two.pl - The Answer to the Ultimate Question of Phylogenomics
=head1 VERSION
version 0.213470
=head1 USAGE
______ __ ______
/ ____/___ _____/ /___ __ /_ __/ ______
/ /_ / __ \/ ___/ __/ / / /_____/ / | | /| / / __ \
/ __/ / /_/ / / / /_/ /_/ /_____/ / | |/ |/ / /_/ /
/_/ \____/_/ \__/\__, / /_/ |__/|__/\____/
/____/
forty-two.pl <infiles> --config=<file> [optional arguments]
=head1 REQUIRED ARGUMENTS
=over
=item <infiles>
Path to input ALI (or FASTA) files [repeatable argument].
forty-two should not be called in a shell loop. If so it will run very
slowly, especially when using tax filters (because loading the NCBI Taxonomy
database is quite long). Use shell jokers instead:
forty-two.pl --config=config.yaml rpl*.ali rps*.ali
=for Euclid: infiles.type: readable
repeatable
=item --config=<file>
Path to the configuration file specifying the run details.
In principle, several configuration file formats are available: XML, JSON,
YAML. However, forty-two was designed with YAML in mind. See the C<test>
directory of the distribution for annotated examples of YAML files.
=for Euclid: file.type: readable
=back
=head1 OPTIONAL ARGUMENTS
=over
=item --threads=<n>
Number of threads to run in parallel [default: n.default]. Parallelization is
achieved by processing several ALI files in parallel using an internal queue.
Therefore, the specified number of threads should not be larger than the
number of input ALI files.
=for Euclid: n.type: +int
n.default: 1
=item --outdir=<dir>
Optional output dir that will contain the enriched ALI files and/or taxonomic
reports (will be created if needed) [default: none]. Otherwise, output files
will be written in the same directory as input files.
=for Euclid: dir.type: writable
=item --verbosity=<level>
Verbosity level for logging to STDERR [default: level.default]. Available
levels range from 0 to 6. Level 6 corresponds to debugging mode.
=for Euclid: level.type: int, level >= 0 && level <= 6
level.default: 0
=item --version
=item --usage
=item --help
=item --man
Print the usual program information
=back
=head1 AUTHOR
Denis BAURAIN <denis.baurain@uliege.be>
=head1 CONTRIBUTOR
=for stopwords Mick VAN VLIERBERGHE
Mick VAN VLIERBERGHE <mvanvlierberghe@doct.uliege.be>
=head1 COPYRIGHT AND LICENSE
This software is copyright (c) 2013 by University of Liege / Unit of Eukaryotic Phylogenomics / Denis BAURAIN.
This is free software; you can redistribute it and/or modify it under
the same terms as the Perl 5 programming language system itself.
=cut