App-RL
view release on metacpan or search on metacpan
lib/App/RL/Command/gff.pm view on Meta::CPAN
package App::RL::Command::gff;
use strict;
use warnings;
use autodie;
use App::RL -command;
use App::RL::Common;
# One-line summary of this command.
# Takes no arguments; description() in this file reuses the returned text.
sub abstract {
    my $summary = q{convert gff3 files to chromosome runlists};
    return $summary;
}
# Command-line option specification for this command.
# Returns a list of [ option-spec, help-text ] pairs followed by one
# trailing hash of settings (show_defaults => 1).
# NOTE(review): presumably consumed by the App::Cmd option parser pulled
# in through `use App::RL -command` -- confirm against App::RL.
sub opt_spec {
    my $outfile  = [ "outfile|o=s", "output filename. [stdout] for screen" ];
    my $tag      = [ "tag|t=s",     "primary tag (the third field)" ];
    my $remove   = [ "remove|r",    "remove 'chr0' from chromosome names" ];
    my $settings = { show_defaults => 1, };

    # Keep a plain parenthesised list so the result is the same in any
    # calling context as a literal list would be.
    return ( $outfile, $tag, $remove, $settings );
}
# Usage line for this command: one required input file, optionally
# followed by more input files.
sub usage_desc {
    my $usage = q{runlist gff [options] <infile> [more infiles]};
    return $usage;
}
# Long help text for this command.
# Returns the abstract with its first letter upper-cased and a trailing
# period, followed by a note about the accepted input files.
sub description {
    my @parts = (
        ucfirst( abstract() ) . ".\n",
        "* .gff files can be gzipped\n",
    );
    return join q{}, @parts;
}
# Check the positional arguments and fill in the default output name.
#
#   $self - command object; must provide usage_error()
#   $opt  - hash ref of parsed options; $opt->{outfile} may be set here
#   $args - array ref of input file names
#
# Reports a usage error when no input file is given, or when an input
# other than the literal name "stdin" (any letter case) is not a regular
# file. When no outfile option is present, it defaults to the absolute
# path of the first input with ".yml" appended.
# NOTE(review): usage_error() is presumably fatal (App::Cmd convention),
# so nothing after a reported error is expected to run -- confirm.
sub validate_args {
    my ( $self, $opt, $args ) = @_;

    my @infiles = @{$args};

    if ( !@infiles ) {
        my $message = join q{},
            "This command need one or more input files.\n\tIt found",
            ( map { sprintf " [%s]", $_ } @infiles ),
            ".\n";
        $self->usage_error($message);
    }

    for my $infile (@infiles) {

        # "stdin" is a pseudo file name and is never checked on disk
        next if lc($infile) eq "stdin";
        next if Path::Tiny::path($infile)->is_file;

        $self->usage_error("The input file [$infile] doesn't exist.");
    }

    # Only an absent key triggers the default; an explicit value is kept
    if ( !exists $opt->{outfile} ) {
        my $first_input = Path::Tiny::path( $args->[0] )->absolute;
        $opt->{outfile} = $first_input . ".yml";
    }
}
sub execute {
my ( $self, $opt, $args ) = @_;
#----------------------------#
# Loading
#----------------------------#
my $set_of = {};
for my $infile ( @{$args} ) {
my @lines = App::RL::Common::read_lines($infile);
for my $line (@lines) {
next if substr( $line, 0, 1 ) eq "#";
my @array = split( "\t", $line );
my $feature_type = $array[2];
if ( defined $opt->{tag} ) {
next if $opt->{tag} ne $feature_type;
}
my $chr_name = $array[0];
my $chr_start = $array[3];
my $chr_end = $array[4];
if ( $opt->{remove} ) {
$chr_name =~ s/chr0?//i;
$chr_name =~ s/\.\d+$//;
}
if ( !exists $set_of->{$chr_name} ) {
$set_of->{$chr_name} = App::RL::Common::new_set;
}
$set_of->{$chr_name}->add_pair( $chr_start, $chr_end );
}
}
# IntSpan to runlist
for my $chr_name ( keys %{$set_of} ) {
$set_of->{$chr_name} = $set_of->{$chr_name}->runlist;
}
( run in 1.505 second using v1.01-cache-2.11-cpan-39bf76dae61 )