App-Anchr
view release on metacpan or search on metacpan
lib/App/Anchr/Command/layout.pm view on Meta::CPAN
package App::Anchr::Command::layout;
use strict;
use warnings;
use autodie;
use App::Anchr -command;
use App::Anchr::Common;
# One-line summary of this subcommand; description() reuses it as its text.
use constant abstract => "layout anchor group";
# Command-line option specification for this subcommand.
#
# Returns a list of option entries, each an array ref of
# [ spec, description, (optional) settings hash ], followed by a trailing
# hash ref carrying show_defaults => 1.
sub opt_spec {
    my $outfile = [ 'outfile|o=s', 'output filename' ];
    my $border  = [ 'border=i', 'length of borders in anchors', { default => 100 } ];
    my $max     = [ 'max=i', 'max distance', { default => 5000 } ];
    my $prefix  = [ 'pa=s', 'prefix of anchors', { default => 'anchor' } ];
    my $overlap = [ 'oa=s', 'overlaps between anchors' ];
    my $png     = [ 'png', 'write a png file via graphviz' ];
    my $global  = { show_defaults => 1 };

    # A plain comma list (not an array) keeps the scalar-context result the
    # same as a literal list: the last element.
    return ( $outfile, $border, $max, $prefix, $overlap, $png, $global );
}
# Returns the one-line usage synopsis: the command name followed by the
# three positional input files it expects.
sub usage_desc {
    my $synopsis = 'anchr layout [options] <.ovlp.tsv> <.relation.tsv> <strand.fasta>';
    return $synopsis;
}
# Returns the long description: the abstract with its first letter
# capitalised, terminated by a period and a newline.
sub description {
    return ucfirst(abstract) . ".\n";
}
# Validate the positional arguments and fill in the default output name.
#
# Parameters:
#   $self - the command object; problems are reported via $self->usage_error
#   $opt  - options, accessed as a hash ref (keys read: oa, outfile)
#   $args - array ref of positional arguments; exactly three are required,
#           matching the three inputs named in usage_desc
#
# Side effects:
#   When no "outfile" key exists in $opt, sets $opt->{outfile} to the absolute
#   path of the first argument with ".contig.fasta" appended.
sub validate_args {
    my ( $self, $opt, $args ) = @_;

    # The command takes exactly three inputs, so say so in the error.
    if ( @{$args} != 3 ) {
        my $found   = join "", map {" [$_]"} @{$args};
        my $message = "This command needs exactly three input files.\n\tIt found$found.\n";
        $self->usage_error($message);
    }

    # Every positional argument must be an existing regular file.
    for my $file ( @{$args} ) {
        if ( !Path::Tiny::path($file)->is_file ) {
            $self->usage_error("The input file [$file] doesn't exist.");
        }
    }

    # The anchor-overlap file is optional, but must exist when given.
    if ( $opt->{oa} ) {
        if ( !Path::Tiny::path( $opt->{oa} )->is_file ) {
            $self->usage_error("The overlap file [$opt->{oa}] doesn't exist.\n");
        }
    }

    # Derive the output name from the first input unless one was supplied.
    if ( !exists $opt->{outfile} ) {
        $opt->{outfile} = Path::Tiny::path( $args->[0] )->absolute . ".contig.fasta";
    }
}
sub execute {
my ( $self, $opt, $args ) = @_;
#----------------------------#
# load overlaps and build graph
#----------------------------#
my $graph = Graph->new( directed => 1 );
my %is_anchor;
my $links_of = {}; # long_id => { anchor_id => overlap_on_long, }
{
open my $in_fh, "<", $args->[0];
my %seen_pair;
while ( my $line = <$in_fh> ) {
my $info = App::Anchr::Common::parse_ovlp_line($line);
# ignore self overlapping
next if $info->{f_id} eq $info->{g_id};
# we've oriented all sequences to the same strand
next if $info->{g_strand} == 1;
# skip duplicated overlaps
my $pair = join( "-", sort ( $info->{f_id}, $info->{g_id} ) );
next if $seen_pair{$pair};
$seen_pair{$pair}++;
$is_anchor{ $info->{f_id} }++ if ( index( $info->{f_id}, $opt->{pa} . "/" ) == 0 );
$is_anchor{ $info->{g_id} }++ if ( index( $info->{g_id}, $opt->{pa} . "/" ) == 0 );
if ( $info->{f_B} > 0 ) {
if ( $info->{f_E} == $info->{f_len} ) {
# f.B f.E
( run in 1.142 second using v1.01-cache-2.11-cpan-0d23b851a93 )