-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathparseNetChop.pl
64 lines (57 loc) · 1.55 KB
/
parseNetChop.pl
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
#!/usr/bin/perl
use warnings;
use strict;
use IO::File;
use List::MoreUtils qw(indexes);
use List::Util qw(max);
my $inresults=0;
my $header = 0;
my @pos;
my @aa;
my @cleave;
my @score;
my @name;
my $inFh = IO::File->new( $ARGV[0] ) || die "can't open file\n";
print "sequence_name max_cleavage_score cleavage_pos\n";
while( my $line = $inFh->getline )
{
chomp($line);
if($line =~ /-----/){ #could be a divider or the line before the data, depending on context
if(!$inresults){
if($header==1){ #this is the line after the header, next line starts the results
$header=0;
$inresults=1;
}
next;
} else { #this signals the end of the results
$inresults=0;
#print data we need
my @sites = indexes { $_ ne "." } @cleave;
print $name[0] . "\t";
print max(@score) . "\t";
print join(",",@pos[@sites]) . "\n";
#empty arrays for next sequence
@pos = ();
@aa = ();
@cleave = ();
@score = ();
@name = ();
next;
}
} else {
if($inresults){
my @F = split(/\s+/,$line);
push(@pos, $F[1]);
push(@aa, $F[2]);
push(@cleave, $F[3]);
push(@score, $F[4]);
push(@name, join(" ",@F[5..$#F]));
} else {
if($line =~ /pos AA/){
$header=1;
next;
}
}
}
}
close($inFh);