-
Notifications
You must be signed in to change notification settings - Fork 13
/
Copy pathfinal_process_A5SS_output.pl
134 lines (124 loc) · 5.03 KB
/
final_process_A5SS_output.pl
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
#!/usr/bin/perl
use strict;
use warnings;
use List::Util qw( min max );
use List::Util qw(sum);
use List::MoreUtils qw(uniq);
# Collapse consecutive input rows that share the same AS event (column 1)
# into a single summary row per event.
#
# Usage: final_process_A5SS_output.pl <data_file_1> <data_file_2> <data_file_3>
#   data_file_1  input table (whitespace separated); a line containing
#                "raw_count" is treated as the header line
#   data_file_2  output (OUT1): one summary row per event
#   data_file_3  output (OUT2): input event name -> coordinate-based event ID
#
# Input columns used (0-based): 0 gene, 1 event name, 6 p-value, 7 q-value,
# 8/9 labels used in the deltaPSI header, 11 chromosome, 12/13 coordinates,
# 15 strand, last column deltaPSI.
#
# Rows belonging to one event must be adjacent: grouping is done purely by
# comparing each row's event name with that of the previous row.

# A data row needs at least this many fields so the strand column (index 15)
# is present.
my $MIN_FIELDS = 16;

# Build the accumulator for a new event from its first row.
# The strand of this first row decides, for the whole event, which of the
# coordinate columns is the shared 3' splice site and which one is the
# alternative 5' splice site.
sub start_group {
    my ($fields) = @_;
    my $strand    = $fields->[15];
    my $plus_like = ($strand eq "+") || ($strand eq "*");
    return {
        gene         => $fields->[0],
        as           => $fields->[1],
        chr          => $fields->[11],
        strand       => $strand,
        a5ss_col     => $plus_like ? 12 : 13,
        common3prime => $plus_like ? $fields->[13] : $fields->[12],
        ids          => [],
        pvalues      => [],
        qvalues      => [],
        dpsi         => [],
        a5ss         => [],
    };
}

# Append one row's values to the event accumulator.
sub add_row {
    my ($group, $fields) = @_;
    push @{ $group->{a5ss} },    $fields->[ $group->{a5ss_col} ];
    push @{ $group->{ids} },     $fields->[12], $fields->[13];
    push @{ $group->{pvalues} }, $fields->[6];
    push @{ $group->{qvalues} }, $fields->[7];
    push @{ $group->{dpsi} },    $fields->[-1];
    return;
}

# Write one finished event to both output files.
sub write_group {
    my ($group, $out1_fh, $out2_fh) = @_;

    # Event ID: chromosome, strand and every distinct coordinate in
    # ascending numeric order, joined with underscores.
    my @unique_ids = uniq(@{ $group->{ids} });
    my @sorted_ids = sort { $a <=> $b } @unique_ids;
    my $event_id   = join('_', $group->{chr}, $group->{strand}, @sorted_ids);

    # NOTE(review): only q-values get "NA" mapped to 1 before taking the
    # minimum; p-values are used as-is, exactly like the original script.
    # Confirm whether p-values can be "NA" in the input.
    my $pmin = min @{ $group->{pvalues} };
    my @qvalues = @{ $group->{qvalues} };
    s/NA/1/g for @qvalues;
    my $qmin = min @qvalues;

    print {$out2_fh} join("\t", $group->{as}, $event_id), "\n";
    print {$out1_fh} join("\t",
        $group->{gene},
        $event_id,
        $group->{chr},
        $group->{strand},
        $group->{common3prime},
        join(';', @{ $group->{a5ss} }),
        $pmin,
        $qmin,
        join(';', @{ $group->{dpsi} }),
    ), "\n";
    return;
}

# All three file names are required; extra arguments are ignored.
if (@ARGV < 3) {
    die "Usage:final_process_A5SS_output.pl <data_file_1> <data_file_2> <data_file_3>\n";
}
my ($data_file_1, $data_file_2, $data_file_3) = @ARGV;

# Three-argument open so characters in the file names are never taken as
# an open mode.
open(my $in_fh, '<', $data_file_1)
    or die "can't open input1 file '$data_file_1': $!";
open(my $out1_fh, '>', $data_file_2)
    or die "can't open OUT1 file '$data_file_2': $!";
open(my $out2_fh, '>', $data_file_3)
    or die "can't open OUT2 file '$data_file_3': $!";

# Event currently being accumulated; undef until the first data row is seen.
my $group;

while (my $line = <$in_fh>) {
    chomp $line;

    # Header line: emit the OUT1 header, labelling the deltaPSI column with
    # the values found in header fields 8 and 9.
    if ($line =~ /raw_count/) {
        my @header = split(/\s+/, $line);
        print {$out1_fh} join("\t",
            "Gene", "AS_event_ID", "chromosome", "strand",
            "common_3_SS_coor", "A5SS_coordinates", "pvalue", "qvalue",
            "deltaPSI_" . $header[8] . "-" . $header[9],
        ), "\n";
        next;
    }

    # Blank lines carry no event data.
    next unless $line =~ /\S/;

    my @fields = split(/\s+/, $line);
    if (@fields < $MIN_FIELDS) {
        die "$data_file_1 line $.: expected at least $MIN_FIELDS fields, found "
            . scalar(@fields) . "\n";
    }

    # A change of event name closes the previous event and opens a new one.
    if (!defined $group || $fields[1] ne $group->{as}) {
        write_group($group, $out1_fh, $out2_fh) if defined $group;
        $group = start_group(\@fields);
    }
    add_row($group, \@fields);
}

# Flush the last event, if the input contained any data rows at all.
write_group($group, $out1_fh, $out2_fh) if defined $group;

close($in_fh);
# Buffered write errors only surface at close, so check the output handles.
close($out1_fh) or die "can't close OUT1 file '$data_file_2': $!";
close($out2_fh) or die "can't close OUT2 file '$data_file_3': $!";