File: sjCollapseSamples.awk

package info (click to toggle)
rna-star 2.7.8a%2Bdfsg-2
  • links: PTS, VCS
  • area: main
  • in suites: bullseye
  • size: 3,076 kB
  • sloc: cpp: 20,429; awk: 483; ansic: 470; makefile: 181; sh: 31
file content (25 lines) | stat: -rw-r--r-- 548 bytes parent folder | download | duplicates (4)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
# usage:
# awk -f sjCollapseSamples.awk /path/to/all/*/SJ.out.tab | sort -k1,1V -k2,2n -k3,3n > SJ.all
# output columns:
# 1-6 - same as in SJ.out.tab
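# 7   - total number of uniquely mapping reads crossing the junction, summed over all input files
# 8   - total number of multi-mapping reads crossing the junction, summed over all input files
# 9   - maximum spliced alignment overhang over all input files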
# 10  - number of samples the junction was detected in

# Collapse junction records read from any number of SJ.out.tab files into one
# output row per distinct junction (columns 1-6), followed by:
#   summed column 7, summed column 8, maximum of column 9, and the number of
#   input lines that carried the junction (one per sample when each file
#   lists a junction at most once).
# Output order is the unspecified order of awk's "for (key in array)"; pipe
# the result through sort if a defined order is required.

BEGIN {
    # Emit tab-separated columns so the output matches the input layout.
    OFS = "\t";
}

# Only aggregate complete records. Blank or truncated lines would otherwise
# create a bogus junction whose key columns are empty.
NF >= 9 {
    # Columns 1-6 together identify a junction; keep them pre-joined with tabs
    # so the key can be printed verbatim as the first six output columns.
    sj = $1 "\t" $2 "\t" $3 "\t" $4 "\t" $5 "\t" $6;

    nSamples[sj]++;
    nU[sj] += $7;
    nM[sj] += $8;

    # Force a numeric value: $9 is the last field, so with CRLF line endings
    # it carries a trailing "\r" that would otherwise turn the comparison into
    # a string comparison and leak the "\r" into the output.
    overhang = $9 + 0;

    # Test membership explicitly so that the first value seen is always
    # recorded, even when it is 0 (an unset element also compares equal to 0,
    # which previously left the column empty in that case).
    if (!(sj in nO) || nO[sj] < overhang) nO[sj] = overhang;
}

END {
    for (sj in nSamples) print sj, nU[sj], nM[sj], nO[sj], nSamples[sj];
}