File: STAR_align_log_parser.py

package info (click to toggle)
trinityrnaseq 2.15.2+dfsg-1
  • links: PTS, VCS
  • area: main
  • in suites: trixie
  • size: 468,004 kB
  • sloc: perl: 49,905; cpp: 17,993; java: 12,489; python: 3,282; sh: 1,989; ansic: 985; makefile: 717; xml: 62
file content (50 lines) | stat: -rwxr-xr-x 1,074 bytes parent folder | download | duplicates (2)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
#!/usr/bin/env python

import sys, os, re



# Placeholder written for a column that a given log file does not provide.
_MISSING_VALUE = "NA"


def _parse_star_log(log_filename):
    """Return the ``key | value`` fields of one log file as ordered pairs.

    A line counts as a field only when it contains exactly one ``|``;
    lines without a separator, or with more than one, are skipped.  Keys
    and values are stripped of surrounding whitespace.  The result is a
    list of ``(key, value)`` tuples in file order.
    """
    pairs = []
    with open(log_filename) as fh:
        for line in fh:
            vals = line.rstrip().split("|")
            if len(vals) != 2:
                continue
            pairs.append((vals[0].strip(), vals[1].strip()))
    return pairs


def main():
    """Merge one or more STAR ``Log.final.out`` files into a TSV on stdout.

    Command-line arguments (``sys.argv[1:]``) are the log file paths.  The
    first file defines the column set and column order; a header row is
    printed once, followed by one row per file whose first column
    (``sample_name``) is the path as given on the command line.

    A later file that lacks one of the header's fields gets
    ``_MISSING_VALUE`` in that column and a warning on stderr, instead of
    aborting the whole table with a ``KeyError``.  Fields that appear only
    in later files are not part of the header and are therefore not output.

    Exits with the usage message when no file is given, and with status 0
    after all files were written.
    """
    usage = "\n\n\tusage: {} STAR.Log.final.out [STAR.Log.final.out ...]\n\n".format(sys.argv[0])
    if len(sys.argv) < 2:
        # sys.exit rather than the bare ``exit`` builtin: the latter is
        # injected by the ``site`` module and is not always available.
        sys.exit(usage)

    tokens = ['sample_name']
    processed_first = False

    for log_filename in sys.argv[1:]:

        token_to_val = {'sample_name': log_filename}

        for key, val in _parse_star_log(log_filename):
            if not processed_first:
                # Only the first file contributes columns to the header.
                tokens.append(key)
            token_to_val[key] = val

        if not processed_first:
            # print header
            print("\t".join(tokens))
            processed_first = True

        missing = [tok for tok in tokens if tok not in token_to_val]
        if missing:
            sys.stderr.write(
                "warning: {} is missing field(s): {}\n".format(
                    log_filename, ", ".join(missing)))

        print("\t".join(token_to_val.get(tok, _MISSING_VALUE) for tok in tokens))

    sys.exit(0)



# Run the command-line entry point only when executed as a script,
# not when this file is imported as a module.
if __name__ == "__main__":
    main()