File: merge_replicate_bams_via_samples_file.pl

package info (click to toggle)
trinityrnaseq 2.15.2%2Bdfsg-2
  • links: PTS, VCS
  • area: main
  • in suites: sid
  • size: 468,004 kB
  • sloc: perl: 49,905; cpp: 17,993; java: 12,489; python: 3,282; sh: 1,989; ansic: 985; makefile: 717; xml: 62
file content (40 lines) | stat: -rwxr-xr-x 887 bytes parent folder | download | duplicates (2)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
#!/usr/bin/env perl

use strict;
use warnings;

use File::Glob qw(bsd_glob);

# Command-line handling: two positional arguments are required, the samples
# file followed by the directory that holds the BAM files. If either one is
# missing (or evaluates to false) the usage text is printed and the script
# aborts.
my $usage = "\n\n\tusage: $0 samples_file dir/containing/bams\n\n";

my ($samples_file, $bam_dir_path) = @ARGV;
die $usage unless $samples_file && $bam_dir_path;


# Maps each tissue type (column 1 of the samples file) to the list of BAM
# files belonging to its samples (column 2), in the order the samples appear.
my %tissue_id_to_bams;

# Three-arg open so the file name can never be interpreted as an open mode.
open(my $fh, '<', $samples_file)
    or die "Error, cannot open samples file $samples_file: $!";
while (my $line = <$fh>) {
    chomp $line;
    $line =~ s/\r\z//;           # tolerate CRLF line endings
    next unless $line =~ /\S/;   # skip blank lines instead of globbing "dir/.*.bam"

    # Only the first two tab-delimited columns are used; any others are ignored.
    my ($tissue_type, $sample_id) = split(/\t/, $line);
    unless (defined $sample_id && length $sample_id) {
        die "Error, cannot parse tissue type and sample id from line: $line ";
    }

    # Exactly one BAM named <sample_id>.<anything>.bam must exist in the BAM
    # directory. bsd_glob() does not split the pattern on whitespace, so
    # directory or sample names containing spaces are matched as a whole.
    my $bam_pattern = "$bam_dir_path/$sample_id.*.bam";
    my @bams = bsd_glob($bam_pattern);
    unless (scalar(@bams) == 1) {
        my $found = @bams ? "found " . scalar(@bams) . ": @bams" : "found none";
        die "Error, expected exactly one bam corresponding to $bam_pattern, $found ";
    }
    push (@{$tissue_id_to_bams{$tissue_type}}, $bams[0]);
}
close $fh;

# Merge the BAM files collected for each tissue type into <tissue_id>.bam
# (written relative to the current working directory) by running
# "samtools merge" once per tissue type. Tissue types are processed in sorted
# order so the sequence of commands is the same on every run. The script
# aborts on the first command that fails.
foreach my $tissue_id (sort keys %tissue_id_to_bams) {

    my @bams = @{$tissue_id_to_bams{$tissue_id}};

    # List-form system() bypasses the shell, so whitespace or shell
    # metacharacters in file names reach samtools unmodified.
    my @cmd = ("samtools", "merge", "$tissue_id.bam", @bams);
    print "@cmd\n";
    my $ret = system(@cmd);
    if ($ret == -1) {
        # system() returns -1 when the program could not be started at all.
        die "Error, could not execute samtools: $!";
    }
    if ($ret) {
        die "Error, @cmd died with ret $ret";
    }
}

exit(0);