File: merge_pair_and_LR_scaff_links.pl

package info (click to toggle)
trinityrnaseq 2.11.0%2Bdfsg-6
  • links: PTS, VCS
  • area: main
  • in suites: bullseye
  • size: 417,528 kB
  • sloc: perl: 48,420; cpp: 17,749; java: 12,695; python: 3,124; sh: 1,030; ansic: 983; makefile: 688; xml: 62
file content (49 lines) | stat: -rwxr-xr-x 1,073 bytes parent folder | download | duplicates (3)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
#!/usr/bin/env perl

use strict;
use warnings;

my $usage = "\n\n\tusage: $0 scaff_pairs_A.txt scaff_pairs_B.txt ...\n\n";

my @pair_files = @ARGV;
unless (scalar(@pair_files) > 1) {
    die $usage;
}

main: {

    my %top_pairs;
    foreach my $pair_file (@pair_files) {
        open (my $fh, $pair_file) or die "Error, cannot open file $pair_file";
        while (<$fh>) {
            my $line = $_;
            chomp;
            
            my ($iworm_A, $idx_A, $iworm_B, $idx_B, $count) = split(/\t/);

            my $pair_token = join("$;", sort ($iworm_A, $iworm_B));

            if ( (! exists $top_pairs{$pair_token})
                 ||
                 $top_pairs{$pair_token}->{count} < $count) {

                $top_pairs{$pair_token} = { count => $count,
                                            line => $line };

            }
        }
        close $fh;
    }


    my @top_structs = reverse sort {$a->{count} <=> $b->{count}} values %top_pairs;

    foreach my $struct (@top_structs) {

        print $struct->{line};
    
    }

    exit(0);
}