File: fastaSplit.pl

package info (click to toggle)
snpeff 5.4.b%2Bdfsg-1
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid
  • size: 757,496 kB
  • sloc: java: 62,572; perl: 2,279; sh: 1,185; python: 744; xml: 507; makefile: 50
file content (42 lines) | stat: -rwxr-xr-x 1,158 bytes parent folder | download | duplicates (3)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
#!/usr/bin/perl

#------------------------------------------------------------------------------
# Split a fasta file (create one file per sequence)
#
#																Pablo Cingolani
#------------------------------------------------------------------------------

use strict;

#------------------------------------------------------------------------------
# Write one sequence to its own fasta file
#
# Parameters:
#   $name : Sequence name. "chr" is prepended unless the name already starts
#           with it, and ".fa" is appended to form the output file name
#   $seq  : Text written verbatim to the file
#
# Prints "Writing to <file>" on STDOUT. Dies if the file cannot be opened,
# written or closed.
#------------------------------------------------------------------------------
sub writeSeq($$) {
	my($name, $seq) = @_;
	if( $name !~ /^chr/ ) { $name = "chr$name"; }
	$name = "$name.fa";
	print "Writing to $name\n";
	# Three-argument open with a lexical handle: the file name must never be
	# interpreted as part of the open mode
	open(my $out, '>', $name) or die "Cannot open '$name' for writing: $!\n";
	print {$out} $seq or die "Cannot write to '$name': $!\n";
	# Errors from buffered writes may only be reported when the handle is closed
	close($out) or die "Cannot close '$name': $!\n";
}

#------------------------------------------------------------------------------
# Main
#------------------------------------------------------------------------------

# Sequence currently being accumulated: its name (first word of the header)
# and its full text, header line included
my($seq, $name) = ('', '');

# Read fasta file from STDIN; each sequence is written out as soon as the
# header of the next one is seen
while( defined(my $line = <STDIN>) ) {
	# Header line: the name is the first run of non-blank characters after
	# '>'. Capturing \S* (rather than requiring whitespace after the name)
	# also recognizes a header on a final line that has no trailing newline.
	if( $line =~ /^>\s*(\S*)/ ) {
		my $newName = $1;
		# Flush whatever was accumulated before this header. Lines seen
		# before the first header are flushed under the empty name.
		if( $seq ne "" ) { writeSeq($name, $seq); }
		# New sequence
		$name = $newName;
		$seq = $line;
	} else { $seq .= $line; }
}

# Write the last sequence (no header follows it to trigger the flush)
if( $seq ne "" ) { writeSeq($name, $seq); }