File: vcfregionreduce_uncompressed

package info (click to toggle)
libvcflib 1.0.0~rc2+dfsg-2
  • links: PTS, VCS
  • area: main
  • in suites: buster
  • size: 51,048 kB
  • sloc: cpp: 30,004; perl: 474; sh: 247; makefile: 206; python: 200; ansic: 148
file content (29 lines) | stat: -rwxr-xr-x 835 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
#!/bin/bash

# Require exactly two arguments (region file, directory). Otherwise print the
# usage text to stderr and exit with status 1.
# Note: this variant reads *uncompressed* per-region files ([region].vcf);
# only the merged output is bgzip-compressed.
if [[ $# -ne 2 ]]; then
    {
        printf 'Usage: %s [region file] [directory]\n' "$0"
        printf '\n'
        printf '%s\n' \
            'Generates `basename directory`.vcf.gz, which is the concatenation' \
            'of files in the directory named [directory]/[region1].vcf,' \
            '[directory]/[region2].vcf, etc. in the order in which they' \
            'occur in the region file.' \
            '' \
            'A tabix index is subsequently generated.'
    } >&2
    exit 1
fi

# Inputs:
#   $1  region file: one region name per line, in the desired output order
#   $2  directory holding one uncompressed VCF per region, named <region>.vcf
# Output:
#   <basename of $2>.vcf.gz (bgzip-compressed) plus its tabix index, both
#   written relative to the current working directory.
regionfile=$1
mergedir=$2
mergename=$(basename -- "$mergedir")
vcfgenotypes=$mergename.vcf.gz
#vcfsites=$mergename.sites.vcf.gz

# Let a failure in any pipeline stage show up in the pipeline's exit status,
# so a broken concatenation is never compressed and indexed as if complete.
set -o pipefail

if [[ ! -r "$regionfile" ]]; then
    echo "Error: cannot read region file '$regionfile'" >&2
    exit 1
fi

# Build the ordered list of per-region VCF paths. Reading line by line keeps
# the "first file" and the file list consistent with each other; `read`
# trims surrounding whitespace, and blank lines are skipped. The `|| [[ -n ]]`
# clause picks up a final line that lacks a trailing newline.
files=()
while read -r region || [[ -n "$region" ]]; do
    [[ -n "$region" ]] || continue
    files+=("$mergedir/$region.vcf")
done < "$regionfile"

if [[ ${#files[@]} -eq 0 ]]; then
    echo "Error: region file '$regionfile' lists no regions" >&2
    exit 1
fi

# Check every input up front so nothing is written when a region is missing.
for file in "${files[@]}"; do
    if [[ ! -r "$file" ]]; then
        echo "Error: cannot read region VCF '$file'" >&2
        exit 1
    fi
done

{
    # Header: the leading run of '#' lines of the first region's VCF. sed
    # stops at the first non-header line, so there is no cap on header length.
    sed -n -e '/^#/!q' -e 'p' < "${files[0]}" || exit 1

    # Body: every non-header line of each region, in region-file order.
    for file in "${files[@]}"; do
        grep -v '^#' < "$file"
        status=$?
        # grep exits 1 when a region has no variant lines; that is not an
        # error. Anything above 1 is a real failure.
        (( status <= 1 )) || exit "$status"
    done
} | bgzip > "$vcfgenotypes" || {
    echo "Error: failed to write '$vcfgenotypes'" >&2
    exit 1
}

# Index only after the compressed file was written successfully.
tabix -p vcf "$vcfgenotypes"