File: all-vs-all.sh

package info (click to toggle)
genometools 1.6.6%2Bds-2
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid
  • size: 50,576 kB
  • sloc: ansic: 271,876; ruby: 29,930; python: 5,106; sh: 3,083; makefile: 1,213; perl: 219; pascal: 159; haskell: 37; sed: 5
file content (23 lines) | stat: -rwxr-xr-x 1,152 bytes parent folder | download | duplicates (6)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
#!/bin/sh
#
# all-vs-all.sh: run the seed_extend checks below for every ordered pair of
# sequence files reported by ${GTDIR}/scripts/findfasta.rb.
#
# Required environment:
#   GTDIR  path to the genometools directory

# -e: stop at the first command that fails; -x: trace each command.
set -ex

# Refuse to run without GTDIR (unset or empty).
: "${GTDIR:?Need to set environment GTDIR as path to genometools directory}"

# Comma-separated file names handed to findfasta.rb through its -e option
# (presumably the inputs to leave out of the comparison -- confirm against
# findfasta.rb).
excludelist='Verysmall.fna,TTTN.fna,description_test.fastq,Random160.fna,description_test2.fastq,Copysorttest.fna,TTT-small.fna,paired_reads_1N_2.p.fastq,Random.fna,wildcard1.fastq,wildcard2.fastq,fastq_problem2.fasta,fastq_problem.fasta,Reads3.fna,invalid_with_pos256_q31.fastq,Small.fna,sg_reads.fastq,Reads2.fna,hop_moderate.fastq,hop_aggressive.fastq'

# Collect the input files once, before looping.
#  * As a plain assignment, a failing findfasta.rb aborts the script under
#    `set -e`; inside a `for ... in $(...)` word list the failure would be
#    ignored and the loops would silently run zero times.
#  * The list is identical for the reference and the query loop, so there is
#    no need to re-run the finder for every reference.
#    NOTE(review): assumes the set of input files does not change while the
#    loops run -- confirm.
fastafiles=$("${GTDIR}/scripts/findfasta.rb" -n -e "${excludelist}")

# ${fastafiles} is expanded unquoted on purpose: the file names must be split
# into separate words (same splitting the original backtick form relied on).
for reference in ${fastafiles}; do
  bin/gt encseq encode -indexname ref-index "${reference}"
  for query in ${fastafiles}; do
    bin/gt encseq encode -indexname query-index "${query}"
    # Run once with the default output and once with "-outfmt seed".
    for mode in "" "-outfmt seed"; do
      # ${mode} stays unquoted on purpose: the empty value must vanish and
      # "-outfmt seed" must become two separate arguments.
      bin/gt seed_extend ${mode} -v -kmerfile no -ii ref-index -maxfreq 20 \
        -qii query-index > tmp.matches
      bin/gt dev show_seedext -a -f tmp.matches
      bin/gt dev show_seedext -e -f tmp.matches
      bin/gt dev show_seedext -a -f tmp.matches -sort
      bin/gt dev show_seedext -e -f tmp.matches -sort
      # Stage the sorted output in a file instead of piping it directly:
      # plain sh has no pipefail, so in a pipeline a failing show_seedext
      # would be hidden behind the exit status of ascQorder.rb.
      bin/gt dev show_seedext -f tmp.matches -sort > tmp.sorted
      ascQorder.rb -c < tmp.sorted
    done
  done
done