File: run_benchmark_03_sampling.sh

package info (click to toggle)
seqkit 2.9.0%2Bds-1
  • links: PTS, VCS
  • area: main
  • in suites: trixie
  • size: 72,276 kB
  • sloc: sh: 937; perl: 114; makefile: 14
file content (36 lines) | stat: -rwxr-xr-x 896 bytes parent folder | download | duplicates (4)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
#!/bin/sh
#
# Benchmark C: sampling by number with `seqkit sample`.
#
# For every thread count from 1 up to the number of CPUs, each dataset is
# sampled once under `memusg`. The sampled records are written to a scratch
# file next to the input, which is deleted right after the run.
#
# Expects `memusg` and `seqkit` on PATH, and dataset_A.fa, dataset_B.fa and
# dataset_C.fq in the current directory.

echo 'Test: C) Sampling by number'

# Value passed to `seqkit sample -n` for each dataset.
n=10000     # dataset_A.fa
n2=20       # dataset_B.fa
n3=1000000  # dataset_C.fq

# Count CPUs. The pattern is anchored so only the per-CPU "processor" records
# are counted, not other lines that merely contain the word. When
# /proc/cpuinfo is missing or has no such records, fall back to getconf, and
# finally to a single thread so the benchmark always runs at least once.
NCPUs=$(grep -c '^processor' /proc/cpuinfo 2>/dev/null) ||
    NCPUs=$(getconf _NPROCESSORS_ONLN 2>/dev/null) ||
    NCPUs=1
case $NCPUs in
    '' | *[!0-9]* | 0) NCPUs=1 ;;
esac

# run_sample FILE COUNT THREADS
#
# Benchmarks one `seqkit sample` invocation.
#   FILE     input sequence file
#   COUNT    value for seqkit's -n option
#   THREADS  value for seqkit's -j option
# Prints two progress lines to stdout. The sampled output goes to
# FILE.sample.seqkit.fa (the suffix is kept as-is even for FASTQ input) and is
# removed afterwards.
# POSIX sh has no `local`, so the variables below are prefixed to avoid
# clobbering script-level names.
run_sample() {
    sample_in=$1
    sample_count=$2
    sample_threads=$3
    sample_out=$sample_in.sample.seqkit.fa

    # Read the input once before timing (presumably to warm the OS file
    # cache so every run starts from the same state).
    echo 'read file once with cat'
    cat "$sample_in" > /dev/null

    printf 'data: %s\n' "$sample_in"
    memusg -t -H seqkit sample -2 -n "$sample_count" "$sample_in" \
        -j "$sample_threads" -w 0 > "$sample_out"
    /bin/rm "$sample_out"
}

# Repeat the three benchmarks for each thread count 1..NCPUs.
i=1
while [ "$i" -le "$NCPUs" ]; do
    printf '== %s\n' "$i"

    run_sample dataset_A.fa "$n" "$i"
    run_sample dataset_B.fa "$n2" "$i"
    run_sample dataset_C.fq "$n3" "$i"

    i=$((i + 1))
done