File: setup-pbs-align-job.sh

package info (click to toggle)
libgoby-java 3.3.1%2Bdfsg2-9
  • links: PTS, VCS
  • area: main
  • in suites: bookworm
  • size: 58,104 kB
  • sloc: java: 78,105; cpp: 5,011; xml: 3,170; python: 2,108; sh: 1,575; ansic: 277; makefile: 114
file content (96 lines) | stat: -rwxr-xr-x 3,076 bytes parent folder | download | duplicates (2)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
#!/bin/sh

#
# Script to bundle goby and required data into a
# suitable format for submission to a PBS queue
#

# Absolute path to this script.
SCRIPT=$(readlink -f $0)
# Absolute path this script is in.
SCRIPT_DIR=$(dirname $SCRIPT)

if [ -z $1 ]; then
    echo "Job name is required"
    exit 1
fi

. pbs-env.sh

# Local goby locations
GOBY_DIR=${GOBY_DIR:-$SCRIPT_DIR/../..}

if [ ! -e ${GOBY_DIR}/goby.jar ]; then
    echo "goby.jar not found!"
    exit 2
fi

# The job name identifies the location for the scripts
JOB_TAG=$1
JOB_DIR=$(readlink -f .)/${JOB_TAG}
JOB_RESULTS_DIR=${JOB_RESULTS_DIR:-$(readlink -f .)/${JOB_TAG}-results}

if [ -e ${JOB_DIR} ]; then
    echo "The job output directory already exists"
    exit 3
fi

if [ ! -r ${REFERENCE} ]; then
    echo "WARNING: Reference ${REFERENCE} cannot be read"
fi

# Get the number of bytes in the reads file
if [ ! -r ${READS} ]; then
    echo "WARNING: Reads ${READS} file cannot be read"
    READS_SIZE=0
else
    READS_SIZE=`/usr/bin/stat --format=%s ${READS}`
fi

echo "Bundling job submission files"

# see if the job needs to split into a job array
if [ -z ${CHUNK_SIZE} ] || [ ${CHUNK_SIZE} -le 0 ] || [ ${CHUNK_SIZE} -ge ${READS_SIZE} ]; then
    echo "Alignment will not be split"
else
    NUMBER_OF_JOBS=$((${READS_SIZE} / ${CHUNK_SIZE} + 1))
    PBS_ARRAY_END_INDEX=$((${NUMBER_OF_JOBS} - 1))
    PBS_ARRAY_DIRECTIVE="#PBS -J0-${PBS_ARRAY_END_INDEX}"
    echo "Alignment will run as ${NUMBER_OF_JOBS} jobs"
fi

if [ ! -z ${PBS_STATUS_MAILTO} ]; then
    PBS_MAILTO_DIRECTIVE="#PBS -M ${PBS_STATUS_MAILTO}"
fi

# Use a basename that is based on name of the reads file
BASENAME=$(basename $READS .compact-reads)

# Create a somewhat unique tag but limit it to 15 characters (PBS name limit)
# ("stage" of job will be added - index, align, concat)
PBS_JOB_NAME=${JOB_TAG:0:10}

# Copy goby and submission scripts to the run directory
/bin/mkdir -p ${JOB_DIR}
/bin/cp ${GOBY_DIR}/goby.jar ${SCRIPT_DIR}/align.sh \
    ${SCRIPT_DIR}/index.sh ${SCRIPT_DIR}/align-concat.sh \
    ${SCRIPT_DIR}/index-align.sh ${SCRIPT_DIR}/concat.sh \
    ${SCRIPT_DIR}/index-align-concat.sh ${SCRIPT_DIR}/pbs-env.sh \
    ${JOB_DIR}

# Create job specific scripts from the template files
for FILE in goby-index.qsub goby-align.qsub goby-concat.qsub; do
    sed -e "s|%REFERENCE%|${REFERENCE}|" -e "s|%READS%|${READS}|" \
        -e "s|%PBS_QUEUE%|${PBS_QUEUE}|" -e "s|%PBS_MEMORY%|${PBS_MEMORY}|" \
        -e "s|%PBS_JVM_FLAGS%|${PBS_JVM_FLAGS}|" \
        -e "s|%PBS_ARRAY_DIRECTIVE%|${PBS_ARRAY_DIRECTIVE}|" \
        -e "s|%PBS_MAILTO_DIRECTIVE%|${PBS_MAILTO_DIRECTIVE}|" \
        -e "s|%REFERENCE_INDEX_NAME%|${REFERENCE_INDEX_NAME}|" \
        -e "s|%REFERENCE_INDEX_DIRECTORY%|${REFERENCE_INDEX_DIRECTORY}|" \
        -e "s|%ALIGNER%|${ALIGNER}|" -e "s|%COLORSPACE%|${COLORSPACE}|" \
        -e "s|%CHUNK_SIZE%|${CHUNK_SIZE}|" -e "s|%BASENAME%|${BASENAME}|" \
        -e "s|%PBS_JOB_NAME%|${PBS_JOB_NAME}|" \
        ${SCRIPT_DIR}/templates/${FILE} > ${JOB_DIR}/${FILE}
done

echo "Scripts were written to ${JOB_DIR}"