File: setup-sge-transcript-job.sh

package info (click to toggle)
libgoby-java 3.3.1%2Bdfsg2-9
  • links: PTS, VCS
  • area: main
  • in suites: bookworm
  • size: 58,104 kB
  • sloc: java: 78,105; cpp: 5,011; xml: 3,170; python: 2,108; sh: 1,575; ansic: 277; makefile: 114
file content (101 lines) | stat: -rwxr-xr-x 3,142 bytes parent folder | download | duplicates (2)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
#!/bin/sh

#
# Script to bundle goby and required data into a
# suitable format for submission to a SGE queue
#

# Absolute path to this script.
SCRIPT=$(readlink -f $0)
# Absolute path this script is in.
SCRIPT_DIR=$(dirname $SCRIPT)
# Absolute path to the SGE transcript scripts
TRANSCRIPT_SCRIPT_DIR=${SCRIPT_DIR}/transcript/templates

if [ -z $1 ]; then
    echo "Job name is required"
    exit 1
fi

. sge-env.sh

# Local goby locations
GOBY_DIR=${GOBY_DIR:-$SCRIPT_DIR/../..}

if [ ! -e ${GOBY_DIR}/goby.jar ]; then
    echo "goby.jar not found!"
    exit 2
fi

# The job name identifies the location for the scripts
JOB_TAG=$1
JOB_DIR=$(readlink -f .)/${JOB_TAG}
JOB_RESULTS_DIR=${JOB_RESULTS_DIR:-$(readlink -f .)/${JOB_TAG}-results}

if [ -e ${JOB_DIR} ]; then
    echo "The job output directory already exists"
    exit 3
fi

if [ ! -r ${TRANSCRIPT_DIRECTORY} ]; then
    echo "ERROR: Transcript directory ${TRANSCRIPT_DIRECTORY} cannot be read"
    exit 4
fi

/bin/mkdir -p ${JOB_DIR}

if [ -z ${READS} ] || [ ! -r ${READS} ]; then
    echo "WARNING: Reads ${READS} file cannot be read"
fi

ls -1 ${TRANSCRIPT_DIRECTORY} > ${JOB_DIR}/transcript-list.txt
NUMBER_OF_TRANSCRIPTS=`wc -l < ${JOB_DIR}/transcript-list.txt`
echo "Found ${NUMBER_OF_TRANSCRIPTS} transcript files"

echo "Bundling job submission files"

SGE_ARRAY_DIRECTIVE="#$ -t 1-${NUMBER_OF_TRANSCRIPTS}"
echo "Alignment will run as ${NUMBER_OF_TRANSCRIPTS} jobs"

if [ ! -z ${SGE_STATUS_MAILTO} ]; then
    SGE_MAILTO_DIRECTIVE="#$ -M ${SGE_STATUS_MAILTO}"
fi

# Use a basename that is based on name of the reads file
BASENAME=$(basename $READS .compact-reads)

# Create a somewhat unique tag
# ("stage" of job will be added - index, align, concat)
SGE_JOB_NAME=${JOB_TAG}

# Copy goby and submission scripts to the run directory
/bin/cp ${GOBY_DIR}/goby.jar ${GOBY_DIR}/config/log4j.properties \
        ${SCRIPT_DIR}/sge-env.sh ${JOB_DIR}

# Create job specific scripts from the template files
for FILE in ${TRANSCRIPT_SCRIPT_DIR}/*; do
    FILENAME=$(basename ${FILE})
    sed -e "s|%TRANSCRIPT_DIRECTORY%|${TRANSCRIPT_DIRECTORY}|" \
        -e "s|%NUMBER_OF_TRANSCRIPTS%|${NUMBER_OF_TRANSCRIPTS}|" \
        -e "s|%TRANSCRIPT_INDEX_DIRECTORY%|${TRANSCRIPT_INDEX_DIRECTORY}|" \
        -e "s|%GENE_TRANSCRIPT_MAP_FILE%|${GENE_TRANSCRIPT_MAP_FILE}|" \
        -e "s|%READS%|${READS}|" \
        -e "s|%SGE_QUEUE%|${SGE_QUEUE}|" \
        -e "s|%SGE_MEMORY%|${SGE_MEMORY}|" \
        -e "s|%SGE_JVM_FLAGS%|${SGE_JVM_FLAGS}|" \
        -e "s|%SGE_ARRAY_DIRECTIVE%|${SGE_ARRAY_DIRECTIVE}|" \
        -e "s|%SGE_MAILTO_DIRECTIVE%|${SGE_MAILTO_DIRECTIVE}|" \
        -e "s|%ALIGNER%|${ALIGNER}|" \
        -e "s|%COLORSPACE%|${COLORSPACE}|" \
        -e "s|%CHUNK_SIZE%|${CHUNK_SIZE}|" \
        -e "s|%BASENAME%|${BASENAME}|" \
        -e "s|%BWA_ALIGNER_PATH%|${BWA_ALIGNER_PATH}|" \
        -e "s|%LAST_ALIGNER_PATH%|${LAST_ALIGNER_PATH}|" \
        -e "s|%LASTAG_ALIGNER_PATH%|${LASTAG_ALIGNER_PATH}|" \
        -e "s|%SGE_JOB_NAME%|${SGE_JOB_NAME}|" \
        ${FILE} > ${JOB_DIR}/${FILENAME}
done

chmod +x ${JOB_DIR}/*.sh

echo "Scripts were written to ${JOB_DIR}"