File: cpr_migration_command

package info (click to toggle)
gridengine 6.2-4
  • links: PTS, VCS
  • area: main
  • in suites: lenny
  • size: 51,532 kB
  • ctags: 51,172
  • sloc: ansic: 418,155; java: 37,080; sh: 22,593; jsp: 7,699; makefile: 5,292; csh: 4,244; xml: 2,901; cpp: 2,086; perl: 1,895; tcl: 1,188; lisp: 669; ruby: 642; yacc: 393; lex: 266
file content (102 lines) | stat: -rwxr-xr-x 2,826 bytes parent folder | download | duplicates (3)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
#!/bin/ksh
#
#
#___INFO__MARK_BEGIN__
##########################################################################
#
#  The Contents of this file are made available subject to the terms of
#  the Sun Industry Standards Source License Version 1.2
#
#  Sun Microsystems Inc., March, 2001
#
#
#  Sun Industry Standards Source License Version 1.2
#  =================================================
#  The contents of this file are subject to the Sun Industry Standards
#  Source License Version 1.2 (the "License"); You may not use this file
#  except in compliance with the License. You may obtain a copy of the
#  License at http://gridengine.sunsource.net/Gridengine_SISSL_license.html
#
#  Software provided under this License is provided on an "AS IS" basis,
#  WITHOUT WARRANTY OF ANY KIND, EITHER EXPRESSED OR IMPLIED, INCLUDING,
#  WITHOUT LIMITATION, WARRANTIES THAT THE SOFTWARE IS FREE OF DEFECTS,
#  MERCHANTABLE, FIT FOR A PARTICULAR PURPOSE, OR NON-INFRINGING.
#  See the License for the specific provisions governing your rights and
#  obligations concerning the Software.
#
#  The Initial Developer of the Original Code is: Sun Microsystems, Inc.
#
#  Copyright: 2001 by Sun Microsystems, Inc.
#
#  All Rights Reserved.
#
##########################################################################
#___INFO__MARK_END__

# Do not treat the expansion of unset variables as an error; the script
# expands positional parameters and environment variables without checking
# that they are set.
set +u

# Third positional argument: directory that holds the shared checkpoint log
# (ckpt.log) and the per-job checkpoint subdirectories.
ckpt_dir=$3

# Create the shared log on first use and open it up with mode 666.
# NOTE(review): presumably world-writable so that jobs of different users can
# append to the same log - confirm.
# The path is quoted so a directory name containing blanks or glob characters
# is handled as a single word.
if [ ! -f "$ckpt_dir/ckpt.log" ]; then
   touch "$ckpt_dir/ckpt.log"
   chmod 666 "$ckpt_dir/ckpt.log"
fi

# Grid Engine installation root and cell name, taken from the environment.
sge_root=${SGE_ROOT}
sge_cell=${SGE_CELL}

# workaround to force job to restart on same queue (svd)
# Source the cell's settings file (the cell name falls back to "default" when
# SGE_CELL is unset or empty) and then re-issue the job's queue request with
# the value of $QUEUE.
# NOTE(review): QUEUE and JOB_ID are expected to come from the job
# environment - confirm they are always set when this command runs.
# All expansions are quoted so that a path or value containing blanks is not
# split into several words.
. "$sge_root/${sge_cell:-default}/common/settings.sh"
qalter -q "$QUEUE" "$JOB_ID"

# create temp directory for holding checkpoint info
# The directory is <ckpt_dir>/ckpt.<$1>; $1 is the same value that is logged
# as "Job $1" at the end of the script.

tmpdir=$ckpt_dir/ckpt.$1
mkdir -p "$tmpdir"

# The rest of the script works with paths relative to this directory (the
# "currcpr" state file and the cpr_<$1>.<n> checkpoints). If the directory
# cannot be entered, stop here instead of writing those files into whatever
# the current directory happens to be.
cd "$tmpdir" || {
    print -u2 "$(basename "$0"): cannot change directory to $tmpdir"
    exit 1
}

# create log file
# The per-job log lives in the invoking user's home directory and is named
# <REQNAME>.co<$1>. The tilde is left unquoted on purpose so that it is
# expanded; assignments are not subject to word splitting.

#F=$tmpdir/checkpoint.log
F=~/$REQNAME.co$1
touch "$F"

# Write a header describing this invocation.
# "--" ends option parsing, so the separator line made only of dashes is
# printed as text instead of being interpreted as options to print.
print -- "-------------------------------------------------------------"  >> "$F" 2>&1
print "$(basename "$0") called at $(date)"      >> "$F" 2>&1
print "called by: $(id)"                        >> "$F" 2>&1
print "with args: $*"                           >> "$F" 2>&1

# checkpoint the job to one of two different files (i.e. ping-pong)
# just in case we go down while checkpointing
#
# The file "currcpr" in the current directory records which slot (1 or 2)
# received the last successful checkpoint. This run writes to the other slot:
#   currcpr - slot to write now
#   prevcpr - slot holding the previous checkpoint
# When the state file is missing (first checkpoint) or holds anything other
# than "2", slot 2 is written and slot 1 is considered the previous one.

# Only read the state file when it exists, so the very first checkpoint does
# not produce a "No such file" error from cat.
last_slot=
if [ -r currcpr ]; then
    last_slot=$(cat currcpr)
fi

if [ "$last_slot" = "2" ]; then
    currcpr=1
    prevcpr=2
else
    currcpr=2
    prevcpr=1
fi

# Select what cpr should act on (value later passed to "cpr -p"):
#   - OSJOBID non-empty: the array session handle, written as "<OSJOBID>:ASH"
#   - otherwise:         the process group ID from $2, written as "<$2>:GID"

case "$OSJOBID" in
    "")
        popt="$2:GID"
        ;;
    *)
        popt="$OSJOBID:ASH"
        ;;
esac

# Record the exact command in the per-job log, then run it. Output and errors
# of cpr go to the same log.
# NOTE(review): going by the log messages in this script, "-c" names the
# checkpoint to create, "-k" kills the job after checkpointing and "-D"
# deletes a checkpoint - confirm the flags against the cpr manual page.
# All expansions are quoted so that names containing blanks or glob
# characters are passed as single words.
print "Migration command: cpr -c cpr_$1.$currcpr -p $popt -f -k" >> "$F" 2>&1
cpr -c "cpr_$1.$currcpr" -p "$popt" -f -k >> "$F" 2>&1
cc=$?

# Only after a successful checkpoint: remember the slot just written and
# remove the checkpoint in the other slot, if one exists.
if [ "$cc" -eq 0 ]; then
   print "$currcpr" > currcpr
   if [ -d "cpr_$1.$prevcpr" ]; then
      print "Deleting old checkpoint file" >> "$F" 2>&1
      cpr -D "cpr_$1.$prevcpr" >> "$F" 2>&1
   fi
fi

# Append a one-line summary, including the cpr exit status, to the shared log.
print "$(date +"%D %T") Job $1 (pid=$2) checkpointed and killed, status=$cc" >> "$ckpt_dir/ckpt.log"