#!/bin/sh # # #___INFO__MARK_BEGIN__ ########################################################################## # # The Contents of this file are made available subject to the terms of # the Sun Industry Standards Source License Version 1.2 # # Sun Microsystems Inc., March, 2001 # # # Sun Industry Standards Source License Version 1.2 # ================================================= # The contents of this file are subject to the Sun Industry Standards # Source License Version 1.2 (the "License"); You may not use this file # except in compliance with the License. You may obtain a copy of the # License at http://gridengine.sunsource.net/Gridengine_SISSL_license.html # # Software provided under this License is provided on an "AS IS" basis, # WITHOUT WARRANTY OF ANY KIND, EITHER EXPRESSED OR IMPLIED, INCLUDING, # WITHOUT LIMITATION, WARRANTIES THAT THE SOFTWARE IS FREE OF DEFECTS, # MERCHANTABLE, FIT FOR A PARTICULAR PURPOSE, OR NON-INFRINGING. # See the License for the specific provisions governing your rights and # obligations concerning the Software. # # The Initial Developer of the Original Code is: Sun Microsystems, Inc. # # Copyright: 2001 by Sun Microsystems, Inc. # # All Rights Reserved. # ########################################################################## #___INFO__MARK_END__ ckpt_dir=$3 if [ ! -f $ckpt_dir/ckpt.log ]; then touch $ckpt_dir/ckpt.log chmod 666 $ckpt_dir/ckpt.log fi # create temp directory for holding checkpoint info tmpdir=$ckpt_dir/ckpt.$1 mkdir -p $tmpdir cd $tmpdir # create log file F=$tmpdir/checkpoint.log touch $F echo ------------------------------------------------------------- >> $F 2>&1 echo `basename $0` called at `date` >> $F 2>&1 echo called by: `id` >> $F 2>&1 echo with args: $* >> $F 2>&1 # Cray checkpoint workaround - delete the job script so chkpnt(1) # will save and restore it. For this to work, "shell_start_mode" # should be set to "script_from_stdin" in the global cluster # configuration rm -f $JOB_SCRIPT >> $F 2>&1 # get the O.S. job identifier #job_id=`ps -elw|grep $2 |cut -c34-39,172-176 |grep $2 |cut -c8-12` if [ -f osjobid ] then job_id=`cat osjobid` else job_dir=`dirname $JOB_SCRIPT`/../active_jobs/$1 job_id=`cat $job_dir/osjobid` echo $job_id > osjobid fi # checkpoint the job to a temporary file and then rename that file # just in case we go down while checkpointing #rm -f chkpnt_$1 echo /usr/bin/chkpnt -j $job_id -v -f chkpnt_$1 >> $F 2>&1 /usr/bin/chkpnt -j $job_id -v -f chkpnt_$1.new >> $F 2>&1 cc=$? mv chkpnt_$1.new chkpnt_$1 echo `date +"%D %T"` Job $1 "(osjobid=$job_id) checkpointed, status=$cc" >> $ckpt_dir/ckpt.log