[16] | 1 | #!/bin/ksh |
---|
| 2 | # IBM_PROLOG_BEGIN_TAG |
---|
| 3 | # This is an automatically generated prolog. |
---|
| 4 | # |
---|
| 5 | # |
---|
| 6 | # |
---|
| 7 | # Licensed Materials - Property of IBM |
---|
| 8 | # |
---|
| 9 | # (C) COPYRIGHT International Business Machines Corp. 2003,2005 |
---|
| 10 | # All Rights Reserved |
---|
| 11 | # |
---|
| 12 | # US Government Users Restricted Rights - Use, duplication or |
---|
| 13 | # disclosure restricted by GSA ADP Schedule Contract with IBM Corp. |
---|
| 14 | # |
---|
| 15 | # IBM_PROLOG_END_TAG |
---|
| 16 | # @(#)55 1.18 src/avs/fs/mmfs/ts/admin/mmexectsmcmd.sh, mmfs, avs_rgpfs24, rgpfs240610b 2/11/05 11:32:21 |
---|
| 17 | ############################################################################## |
---|
| 18 | # |
---|
| 19 | # This script issues TSM commands from a GPFS node that is a TSM client. |
---|
| 20 | # |
---|
| 21 | # It accepts the following arguments: |
---|
| 22 | # 1) The mount point of the pertinent file system |
---|
| 23 | # 2) The TSM operation to be performed; supported operations are: |
---|
| 24 | # - selective |
---|
| 25 | # - incremental |
---|
| 26 | # - expire |
---|
| 27 | # - restore (no longer used since tsrestorefile was dropped) |
---|
| 28 | # 3) A qualifier for the fourth parameter: |
---|
| 29 | # - filelist This value indicates that the fourth parameter |
---|
| 30 | # is the value for the Tivoli filelist=<> option. |
---|
| 31 | # - nofilelist This value indicates that the fourth parameter |
---|
| 32 | # is not to be used as a Tivoli filelist parameter. |
---|
| 33 | # In this case, the Tivoli filelist option is not used. |
---|
| 34 | # 4) If the 3rd parameter was |
---|
| 35 | # - filelist then the 4th parameter is the full path name of the |
---|
| 36 | # file containing the filenames to be operated on. |
---|
| 37 | # - nofilelist then the 4th parameter is another parameter to be |
---|
| 38 | # passed to the Tivoli command. |
---|
| 39 | # 5) The nodename of the master tsbackup process (used for locking) |
---|
| 40 | # 6) The pid number of the master tsbackup process (used for locking) |
---|
| 41 | # 7) The backup client process index (used for file naming) |
---|
| 42 | # 8) The name of the TSM server (checked against dsm.opt file) |
---|
| 43 | # 9) The I/O rate level (used to allow other non-backup processes to run) |
---|
| 44 | # |
---|
| 45 | # The backup client process index is used for constructing the name of |
---|
| 46 | # the file for pending (not successfully completed) transactions. |
---|
| 47 | # |
---|
| 48 | # The program returns: |
---|
| 49 | # 0 on success (i.e., all files were successfully backed up) |
---|
| 50 | # 1 on partial success (i.e., some but not all files were backed up) |
---|
| 51 | # 2 on failure (i.e., no success at all) |
---|
| 52 | # |
---|
| 53 | ############################################################################## |
---|
| 54 | |
---|
| 55 | # Include global declarations and service routines |
---|
| 56 | . /usr/lpp/mmfs/bin/mmglobfuncs |
---|
| 57 | . /usr/lpp/mmfs/bin/mmsdrfsdef |
---|
| 58 | . /usr/lpp/mmfs/bin/mmfsfuncs |
---|
| 59 | |
---|
sourceFile="mmexectsmcmd.sh"
[[ -n $DEBUG || -n $DEBUGmmexectsmcmd ]] && set -x
$mmTRACE_ENTER "$*"


#-------------------------------------------------
# Local work files.  Names should be of the form:
#   fn=${tmpDir}fn.${mmcmd}.$$
#-------------------------------------------------

#tmpCtrlFile=${tmpDir}tmpCtrlFile.mmbackup.$$
#LOCAL_FILES=" $tmpCtrlFile "


#------------------
# Global variables
#------------------

# Exit codes of this script (see the "The program returns" section of
# the file header).  They are defined first so that even the earliest
# failure below can exit with the documented failure code.
rc_success=0
rc_psuccess=1
rc_fail=2

# Time stamp used later as part of the TSM error log directory name.
dateTime=$($date +"%y%m%d_%H:%M:%S")

#tsmDate=$(date '+%m/%d/%y')
#tsmTime=$(date '+%H:%M:%S')

# TSM backup-archive command line client.
dsmc=/usr/bin/dsmc

# Locate the TSM client options file: an explicit DSM_CONFIG setting
# wins, otherwise fall back to the per-platform default location.
if [[ -n $DSM_CONFIG ]]
then
  dsmoptfile=$DSM_CONFIG
elif [[ $osName = AIX ]]
then
  dsmoptfile=/usr/tivoli/tsm/client/ba/bin/dsm.opt
elif [[ $osName = Linux ]]
then
  dsmoptfile=/opt/tivoli/tsm/client/ba/bin/dsm.opt
else
  print -u2 " Unknown operating system $osName "
  # An unsupported platform is a complete failure.  Exit code 1 is
  # reserved for "partial success", so it must not be used here.
  exit $rc_fail
fi

# Message fragments searched for in the TSM error log (dsmerror.log).
searchErrorString="No files matching search criteria"
objectErrorString="No objects on server match"
errorProcessingString="Error processing"

# Prefixes put in front of the result messages printed by this script.
opf=Operation_Failure
opps=Operation_Partial_Success
ops=Operation_Success

# Base name of the pending transactions file; the process index is
# appended to it when the file is created.
tpl=".mmbuTSMPendingTransactions"

# Root of the directory tree used as the backup lock.
lockdir="/var/mmfs/etc/mmbackuplock"

# Program name shown in the usage message.
pgm="mmexectsmcmd"
---|
| 116 | |
---|
| 117 | |
---|
| 118 | #----------------- |
---|
| 119 | # local routines |
---|
| 120 | #----------------- |
---|
| 121 | |
---|
| 122 | |
---|
#--------------------------------------------------------------
# localTrap
#
# Signal handler that is in effect while no backup lock is held.
# There is no lock to release, so it only runs the cleanup
# routine and exits with the failure return code.
#--------------------------------------------------------------
function localTrap
{
  doCleanupAndExit $rc_fail
}
---|
| 131 | |
---|
| 132 | |
---|
#--------------------------------------------------------------
# localTrap2
#
# Signal handler that is in effect once a backup lock is held.
# It releases the lock before cleaning up and exiting with the
# failure return code.
#--------------------------------------------------------------
function localTrap2
{
  freeLockAndExit $rc_fail
}
---|
| 141 | |
---|
| 142 | |
---|
#--------------------------------------------------------------
# getBackupLock
#
# Obtain a lock before proceeding.
#
# Here is the mechanism by which locks are managed and used:
#
# 1) Begin to obtain a lock by issuing:  mkdir lockdir
# 2) If (1) succeeds, no one else has a lock.  Finish obtaining your
#    lock by issuing mkdirs for lockdir/masternode_masterpid and
#    lockdir/masternode_masterpid/mylocalpid.  You now have a valid lock.
# 3) If (1) fails, perhaps one of your local sibling processes already
#    has created lockdir and lockdir/masternode_masterpid (as well as
#    lockdir/masternode_masterpid/hislocalpid for his own use).  Try to
#    obtain a lock by doing mkdir lockdir/masternode_masterpid/mylocalpid.
#    This fails if lockdir/masternode_masterpid does not exist and
#    succeeds if it does.  Because a sibling may have created lockdir
#    but not yet lockdir/masternode_masterpid, the mkdir is tried twice.
# 4) If a valid lock is still not obtained, find out who holds the lock.
#    If the holder is alive (or cannot be reached), exit with a message
#    telling the user who has the lock and how to clear it.  If the
#    holder has died, remove the stale lock and create a new one.
# 5) If a valid lock is obtained, return to the caller.
# 6) When the requested work is done, the lock is freed by doing
#      rmdir lockdir/masternode_masterpid/mylocalpid
#      rmdir lockdir/masternode_masterpid
#      rmdir lockdir
#    The latter two rmdirs fail if any sibling processes are still
#    holding locks, since these directories will then not be empty.
#    Care must be taken to always free locks before exiting.
#
# Input (global variables):
#   lockdir                  root directory of the lock tree
#   masterNode, masterPid    identify the master backup process
#   ourNodeName              name of the local node
#
# Returns 0 when the lock is held.  Does not return on failure:
# the script exits with $rc_fail via doCleanupAndExit or
# freeLockAndExit.
#--------------------------------------------------------------
function getBackupLock
{
  # Enable debug output.
  typeset sourceFile="mmexectsmcmd.sh"
  [[ -n $DEBUG || -n $DEBUGgetBackupLock ]] && set -x
  $mmTRACE_ENTER "$*"

  typeset masterLock="$lockdir/${masterNode}_${masterPid}"
  typeset myLock="$masterLock/$$"
  typeset lsOutput lockEntry lockhldrNode lockhldrPid pidCheckAll pidCheck

  # Try to create the base lock directory.
  $mkdir "$lockdir" > /dev/null 2>&1
  if [[ $? = 0 ]]
  then
    # The lock was not in use by anyone.  Finish creating our lock.
    # Only the last mkdir needs to be checked: it cannot succeed
    # unless the intermediate directory exists.
    $mkdir "$masterLock" > /dev/null 2>&1
    $mkdir "$myLock" > /dev/null 2>&1
    if [[ $? != 0 ]]
    then
      print "$opf: $sn: Unexpected error creating a lock. Try again. If the problem persists, contact IBM service."
      freeLockAndExit $rc_fail
    fi
    return 0
  fi

  # At least one other process has a lock.  Try to obtain a lock for
  # our own use by issuing a mkdir.  If the other processes with locks
  # were created by the same master process as our process was,
  # the mkdir will succeed.  The mkdir is retried once in case the
  # first attempt failed due to timing.
  $mkdir "$myLock" > /dev/null 2>&1 || $mkdir "$myLock" > /dev/null 2>&1
  [[ $? = 0 ]] && return 0

  # The lock belongs to some other master process.  The entry inside
  # lockdir is named <node>_<pid>; use the first entry listed.
  lsOutput=$($ls "$lockdir")
  set -f ; set -- $lsOutput ; set +f
  lockEntry=$1

  # Split at the LAST underscore so that node names which themselves
  # contain underscores are handled correctly.
  if [[ $lockEntry = *_* ]]
  then
    lockhldrNode=${lockEntry%_*}
    lockhldrPid=${lockEntry##*_}
  else
    lockhldrNode=$lockEntry
    lockhldrPid=""
  fi

  # We have the pid and hostname of the process holding the lock.
  # Determine whether the process is still running.
  if [[ $lockhldrNode = "$ourNodeName" ]]
  then
    pidCheckAll=$($mmremote pid $lockhldrPid)
  else
    pidCheckAll=$($mmcommon on1 $lockhldrNode pid $lockhldrPid)
  fi

  # Keep only a line that is exactly "died" or "alive".
  pidCheck=$(print "$pidCheckAll" | $egrep "^(died|alive)$")
  if [[ $pidCheck != died ]]
  then
    $mmTRACE "$lockhldrNode lock held by $lockhldrNode $lockhldrPid"
    # The process that has the lock is still alive, or we could
    # not determine its status.  Either way, give up.
    if [[ $pidCheck = alive ]]
    then
      print "$opf: $sn:\nFailed to obtain GPFS backup lock. Process $lockhldrPid on node $lockhldrNode has it.\nIf process $lockhldrPid is no longer running on $lockhldrNode, clear the lock\nby issuing: \"rm -rf $lockdir\" on all GPFS nodes. Otherwise,\ntry the GPFS backup again when process $lockhldrPid on $lockhldrNode is done.\n"
    else
      print "$opf: $sn:\nFailed to obtain GPFS backup lock. Unable to reach the holder\nof the lock, which is process $lockhldrPid on node $lockhldrNode.\nIf process $lockhldrPid is no longer running on $lockhldrNode, clear the lock\nby issuing: \"rm -rf $lockdir\" on all GPFS nodes. Otherwise,\ntry the GPFS backup again when process $lockhldrPid on $lockhldrNode is done.\n"
    fi
    doCleanupAndExit $rc_fail
  fi

  # The process that had the lock somehow went away without unlocking.
  # Remove the old lock and establish a new one for the caller.
  $rm -rf "$lockdir" > /dev/null 2>&1
  $mkdir "$lockdir" > /dev/null 2>&1
  if [[ $? != 0 ]]
  then
    # Failed again!  Give up.
    print "$opf: $sn:\nFailed to obtain GPFS backup lock even after clearing the lock.\n"
    doCleanupAndExit $rc_fail
  fi

  # Success!  Complete the work of establishing the lock, and verify
  # it exactly as is done when the lock was free to begin with;
  # otherwise we would continue without really holding a lock.
  $mkdir "$masterLock" > /dev/null 2>&1
  $mkdir "$myLock" > /dev/null 2>&1
  if [[ $? != 0 ]]
  then
    print "$opf: $sn: Unexpected error creating a lock. Try again. If the problem persists, contact IBM service."
    freeLockAndExit $rc_fail
  fi
  return 0

}  #------ end of function getBackupLock -----------------
---|
| 262 | |
---|
| 263 | |
---|
#--------------------------------------------------------------
# freeBackupLock
#
# Function:  Release the backup lock of this process by removing
#            the lock directories from the innermost level out:
#            our own pid directory, the master's directory, and
#            finally the lock root.  rmdir refuses to remove a
#            directory that is not empty, so levels still used by
#            other lock holders stay in place.  Failures are
#            ignored and all output is discarded.
#
# Input:     global variables lockdir, masterNode, masterPid
#--------------------------------------------------------------
function freeBackupLock
{
  # Enable debug output.
  typeset sourceFile="mmexectsmcmd.sh"
  [[ -n $DEBUG || -n $DEBUGfreeBackupLock ]] && set -x
  $mmTRACE_ENTER "$*"

  typeset masterLock=$lockdir/$masterNode"_"$masterPid
  typeset lockLevel

  for lockLevel in $masterLock/$$ $masterLock $lockdir
  do
    $rmdir $lockLevel > /dev/null 2>&1
  done

}  #------ end of function freeBackupLock ----------------
---|
| 279 | |
---|
| 280 | |
---|
#--------------------------------------------------------------
#
# freeLockAndExit
#
# Function:  Exit path for code that holds the backup lock:
#            release the lock first, then leave through
#            doCleanupAndExit.
#
# Input:     $1 - return code with which to exit
#
# Note:      The return code is stored in the global variable rc.
#
#--------------------------------------------------------------
function freeLockAndExit
{
  # Enable debug output.
  typeset sourceFile="mmexectsmcmd.sh"
  [[ -n $DEBUG || -n $DEBUGfreeLockAndExit ]] && set -x
  $mmTRACE_ENTER "$*"

  # Remember the requested exit code before doing any other work.
  rc=$1

  # Give the lock back ...
  freeBackupLock

  # ... and terminate with the saved code.
  doCleanupAndExit $rc

}  #------ end of function freeLockAndExit ---------------
---|
| 305 | |
---|
| 306 | |
---|
#--------------------------------------------------------------
#
# doCleanupAndExit
#
# Function:  Perform cleanup unique to mmexectsmcmd, and then
#            exit via the standard cleanupAndExit routine.
#
#            The cleanup consists of removing the TSM error log
#            directory when it holds no error log worth keeping
#            (the log file is missing or empty).
#
# Input:     $1 - return code with which to exit
#            global variables logdir and logfile; both may still
#            be unset when this routine is called early.
#
# Note:      The return code is stored in the global variable rc.
#
#--------------------------------------------------------------
function doCleanupAndExit
{
  # Enable debug output.
  typeset sourceFile="mmexectsmcmd.sh"
  [[ -n $DEBUG || -n $DEBUGdoCleanupAndExit ]] && set -x
  $mmTRACE_ENTER "$*"

  rc=$1

  # If the TSM log file does not exist and have a size greater than 0,
  # remove the log directory.  Nothing is removed while the directory
  # name is still unset, and the name is quoted so that a mount point
  # containing white space cannot make rm act on other paths.
  if [[ -n $logdir && ! -s $logfile ]]
  then
    $rm -rf "$logdir" > /dev/null 2>&1
  fi

  cleanupAndExit $rc

}  #------ end of function doCleanupAndExit ---------------
---|
| 333 | |
---|
| 334 | |
---|
| 335 | |
---|
| 336 | #------------------------ |
---|
| 337 | # Start main processing. |
---|
| 338 | #------------------------ |
---|
| 339 | |
---|
# Set local trap routine.
# NOTE(review): KILL is listed, but SIGKILL cannot be caught by a shell
# trap, so only HUP, INT and QUIT are effectively handled here.
trap localTrap HUP INT QUIT KILL

typeset -l keyword_lc   # variable for storing keyword in lower case

# Establish the local node name first.  It tags every message printed
# from here on, including the usage error issued just below.
[[ -z $MMMODE || -z $primaryServer ]] &&  \
  determineMode
getLocalNodeData
sn=$ourNodeName

# Verify that the correct number of parameters were passed:
# nine for a TSM operation, two for the "givestatus" mode.
# NOTE(review): argc and arg1..arg9 are not set in this file; presumably
# they are provided by the files sourced at the top - confirm.
if [[ $argc -ne 9 && $argc -ne 2 ]]
then
  print "$opf: $sn: An incorrect number of parameters was passed."
  print "Usage:\n $pgm <FSname> <tsmOperation> <tsmOperationOption> <filelistname> <invokingNode> <invokingPid> <clientIndex> <tsmServer> <ioRateValue>"
  doCleanupAndExit $rc_fail
fi

#
# Assign the input parameters as follows:
#
#   arg1 - "givestatus"
#   arg2 - number of seconds to sleep between messages
#
#      OR
#
#   arg1 - mountpoint of filesystem to be operated on
#   arg2 - TSM command (selective, incremental, expire, or restore)
#   arg3 - TSM command option (filelist or nofilelist)
#   arg4 - name of the filelist file (if arg3 was filelist)
#            or
#          some other TSM command parameter (if arg3 was nofilelist)
#   arg5 - name of the invoking node (used for obtaining a backup lock)
#   arg6 - pid of the invoking process (used for obtaining a backup lock)
#   arg7 - process index (used for creating directory in which, if necessary,
#          Tivoli will store a dsmerror.log file)
#   arg8 - name of the TSM server (used for checking against the dsm.opt file)
#   arg9 - I/O rate value
#

# "givestatus" mode: issue informational message 527 every arg2 seconds.
# The loop has no exit condition of its own; it ends only when the
# process is terminated from outside.
if [[ $arg1 = "givestatus" ]]
then
  integer nSeconds=${arg2}
  while true
  do
    sleep $nSeconds
    printInfoMsg 527 mmbackup
  done  # end while true
fi
---|
| 389 | |
---|
# Pick up the positional arguments of a TSM operation request.
mountPoint=$arg1
tsmCommand=$arg2
tsmCommandOption=$arg3

# The third argument decides how the fourth one is interpreted.
case $tsmCommandOption in

  filelist )
    # arg4 is the full path name of the file listing the objects
    # to be operated on.
    filelistName=$arg4
    if [[ ! -f $filelistName || ! -r $filelistName ]]
    then
      # The filelist file does not exist or is not readable.
      # Issue an error message and fail the command.
      print "$opf: $sn: Cannot open $filelistName. Make sure filesystem is mounted on node."
      doCleanupAndExit $rc_fail
    fi
    ;;

  nofilelist )
    # arg4 is some other parameter to be handed to the TSM command.
    tsmCommandParm=$arg4
    ;;

  * )
    print "$opf: $sn: Invalid parameter: $tsmCommandOption"
    doCleanupAndExit $rc_fail
    ;;

esac

masterNode=$arg5
masterPid=$arg6
processIndex=$arg7
tsmServer=$arg8
ioRateValue=$arg9


# Set and export the DSM_LOG environment variable to tell TSM
# where to put any error log it generates.
logdir=$mmbackupDir"$mountPoint"_"$dateTime"_"$processIndex"
logfile=$logdir/dsmerror.log
export DSM_LOG=$logdir

# Create the directory for the TSM error log.  The name is quoted
# because it is built from the mount point, which may contain
# white space.
$mkdir -p "$logdir" > /dev/null 2>&1

# Add a slash to the end of the mount point variable for passing to TSM later.
mountPoint=$mountPoint/
---|
| 436 | |
---|
# Call routine to obtain a lock before proceeding.
# If a lock cannot be obtained, getBackupLock will exit with a failure rc.
getBackupLock

# At this point we have obtained a lock.
# Now that we have obtained a backup lock, change the trap routine
# to one that frees the lock before exiting.
trap localTrap2 HUP INT QUIT KILL

# Check that the TSM server passed on the command matches the one
# specified in the TSM client options file (dsm.opt).
# If it doesn't, issue an error message and exit with a failing rc.
# Lines containing an asterisk are dropped; of what remains, the
# first two words are taken as the keyword and the server name.
grepOutput=$($grep -i servername "$dsmoptfile" | $grep -v '*')
set -f ; set -- $grepOutput ; set +f
dsmoptTSMserverKeyword=$1
dsmoptTSMserver=$2

keyword_lc=$dsmoptTSMserverKeyword   # Convert keyword to all lower case.
if [[ $keyword_lc != servername ]]
then
  print "$opf: $sn: unable to find TSM server name in dsm.opt file"
  freeLockAndExit $rc_fail
fi

# The right-hand side is quoted so that the two names are compared as
# plain strings; unquoted, it would be treated as a pattern.
if [[ $tsmServer != "$dsmoptTSMserver" ]]
then
  print "$opf: $sn: specified TSM server does not match TSM server in dsm.opt file"
  freeLockAndExit $rc_fail
fi

# Depending on the I/O rate value, take a breather
# to allow other non-backup processes to run.
# The scheme implemented here, wait a fixed number of
# seconds controlled by the passed value, is a very
# rough beginning.  A better scheme would be to calculate
# the time used doing backup work, and then sleep a
# fraction of that time based on the I/O rate value.
# (An I/O rate value of 100 would mean don't sleep at all,
# a value of 75 would mean sleep for 1/3 of the time
# spent doing backup, a value of 50 would mean sleep an
# amount of time equal to the time spent on backup,
# and so on.)
integer numberOfSeconds=100-${ioRateValue}
# An I/O rate value above 100 yields a negative number, which is not
# a valid argument for sleep; treat it like 100 (no pause).
if (( numberOfSeconds > 0 ))
then
  sleep $numberOfSeconds
fi
---|
| 481 | |
---|
| 482 | |
---|
# We now have obtained a backup lock, verified that the TSM server is
# correct, and idled away some time if warranted by the I/O rate value.
# Proceed to process Tivoli Storage Manager commands.
#
# General remarks that apply to every dsmc invocation below:
#   The return code only indicates whether the TSM executable ran
#   successfully.  The TSM client returns a code greater than 0 (zero)
#   only if TSM was unable to attempt the operations.
#   Only those return codes output to the error report (dsmerror.log)
#   indicate the success or failure of specific TSM commands.
#
# Every path through the code below ends in freeLockAndExit.

#--------------------------------------------------------------
# tsmClearErrorLog
#
# Function:  Remove a non-empty TSM error log so that whatever is
#            found in the log afterwards stems from the dsmc
#            command issued next.  If the log cannot be removed,
#            the lock is freed and the script exits with $rc_fail.
#
# Input:     global variable logfile
#--------------------------------------------------------------
function tsmClearErrorLog
{
  if [[ -s $logfile ]]
  then
    $rm -rf "$logfile" > /dev/null 2>&1
    if [[ $? -gt 0 ]]
    then
      print "$opf: $sn: cannot rm $logfile"
      freeLockAndExit $rc_fail
    fi
  fi
}

#--------------------------------------------------------------
# tsmListFailedObjects
#
# Function:  Write to stdout the text between the first pair of
#            single quotes on every error log line that contains
#            the given message text.  Typical log lines are:
#              04/05/02 15:41:52 ANS4007E Error processing
#                                '/backup_tsm/.backup_snapshot/.NodeCtrl'
#              11/16/01 15:24:56 ANS1345E No objects on server match
#                                '/log/michail/file_4'
#
# Input:     $1 - message text to look for
#            global variable logfile
#--------------------------------------------------------------
function tsmListFailedObjects
{
  $grep "$1" "$logfile" | $cut -f2 -d\'
}

# Name of the file that receives the pending (not successfully
# completed) transactions of this client process.
pendingList="$mountPoint$tpl"_"$processIndex"

case $tsmCommand in

  #-------------------------------------------------
  # TSM selective or incremental command processing
  #-------------------------------------------------
  selective | incremental )

    # Issue the TSM command to have the list of files backed up.
    $dsmc $tsmCommand -filelist="$filelistName" > /dev/null 2>&1
    rc=$?
    if [[ $rc -ne 0 ]]
    then
      # If there is an error log file, tell the user to examine it
      # to determine the cause of the failure.
      if [[ -s $logfile ]]
      then
        print "$opf: $sn: TSM dsmc $tsmCommand command failed to run (see file $logfile)."
      else
        print "$opf: $sn: TSM dsmc $tsmCommand command failed to run."
      fi
      freeLockAndExit $rc_fail
    fi

    # Clear the error log.  It will be recreated
    # by the query command to be issued next.
    tsmClearErrorLog

    # Issue the query command to determine which files were not
    # backed up successfully.
    $dsmc query backup -filelist="$filelistName" > /dev/null 2>&1
    rc=$?
    if [[ $rc -ne 0 ]]
    then
      print "$opf: $sn: TSM dsmc query command failed to run."
      freeLockAndExit $rc_fail
    fi

    # No error log means that every file was backed up.
    if [[ ! -s $logfile ]]
    then
      print "$ops: $sn: TSM dsmc query command did not produce any error log."
      freeLockAndExit $rc_success
    fi

    # Process the error log and construct the pending transactions file.
    #
    # The following is a line from the pertinent error log file:
    #   03/13/02 10:37:48 ANS1092E No files matching search criteria
    #                     were found
    #
    # Check for matching search criteria failure; it is treated as
    # a complete failure.
    $grep "${searchErrorString}" "$logfile" > "$pendingList"
    if [[ -s $pendingList ]]
    then
      print "$opf: $sn: TSM dsmc query command indicated search criteria failure (see file $logfile)."
      $rm -rf "$pendingList" > /dev/null 2>&1
      freeLockAndExit $rc_fail
    fi

    # Check for objects which do not match, i.e.,
    # individual files which were not backed up.
    tsmListFailedObjects "$objectErrorString" >> "$pendingList"
    print "$opps: $sn: TSM dsmc $tsmCommand command partially succeeded (see file $logfile)."
    freeLockAndExit $rc_psuccess
    ;;

  #-------------------------------
  # TSM expire command processing
  #-------------------------------
  expire )

    # Clear the error log.  We are only interested in the error log
    # created from issuing the expire command.
    tsmClearErrorLog

    # Issue the TSM command to have files in the file system expired.
    if [[ $tsmCommandOption = filelist ]]
    then
      $dsmc $tsmCommand -noprompt -filelist="$filelistName" > /dev/null 2>&1
    else
      # tsmCommandParm is deliberately left unquoted: it is handed to
      # dsmc as is and may consist of more than one word.
      $dsmc $tsmCommand -noprompt $tsmCommandParm > /dev/null 2>&1
    fi
    rc=$?
    if [[ $rc -ne 0 ]]
    then
      # If there is an error log file, tell the user to examine it
      # to determine the cause of the failure.
      if [[ -s $logfile ]]
      then
        print "$opf: $sn: TSM dsmc expire command failed to run (see file $logfile)."
      else
        print "$opf: $sn: TSM dsmc expire command failed to run."
      fi
      freeLockAndExit $rc_fail
    fi

    # No error log means that every object was expired.
    if [[ ! -s $logfile ]]
    then
      print "$ops: $sn: TSM dsmc expire command did not produce any error log."
      freeLockAndExit $rc_success
    fi

    # Process the error log and construct the pending transactions file.
    # Check for objects which failed to get processed (i.e., expired);
    # any such object is treated as a complete failure.
    # NOTE(review): the message below speaks of the "query command" and
    # a "search criteria failure" although it is issued for "Error
    # processing" entries of the expire command.  The wording is kept
    # unchanged in case the invoking program depends on it - confirm.
    tsmListFailedObjects "$errorProcessingString" > "$pendingList"
    if [[ -s $pendingList ]]
    then
      print "$opf: $sn: TSM dsmc query command indicated search criteria failure (see file $logfile)."
      $rm -rf "$pendingList" > /dev/null 2>&1
      freeLockAndExit $rc_fail
    fi

    # Check for objects which do not match, namely,
    # individual files which were not expired.
    tsmListFailedObjects "$objectErrorString" >> "$pendingList"
    print "$opps: $sn: TSM dsmc expire command partially succeeded (see file $logfile)."
    freeLockAndExit $rc_psuccess
    ;;

  #--------------------------------
  # TSM restore command processing
  #--------------------------------
  restore )

    # Clear the error log.  We are only interested in the error log
    # created from issuing the restore command.
    tsmClearErrorLog

    # Issue the TSM command to have the list of files restored.
    # NOTE: We restore the files specified to the mount point of the file
    #       system and not to the snapshot the files were backed up from.
    $dsmc $tsmCommand -filelist="$filelistName" "$mountPoint" > /dev/null 2>&1
    rc=$?

    # NOTE:
    #   According to TSM documentation ("Return Codes from TSM Executables
    #   and Shell Scripts"):
    #   TSM returns 0 even if the file is not successfully backed up,
    #   archived, or restored if the reason for the unsuccessful process is:
    #     . the client could not establish a session with the TSM server, or
    #     . the file does not exist.
    # WARNING:
    #   In unit testing it was learned that if a file does not exist,
    #   the return code on a restore operation is not zero.
    #   For that reason the error log is examined first, regardless of
    #   the return code, and the return code is consulted only when
    #   there is no error log.

    if [[ -s $logfile ]]
    then
      # Process the error log and construct the pending transactions file
      # from the objects which failed to get processed (i.e., restored)
      # and the objects which do not match on the server.
      tsmListFailedObjects "$errorProcessingString" > "$pendingList"
      tsmListFailedObjects "$objectErrorString" >> "$pendingList"
      if [[ -s $pendingList ]]
      then
        print "$opps: $sn: TSM dsmc restore command partially succeeded (see file $logfile)."
        freeLockAndExit $rc_psuccess
      else
        print "$opf: $sn: TSM dsmc restore command failed (see file $logfile)."
        freeLockAndExit $rc_fail
      fi
    elif [[ $rc -eq 0 ]]
    then
      print "$ops: $sn: TSM dsmc restore command did not produce any error log."
      freeLockAndExit $rc_success
    else
      print "$opf: $sn: TSM dsmc restore command failed to run."
      freeLockAndExit $rc_fail
    fi
    ;;

  #-----------------------
  # Unsupported operation
  #-----------------------
  * )
    print "$opf: $sn: Wrong value ($tsmCommand) passed for TSM operation."
    freeLockAndExit $rc_fail
    ;;

esac

# Not normally reached, since every branch above exits on its own.
freeLockAndExit $rc_success
---|
| 746 | |
---|