#!/usr/bin/env expect ############################################################################ # Purpose: Test of Slurm functionality # Test of job dependencies and deferred begin time (--dependency # and --begin options). # # Output: "TEST: #.#" followed by "SUCCESS" if test was successful, OR # "FAILURE: ..." otherwise with an explanation of the failure, OR # anything else indicates a failure mode that must be investigated. ############################################################################ # Copyright (C) 2004-2007 The Regents of the University of California. # Produced at Lawrence Livermore National Laboratory (cf, DISCLAIMER). # Written by Morris Jette # CODE-OCEC-09-009. All rights reserved. # # This file is part of Slurm, a resource management program. # For details, see . # Please also read the included file: DISCLAIMER. # # Slurm is free software; you can redistribute it and/or modify it under # the terms of the GNU General Public License as published by the Free # Software Foundation; either version 2 of the License, or (at your option) # any later version. # # Slurm is distributed in the hope that it will be useful, but WITHOUT ANY # WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS # FOR A PARTICULAR PURPOSE. See the GNU General Public License for more # details. # # You should have received a copy of the GNU General Public License along # with Slurm; if not, write to the Free Software Foundation, Inc., # 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA. ############################################################################ source ./globals set test_id "17.18" set file_in "test$test_id.input" set file_out "test$test_id.output" set exit_code 0 set job_id1 0 set job_id2 0 print_header $test_id # # Build input script file # exec $bin_rm -f $file_in $file_out make_bash_script $file_in "$bin_sleep 5" # # Spawn a batch job that just sleeps for a while # set timeout $max_job_delay spawn $sbatch --output=/dev/null --error=/dev/null -t1 $file_in expect { -re "Submitted batch job ($number)" { set job_id1 $expect_out(1,string) exp_continue } timeout { send_user "\nFAILURE: sbatch not responding\n" set exit_code 1 exp_continue } eof { wait } } if {$job_id1 == 0} { send_user "\nFAILURE: batch submit failure\n" exit 1 } # # Submit a dependent job # exec $bin_rm -f $file_in make_bash_script $file_in "$scontrol show job $job_id1" set match_state 0 set timeout 30 spawn $sbatch --dependency=afterany:$job_id1 --output=$file_out $file_in expect { -re "Submitted batch job ($number)" { set job_id2 $expect_out(1,string) exp_continue } eof { wait } } if {$job_id2 == 0} { send_user "\nFAILURE: batch submit failure\n" exit 1 } # # Confirm dependency info within second job # set match_jobid 0 set purged_job 0 spawn $scontrol show job $job_id2 expect { -re "Dependency=afterany:($number)" { set match_jobid $expect_out(1,string) exp_continue } -re "Invalid job id specified" { set purged_job 1 exp_continue } timeout { send_user "\nFAILURE: scontrol not responding\n" set exit_code 1 } eof { wait } } if {$match_jobid == 0} { set min_job_age [get_min_job_age] if {$min_job_age < 60} { send_user "\nWARNING: MinJobAge ($min_job_age) configured too low " send_user "to capture job state after completion\n" } else { send_user "\nFAILURE: Dependency information is missing\n" set exit_code 1 } } elseif {$match_jobid != $job_id1} { send_user "\nFAILURE: Dependency information not processed\n" set exit_code 1 } # # Wait for job to complete # if {[wait_for_job $job_id2 "DONE"] != 0} { send_user "\nFAILURE: waiting for job to complete\n" cancel_job $job_id2 cancel_job $job_id1 exit 1 } cancel_job $job_id1 # # Inspect the job's output file # if {[wait_for_file $file_out] != 0} { exit 1 } spawn $bin_cat $file_out expect { # Could be COMPLETED or COMPLETING -re "JobState=COMPLET" { set match_state 1 exp_continue } eof { wait } } if {$match_state == 0} { send_user "\nFAILURE: Dependent job not completed\n" set exit_code 1 } # # Submit a job to run at noon tomorrow # set job_id1 0 spawn $sbatch --output=/dev/null --error=/dev/null --begin=noon-tomorrow $file_in expect { -re "Submitted batch job ($number)" { set job_id1 $expect_out(1,string) exp_continue } eof { wait } } if {$job_id1 == 0} { send_user "\nFAILURE: batch submit failure\n" exit 1 } exec $bin_sleep 5 set match 0 spawn $scontrol show job $job_id1 expect { -re "JobState=PENDING" { incr match exp_continue } -re "StartTime=($number)/($number)-12:00:00" { incr match exp_continue } -re "StartTime=($number)-($number)-($number)T12:00:00" { incr match exp_continue } timeout { send_user "\nFAILURE: scontrol not responding\n" set exit_code 1 exp_continue } eof { wait } } if {$match != 2} { send_user "\nFAILURE: unexpected JobState or StartTime $match\n" set exit_code 1 } # Reset start time and test for completion spawn $scontrol update JobId=$job_id1 StartTime=now expect { timeout { send_user "\nFAILURE: scontrol not responding\n" set exit_code 1 exp_continue } eof { wait } } set delayed 0 set is_done 0 set purged_job 0 while { $delayed < $max_job_delay } { exec $bin_sleep 10 incr delayed +10 spawn $scontrol show job $job_id1 expect { -re "JobState=COMPLETED" { set is_done 1 exp_continue } -re "Invalid job id specified" { set is_done 1 set purged_job 1 exp_continue } timeout { send_user "\nFAILURE: scontrol not responding\n" set exit_code 1 exp_continue } eof { wait } } if {$is_done == 1} { break } } if {$is_done == 0} { send_user "\nFAILURE: unexpected JobState\n" cancel_job $job_id1 set exit_code 1 } if {$purged_job == 1} { set min_job_age [get_min_job_age] if {$min_job_age < 60} { send_user "\nWARNING: MinJobAge ($min_job_age) configured too low " send_user "to capture job state after completion\n" } else { send_user "\nFAILURE: Could not find job $job_id1\n" set exit_code 1 } } if {$exit_code == 0} { exec $bin_rm -f $file_in $file_out send_user "\nSUCCESS\n" } exit $exit_code