#!/usr/bin/env expect
############################################################################
# Purpose: Test of Slurm functionality
#          Test of partition specification on job submission (--partition
#          option).
############################################################################
# Copyright (C) 2002-2006 The Regents of the University of California.
# Produced at Lawrence Livermore National Laboratory (cf, DISCLAIMER).
# Written by Morris Jette
# CODE-OCEC-09-009. All rights reserved.
#
# This file is part of Slurm, a resource management program.
# For details, see <https://slurm.schedmd.com/>.
# Please also read the included file: DISCLAIMER.
#
# Slurm is free software; you can redistribute it and/or modify it under
# the terms of the GNU General Public License as published by the Free
# Software Foundation; either version 2 of the License, or (at your option)
# any later version.
#
# Slurm is distributed in the hope that it will be useful, but WITHOUT ANY
# WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
# FOR A PARTICULAR PURPOSE.  See the GNU General Public License for more
# details.
#
# You should have received a copy of the GNU General Public License along
# with Slurm; if not, write to the Free Software Foundation, Inc.,
# 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301  USA.
############################################################################
source ./globals

set def_part_name   ""
set exit_code       0
set file_in         "test$test_id.input"
set job_id          0
set other_part_name ""

#
# Identify the partitions in the cluster, identifying the default.
# Each "<name> ... up" line of the sinfo summary is examined: a name that
# contains "*" is recorded as the default partition (the text before the
# last "*"), any other name is remembered as a non-default partition.
#
spawn $sinfo --summarize
expect {
	-re "($end_of_line)($re_word_str) *up" {
		set part_name $expect_out(2,string)
		set last [string last "*" $part_name]
		if {$last != -1} {
			set def_part_name [string range $part_name 0 [expr {$last - 1}]]
		} else {
			set other_part_name $part_name
		}
		exp_continue
	}
	-re "Unable to contact" {
		fail "Slurm appears to be down"
	}
	timeout {
		log_error "sinfo not responding"
		set exit_code 1
	}
	eof {
		wait
	}
}

#
# Submit a job explicitly to the default partition
#
set job_id 0
set timeout $max_job_delay
set salloc_pid [spawn $salloc --partition=$def_part_name -t1 $bin_sleep 1]
expect {
	-re "Granted job allocation ($number)" {
		set job_id $expect_out(1,string)
		exp_continue
	}
	timeout {
		log_error "salloc not responding"
		if {$job_id != 0} {
			cancel_job $job_id
		}
		# The negated PID is handed to slow_kill
		# NOTE(review): presumably targets the process group - confirm
		# against the slow_kill definition in globals.
		slow_kill [expr {0 - $salloc_pid}]
		set exit_code 1
	}
	eof {
		wait
	}
}

# Confirm the job's partition
if {$job_id == 0} {
	log_error "Job submit failure"
	set exit_code 1
} else {
	set read_part ""
	spawn $scontrol show job $job_id
	expect {
		-re "Partition=($re_word_str)" {
			set read_part $expect_out(1,string)
			exp_continue
		}
		timeout {
			log_error "scontrol not responding"
			set exit_code 1
		}
		eof {
			wait
		}
	}
	if {$read_part ne $def_part_name} {
		log_error "Improper partition selected"
		set exit_code 1
	}
	cancel_job $job_id
}

#
# Test if a non-default partition exists, terminate if none
#
if {$other_part_name eq ""} {
	# Report failures from the default-partition test before skipping,
	# otherwise they would be hidden behind the skip.
	if {$exit_code != 0} {
		fail "Test failed due to previous errors (\$exit_code = $exit_code)"
	}
	skip "Can't test salloc partition option only the default partition exists"
}

#
# Submit job explicitly to a non-default partition
#
set job_id 0
set legit_failure 0
set salloc_pid [spawn $salloc --partition=$other_part_name -t1 $bin_sleep 1]
expect {
	-re "Required node not available" {
		# The partition cannot run the job: interrupt salloc and
		# record this as a tolerated outcome rather than an error.
		set legit_failure 1
		exec $bin_kill -INT $salloc_pid
		exp_continue
	}
	-re "Granted job allocation ($number)" {
		set job_id $expect_out(1,string)
		exp_continue
	}
	timeout {
		log_error "salloc not responding"
		if {$job_id != 0} {
			cancel_job $job_id
		}
		slow_kill [expr {0 - $salloc_pid}]
		set exit_code 1
	}
	eof {
		wait
	}
}

# Confirm the job's partition
if {$legit_failure == 1} {
	log_warn "Partition '$other_part_name' is not usable"
} elseif {$job_id == 0} {
	log_error "Job submit failure"
	set exit_code 1
} else {
	set read_part ""
	spawn $scontrol show job $job_id
	expect {
		-re "Partition=($re_word_str)" {
			set read_part $expect_out(1,string)
			exp_continue
		}
		timeout {
			log_error "scontrol not responding"
			set exit_code 1
		}
		eof {
			wait
		}
	}
	if {$read_part ne $other_part_name} {
		log_error "Improper partition selected"
		set exit_code 1
	}
	cancel_job $job_id
}

if {$exit_code != 0} {
	fail "Test failed due to previous errors (\$exit_code = $exit_code)"
}