-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathtestsuite_control_cluster.sh
executable file
·106 lines (86 loc) · 1.98 KB
/
testsuite_control_cluster.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
#!/bin/sh
#########################################################
#
#
#########################################################
## INIT nodes / SOME CHECKS
#########################################################
# all is done from the Host
# Load the helper library named "functions" from the current working
# directory, then load the configuration.
# The path is quoted so that a working directory containing whitespace or
# glob characters is still treated as a single path.
if [ -f "$(pwd)/functions" ]; then
  . "$(pwd)/functions"
else
  echo "! need functions in current path; Exiting"
  exit 1
fi
# check_load_config_file is not defined in this script; presumably it is
# provided by the sourced "functions" file -- confirm there.
check_load_config_file
#######################################
# Mark every node down in Slurm, wait, then resume them.
# All scontrol/sinfo commands are sent through exec_on_node to the first
# node, ${NODENAME}1; the state changes target ${NODENAME}[1-${NBNODE}].
# Globals:
#   NODENAME (read) - node name prefix
#   NBNODE   (read) - upper bound of the node range
#   I, O     (read) - expanded unquoted around the banner text; set outside
#                     this script (presumably echo options/decoration --
#                     confirm in "functions")
# Arguments:
#   None
# Outputs:
#   A banner line on stdout, plus whatever exec_on_node prints.
# Returns:
#   Status of the final exec_on_node call.
#######################################
slurm_down_up() {
  # $I and $O stay unquoted on purpose: an empty value must vanish instead
  # of becoming an empty argument to echo.
  echo $I "############ START slurm_down_up" $O
  # Show the state before the change.
  exec_on_node "${NODENAME}1" "scontrol show node"
  exec_on_node "${NODENAME}1" "sinfo"
  exec_on_node "${NODENAME}1" "scontrol update NodeName=${NODENAME}[1-${NBNODE}] State=down Reason=hung_proc"
  # Pause 3 seconds between setting the nodes down and resuming them.
  sleep 3
  exec_on_node "${NODENAME}1" "scontrol update NodeName=${NODENAME}[1-${NBNODE}] State=resume"
  # Show the state after the resume.
  exec_on_node "${NODENAME}1" "sinfo"
}
#######################################
# Run one command on every node, ${NODENAME}1 through ${NODENAME}${NBNODE},
# in ascending order, via exec_on_node.
# Globals:
#   NODENAME (read)    - node name prefix
#   NBNODE   (read)    - index of the last node; must be a whole number
#   I, O     (read)    - expanded unquoted around the banner text; set
#                        outside this script
#   CMD      (written) - the command line (all arguments joined by spaces)
#   i        (written) - loop index
# Arguments:
#   $@ - the command; all words are joined into a single string
# Outputs:
#   A banner line on stdout, plus whatever exec_on_node prints.
# Exits:
#   1 when no command is given, or when NBNODE is empty or not numeric.
#   Note that this is `exit`, so it ends the whole script.
#######################################
cmd_on_nodes() {
  echo $I "############ START cmd" $O
  if [ -z "$*" ]; then
    echo "- First arg must be the command!"
    exit 1
  fi
  # Without this check an empty NBNODE turns "seq 1 $NBNODE" into "seq 1",
  # which silently runs the command on node 1 only.
  case "$NBNODE" in
    '' | *[!0-9]*)
      echo "- NBNODE must be a whole number (got '${NBNODE}')" >&2
      exit 1
      ;;
  esac
  CMD="$*"
  # The node list is expanded once, before the loop starts, so the
  # iteration does not depend on what exec_on_node does to "i".
  for i in $(seq 1 "$NBNODE"); do
    exec_on_node "${NODENAME}${i}" "$CMD"
  done
}
#scontrol show job
#scontrol show partition
##########################
##########################
### MAIN
##########################
##########################
# Command dispatch: $1 selects the action. Any other value (including no
# argument at all) prints the usage text and exits with status 1.
# Every handler except slurm_down_up and cmd_on_nodes is defined outside
# this script (presumably in the sourced "functions" file).
case "$1" in
  slurmdownup)
    slurm_down_up
    ;;
  scc)
    enable_SCC_repo
    ;;
  cleanrepo)
    cleanup_zypper_repo
    ;;
  update)
    update_nodes
    ;;
  start)
    start_vm
    ;;
  stop)
    stop_vm
    ;;
  cmd)
    # Forward every word after "cmd" untouched. Passing an unquoted $2
    # dropped all words after the first and glob-expanded the command on
    # the host before it ever reached the nodes.
    shift
    cmd_on_nodes "$@"
    ;;
  install)
    # $2 is left unquoted so that a quoted list ("pkg1 pkg2") is split into
    # one argument per package, matching "package name (or list)" in the
    # usage text. NOTE(review): confirm how install_package reads its
    # arguments before quoting this.
    # shellcheck disable=SC2086
    install_package $2
    ;;
  *)
    # Only commands that have a case arm above are listed here.
    echo "
scc
enable SCC repo and add PackageHub repo
cleanrepo
disable SCC (cleanup) and remove all zypper repo
update
update all nodes with latest packages
start
start all nodes
stop
stop all nodes
cmd
run a command on all nodes
install
install package name (or list)
slurmdownup
scontrol update NodeName=<node> State=down Reason=hung_proc
scontrol update NodeName=<node> State=resume
"
    exit 1
    ;;
esac