-
Notifications
You must be signed in to change notification settings - Fork 57
/
Copy pathdocker-entrypoint.sh
executable file
·84 lines (69 loc) · 2.15 KB
/
docker-entrypoint.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
#!/bin/bash
set -eo pipefail
export SLURM_NODE_COUNT=${SLURM_NODE_COUNT:-3}
SLURMD_PORT_BASE=7000
declare -a SLURMD_PORT_RANGE=$(seq -w $SLURMD_PORT_BASE $((SLURMD_PORT_BASE + SLURM_NODE_COUNT)))
declare -a SLURM_PORTS=(6817 6819 6820 3306 $SLURMD_PORT_RANGE)
function error_with_msg {
if [[ "$count" -eq 0 ]]
then
echo
echo >&2 "$1"
exit 1
fi
}
if [ ! -d "/var/lib/mysql/mysql" ]
then
echo "[mysqld]\nskip-host-cache\nskip-name-resolve" > /etc/my.cnf.d/docker.cnf
echo "- Initializing database"
/usr/bin/mysql_install_db --user=mysql &> /dev/null
echo "- Database initialized"
fi
if [ ! -d "/var/lib/mysql/slurm_acct_db" ]
then
/usr/bin/mysqld_safe &
for count in {30..0}; do
if echo "SELECT 1" | mysql &> /dev/null
then
break
fi
echo "- Starting MariaDB to create Slurm account database"
sleep 1
done
error_with_msg "MariaDB did not start"
echo "- Creating Slurm acct database"
mysql -NBe "CREATE USER 'slurm'@'localhost' identified by 'password'"
mysql -NBe "GRANT ALL ON slurm_acct_db.* to 'slurm'@'localhost' identified by 'password' with GRANT option"
mysql -NBe "GRANT ALL ON slurm_acct_db.* to 'slurm'@'slurmctl' identified by 'password' with GRANT option"
mysql -NBe "CREATE DATABASE slurm_acct_db"
echo "- Slurm acct database created. Stopping MariaDB"
killall mysqld
for count in {30..0}; do
if echo "SELECT 1" | mysql &> /dev/null
then
sleep 1
else
break
fi
done
error_with_msg "MariaDB did not stop"
fi
echo "- Starting supervisord process manager"
/usr/bin/supervisord --configuration /etc/supervisord.conf
echo "- Starting all Services..."
for service in munged mysqld slurmdbd slurmctld slurmd slurmrestd
do
/usr/bin/supervisorctl start "$service:*"
done
echo "- Waiting for the cluster to become available"
for count in {10..0}; do
if ! grep -q "normal.*idle" <(timeout 1 sinfo)
then
sleep 1
else
break
fi
done
error_with_msg "Slurm partitions failed to start successfully."
echo "- Cluster is now available"
exec "$@"