Skip to content

Commit 7b767be

Browse files
committed
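Refactored the standalone service start-up code out of main() into start_systemd_dask_service(); the default value for the conda-env metadata attribute is now passed to get_metadata_attribute as an argument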
1 parent 4587725 commit 7b767be

File tree

1 file changed

+36
-32
lines changed

1 file changed

+36
-32
lines changed

dask/dask.sh

Lines changed: 36 additions & 32 deletions
Original file line numberDiff line numberDiff line change
@@ -807,7 +807,7 @@ function install_systemd_dask_worker() {
807807
local compute_mode_cmd=""
808808
if command -v nvidia-smi ; then compute_mode_cmd="nvidia-smi --compute-mode=DEFAULT" ; fi
809809
local worker_name="dask worker"
810-
if test -f "${DASK_CONDA_ENV}/bin/dask-cuda-worker" ; then worker_name="dask-cuda worker" ; fi
810+
if test -f "${DASK_CONDA_ENV}/bin/dask-cuda" ; then worker_name="dask-cuda worker" ; fi
811811
local worker="${DASK_CONDA_ENV}/bin/${worker_name}"
812812
cat <<EOF >"${DASK_WORKER_LAUNCHER}"
813813
#!/bin/bash
@@ -898,6 +898,39 @@ function install_systemd_dask_service() {
898898
install_systemd_dask_worker
899899
}
900900

901+
#######################################
# Start the systemd units of a Dask 'standalone' cluster on this node.
#
# The scheduler unit is started only when the short hostname equals
# ${MASTER}. The worker unit is started only when
# enable_systemd_dask_worker_service is "1", after the scheduler port
# (8786 on ${MASTER}) accepts connections. After each start, the unit's
# log under /var/log is printed if its SubState is not 'running', and
# `systemctl status` is shown.
#
# Globals (read):
#   MASTER, DASK_SCHEDULER_SERVICE, DASK_WORKER_SERVICE,
#   enable_systemd_dask_worker_service
# Outputs:
#   Progress, timing and status information on stdout/stderr.
# Exits:
#   1 if the scheduler is still unreachable after 30 probes (3s apart).
#######################################
function start_systemd_dask_service() {
  # Declared separately from the assignments so that `local` does not mask
  # the exit status of the command substitution, and declared only once.
  local substate_val
  # Kept local so the retry counter does not leak into the caller's scope.
  local retries

  # only run scheduler on primary master
  if [[ "$(hostname -s)" == "${MASTER}" ]]; then
    date
    time systemctl start "${DASK_SCHEDULER_SERVICE}"
    # Best effort: if the state cannot be queried, treat the unit as not
    # running so that its log is printed below.
    substate_val="$(systemctl show "${DASK_SCHEDULER_SERVICE}" -p SubState --value)" \
      || substate_val=""
    if [[ "${substate_val}" != 'running' ]]; then
      cat "/var/log/${DASK_SCHEDULER_SERVICE}.log"
    fi
    systemctl status "${DASK_SCHEDULER_SERVICE}"
  fi

  echo "Starting Dask 'standalone' cluster..."
  if [[ "${enable_systemd_dask_worker_service}" == "1" ]]; then
    date
    # Pause while scheduler comes online
    retries=30
    while ! nc -vz "${MASTER}" 8786; do
      sleep 3s
      # Plain assignment instead of ((retries--)): an arithmetic command
      # returns non-zero when its value is 0, which is fragile under set -e.
      retries=$((retries - 1))
      if ((retries == 0)); then
        echo "dask scheduler unreachable" >&2
        exit 1
      fi
    done
    time systemctl start "${DASK_WORKER_SERVICE}"
    substate_val="$(systemctl show "${DASK_WORKER_SERVICE}" -p SubState --value)" \
      || substate_val=""
    if [[ "${substate_val}" != 'running' ]]; then
      cat "/var/log/${DASK_WORKER_SERVICE}.log"
    fi
    systemctl status "${DASK_WORKER_SERVICE}"
  fi

  date
}
933+
901934
function configure_knox_for_dask() {
902935
if [[ ! -d "${KNOX_HOME}" ]]; then
903936
echo "Skip configuring Knox rules for Dask"
@@ -1273,37 +1306,8 @@ function main() {
12731306
elif [[ "${DASK_RUNTIME}" == "standalone" ]]; then
12741307
# Create Dask service
12751308
install_systemd_dask_service
1309+
start_systemd_dask_service
12761310

1277-
# only run scheduler on primary master
1278-
if [[ "$(hostname -s)" == "${MASTER}" ]]; then
1279-
date
1280-
time systemctl start "${DASK_SCHEDULER_SERVICE}"
1281-
local substate_val="$(systemctl show ${DASK_SCHEDULER_SERVICE} -p SubState --value)"
1282-
if [[ "${substate_val}" != 'running' ]] ; then
1283-
cat "/var/log/${DASK_SCHEDULER_SERVICE}.log"
1284-
fi
1285-
systemctl status "${DASK_SCHEDULER_SERVICE}"
1286-
fi
1287-
1288-
echo "Starting Dask 'standalone' cluster..."
1289-
if [[ "${enable_systemd_dask_worker_service}" == "1" ]]; then
1290-
date
1291-
# Pause while scheduler comes online
1292-
retries=30
1293-
while ! nc -vz "${MASTER}" 8786 ; do
1294-
sleep 3s
1295-
((retries--))
1296-
if [[ "${retries}" == "0" ]] ; then echo "dask scheduler unreachable" ; exit 1 ; fi
1297-
done
1298-
time systemctl start "${DASK_WORKER_SERVICE}"
1299-
local substate_val="$(systemctl show ${DASK_WORKER_SERVICE} -p SubState --value)"
1300-
if [[ "${substate_val}" != 'running' ]] ; then
1301-
cat "/var/log/${DASK_WORKER_SERVICE}.log"
1302-
fi
1303-
systemctl status "${DASK_WORKER_SERVICE}"
1304-
fi
1305-
1306-
date
13071311
configure_knox_for_dask
13081312

13091313
local DASK_CLOUD_LOGGING="$(get_metadata_attribute dask-cloud-logging || echo 'false')"
@@ -1325,7 +1329,7 @@ function exit_handler() {
13251329

13261330
function prepare_to_install(){
13271331
prepare_common_env
1328-
conda_env="$(get_metadata_attribute conda-env || echo 'dask')"
1332+
conda_env="$(get_metadata_attribute conda-env 'dask')"
13291333
readonly conda_env
13301334
prepare_dask_env
13311335
trap exit_handler EXIT

0 commit comments

Comments
 (0)