@@ -807,7 +807,7 @@ function install_systemd_dask_worker() {
807807 local compute_mode_cmd=" "
808808 if command -v nvidia-smi ; then compute_mode_cmd=" nvidia-smi --compute-mode=DEFAULT" ; fi
809809 local worker_name=" dask worker"
810- if test -f " ${DASK_CONDA_ENV} /bin/dask-cuda-worker " ; then worker_name=" dask-cuda worker" ; fi
810+ if test -f " ${DASK_CONDA_ENV} /bin/dask-cuda" ; then worker_name=" dask-cuda worker" ; fi
811811 local worker=" ${DASK_CONDA_ENV} /bin/${worker_name} "
812812 cat << EOF >"${DASK_WORKER_LAUNCHER} "
813813#!/bin/bash
@@ -898,6 +898,39 @@ function install_systemd_dask_service() {
898898 install_systemd_dask_worker
899899}
900900
#######################################
# Starts a single systemd unit and reports on it.
# Runs `systemctl start` (timed), reads the unit's SubState, prints
# /var/log/<unit>.log when the SubState is anything other than 'running',
# and finally prints `systemctl status` for the unit.
# Arguments: $1 - systemd unit name
# Outputs:   log contents (when not running) and unit status on stdout
#######################################
function _start_dask_unit_and_report() {
  local unit="$1"
  local substate_val

  time systemctl start "${unit}"

  # Declared separately from the assignment so `local` cannot mask the status
  # of the command substitution. A failed query is treated as "not running",
  # which makes the log dump below fire instead of aborting the caller.
  substate_val="$(systemctl show "${unit}" -p SubState --value)" || substate_val=''
  if [[ "${substate_val}" != 'running' ]] ; then
    cat "/var/log/${unit}.log"
  fi
  systemctl status "${unit}"
}

#######################################
# Starts the Dask systemd services for a 'standalone' cluster.
# The scheduler unit is started only when the short hostname equals MASTER.
# The worker unit is started only when enable_systemd_dask_worker_service is
# "1", and only after MASTER accepts connections on TCP port 8786.
# Globals:   MASTER, DASK_SCHEDULER_SERVICE, DASK_WORKER_SERVICE,
#            enable_systemd_dask_worker_service (all read)
# Arguments: none
# Outputs:   timestamps, progress messages and unit status on stdout
# Exits:     1 when port 8786 on MASTER is still unreachable after 30 probes
#######################################
function start_systemd_dask_service() {
  # Kept local so the probe counter does not leak into the caller's scope.
  local retries=30

  # only run scheduler on primary master
  if [[ "$(hostname -s)" == "${MASTER}" ]]; then
    date
    _start_dask_unit_and_report "${DASK_SCHEDULER_SERVICE}"
  fi

  echo "Starting Dask 'standalone' cluster..."
  if [[ "${enable_systemd_dask_worker_service}" == "1" ]]; then
    date
    # Pause while scheduler comes online
    while ! nc -vz "${MASTER}" 8786 ; do
      sleep 3s
      # Plain assignment rather than (( retries-- )): an arithmetic command
      # that evaluates to 0 returns a non-zero status.
      retries=$(( retries - 1 ))
      if (( retries <= 0 )) ; then
        echo "dask scheduler unreachable"
        exit 1
      fi
    done
    _start_dask_unit_and_report "${DASK_WORKER_SERVICE}"
  fi

  date
}
933+
901934function configure_knox_for_dask() {
902935 if [[ ! -d " ${KNOX_HOME} " ]]; then
903936 echo " Skip configuring Knox rules for Dask"
@@ -1273,37 +1306,8 @@ function main() {
12731306 elif [[ " ${DASK_RUNTIME} " == " standalone" ]]; then
12741307 # Create Dask service
12751308 install_systemd_dask_service
1309+ start_systemd_dask_service
12761310
1277- # only run scheduler on primary master
1278- if [[ " $( hostname -s) " == " ${MASTER} " ]]; then
1279- date
1280- time systemctl start " ${DASK_SCHEDULER_SERVICE} "
1281- local substate_val=" $( systemctl show ${DASK_SCHEDULER_SERVICE} -p SubState --value) "
1282- if [[ " ${substate_val} " != ' running' ]] ; then
1283- cat " /var/log/${DASK_SCHEDULER_SERVICE} .log"
1284- fi
1285- systemctl status " ${DASK_SCHEDULER_SERVICE} "
1286- fi
1287-
1288- echo " Starting Dask 'standalone' cluster..."
1289- if [[ " ${enable_systemd_dask_worker_service} " == " 1" ]]; then
1290- date
1291- # Pause while scheduler comes online
1292- retries=30
1293- while ! nc -vz " ${MASTER} " 8786 ; do
1294- sleep 3s
1295- (( retries-- ))
1296- if [[ " ${retries} " == " 0" ]] ; then echo " dask scheduler unreachable" ; exit 1 ; fi
1297- done
1298- time systemctl start " ${DASK_WORKER_SERVICE} "
1299- local substate_val=" $( systemctl show ${DASK_WORKER_SERVICE} -p SubState --value) "
1300- if [[ " ${substate_val} " != ' running' ]] ; then
1301- cat " /var/log/${DASK_WORKER_SERVICE} .log"
1302- fi
1303- systemctl status " ${DASK_WORKER_SERVICE} "
1304- fi
1305-
1306- date
13071311 configure_knox_for_dask
13081312
13091313 local DASK_CLOUD_LOGGING=" $( get_metadata_attribute dask-cloud-logging || echo ' false' ) "
@@ -1325,7 +1329,7 @@ function exit_handler() {
13251329
13261330function prepare_to_install(){
13271331 prepare_common_env
1328- conda_env=" $( get_metadata_attribute conda-env || echo ' dask' ) "
1332+ conda_env=" $( get_metadata_attribute conda-env ' dask' ) "
13291333 readonly conda_env
13301334 prepare_dask_env
13311335 trap exit_handler EXIT
0 commit comments