Commit a8bd41f 1 parent cb88657 commit a8bd41f Copy full SHA for a8bd41f
File tree 1 file changed +6
-7
lines changed
1 file changed +6
-7
lines changed Original file line number Diff line number Diff line change @@ -6,12 +6,10 @@ usage() {
6
6
}
7
7
8
8
# parse arguments
9
- address=localhost
10
9
rmm_pool_size=1GB
11
10
12
11
while getopts ":a:i:r:t:" flag; do
13
12
case "${flag}" in
14
- a) address=${OPTARG} ;;
15
13
i) interface=${OPTARG} ;;
16
14
r) rmm_pool_size=${OPTARG} ;;
17
15
t) transport=${OPTARG} ;;
@@ -29,8 +27,8 @@ DASK_UCX__CUDA_COPY=True
29
27
DASK_UCX__TCP=True
30
28
DASK_RMM__POOL_SIZE=$rmm_pool_size
31
29
32
- scheduler_flags=" --protocol ucx"
33
- worker_flags=" --enable-tcp-over-ucx --rmm-pool-size ${rmm_pool_size} "
30
+ scheduler_flags=" --scheduler-file scheduler.json --protocol ucx"
31
+ worker_flags=" --scheduler-file scheduler.json --enable-tcp-over-ucx --rmm-pool-size ${rmm_pool_size} "
34
32
35
33
if ! [ -z ${interface+x} ]; then
36
34
scheduler_flags+=" --interface ${interface} "
@@ -42,14 +40,15 @@ if [[ $transport == *"nvlink"* ]]; then
42
40
fi
43
41
if [[ $transport == *"ib"* ]]; then
44
42
DASK_UCX__INFINIBAND=True
45
- DASK_UCX__RDMACM=True
43
+ # DASK_UCX__RDMACM=True # RDMACM not working right now
46
44
DASK_UCX__NET_DEVICES=mlx5_0:1
47
45
48
- worker_flags+=" --enable-infiniband --enable-rdmacm --net-devices=auto"
46
+ # worker_flags+=" --enable-infiniband --enable-rdmacm --net-devices=auto"
47
+ worker_flags+=" --enable-infiniband --net-devices=auto"
49
48
fi
50
49
51
50
# initialize scheduler
52
51
dask-scheduler $scheduler_flags &
53
52
54
53
# initialize workers
55
- dask-cuda-worker ucx://${address}:8786 $worker_flags
54
+ dask-cuda-worker $worker_flags
You can’t perform that action at this time.
0 commit comments