From 8b3d66167f9d0823198cecfef44dd216f4da07bd Mon Sep 17 00:00:00 2001 From: dbaranchuk Date: Sun, 31 Jul 2022 06:13:59 +0300 Subject: [PATCH] set throughput=1 to fix 0 throughput problem --- cli/demo_deploy_server.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/cli/demo_deploy_server.sh b/cli/demo_deploy_server.sh index 298d187..2b8f9cb 100644 --- a/cli/demo_deploy_server.sh +++ b/cli/demo_deploy_server.sh @@ -28,4 +28,4 @@ NUM_BLOCKS="3" # one converted block consumes ~3.5Gb export OMP_NUM_THREADS="16" # just in case CUDA_VISIBLE_DEVICES=${GPU_ID} python -m cli.run_server --converted_model_name_or_path ${MODEL_NAME} --torch_dtype float16 --initial_peer ${INITIAL_PEER} \ --compression BLOCKWISE_8BIT --identity_path ${SERVER_ID_PATH} --host_maddrs ${HOST_MADDR} \ - --num_blocks ${NUM_BLOCKS} --load_in_8bit \ No newline at end of file + --num_blocks ${NUM_BLOCKS} --load_in_8bit --throughput 1 \ No newline at end of file