deploy_server.sh 2.3 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586
  1. #!/usr/bin/env bash
  2. #################
  3. # Parse options #
  4. #################
  5. instructions() {
  6. echo "Usage: $0 [-m] [-i] [ -d ] [ -p ] [ -b ] [-a] [-t]" >&2
  7. echo " -m: model name"
  8. echo " -i: initial peer"
  9. echo " -d: device" >&2
  10. echo " -p: server identity path" >&2
  11. echo " -b: block_ids" >&2
  12. echo " -a: host maddrs" >&2
  13. echo " -t: whether to run local tests" >&2
  14. exit 1
  15. }
  16. if [ ! $# -ge 8 ]; then
  17. instructions
  18. fi
  19. while getopts ":m:i:d:p:b:a:t:" option; do
  20. case $option in
  21. m) MODEL_NAME=${OPTARG}
  22. ;;
  23. i) INITIAL_PEER=${OPTARG}
  24. ;;
  25. d) DEVICE=${OPTARG}
  26. ;;
  27. p) SERVER_ID_PATH=${OPTARG}
  28. ;;
  29. b) BLOCK_IDS=${OPTARG}
  30. ;;
  31. a) HOST_MADDR=${OPTARG} # TODO: allow several maddrs
  32. ;;
  33. t) RUN_LOCAL_TESTS=true
  34. ;;
  35. \?) instructions
  36. ;;
  37. esac
  38. done
  39. echo "=========="
  40. echo "= Config ="
  41. echo "=========="
  42. echo "Model name: ${MODEL_NAME}"
  43. echo "Initial peer: ${INITIAL_PEER}"
  44. echo "Device: ${DEVICE}"
  45. echo "Server name: ${SERVER_ID_PATH}"
  46. echo "Server address: ${HOST_MADDR}"
  47. echo "Bloom blocks: ${BLOCK_IDS}"
  48. ###########################
  49. # Install or activate env #
  50. ###########################
  51. # TODO fix bug with self calling
  52. source ~/miniconda3/etc/profile.d/conda.sh
  53. if conda env list | grep ".*bloom-demo.*" >/dev/null 2>/dev/null; then
  54. conda activate bloom-demo
  55. else
  56. conda create -y --name bloom-demo python=3.8.12 pip
  57. conda activate bloom-demo
  58. conda install -y -c conda-forge cudatoolkit-dev==11.3.1 cudatoolkit==11.3.1 cudnn==8.2.1.32
  59. pip install -i https://pypi.org/simple torch==1.12.0+cu113 -f https://download.pytorch.org/whl/torch_stable.html
  60. pip install -i https://pypi.org/simple -r requirements.txt
  61. fi
  62. ##############
  63. # Run server #
  64. ##############
  65. # [('NONE', 0),
  66. # ('MEANSTD_16BIT', 1),
  67. # ('FLOAT16', 2),
  68. # ('QUANTILE_8BIT', 3),
  69. # ('UNIFORM_8BIT', 4),
  70. # ('BLOCKWISE_8BIT', 5)]
  71. export OMP_NUM_THREADS=16
  72. CUDA_VISIBLE_DEVICES=${DEVICE} python -m cli.run_server --converted_model_name_or_path ${MODEL_NAME} --torch_dtype float16 --initial_peer ${INITIAL_PEER} --cache_dir '/extra_disk_1/dbaranchuk/test-bloomd' \
  73. --block_indices ${BLOCK_IDS} --compression BLOCKWISE_8BIT --identity_path ${SERVER_ID_PATH} --host_maddrs ${HOST_MADDR} --load_in_8bit #&> logs/${SERVER_ID_PATH}.log