1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586 |
- #!/usr/bin/env bash
- #################
- # Parse options #
- #################
- instructions() {
- echo "Usage: $0 [-m] [-i] [ -d ] [ -p ] [ -b ] [-a] [-t]" >&2
- echo " -m: model name"
- echo " -i: initial peer"
- echo " -d: device" >&2
- echo " -p: server identity path" >&2
- echo " -b: block_ids" >&2
- echo " -a: host maddrs" >&2
- echo " -t: whether to run local tests" >&2
- exit 1
- }
- if [ ! $# -ge 8 ]; then
- instructions
- fi
- while getopts ":m:i:d:p:b:a:t:" option; do
- case $option in
- m) MODEL_NAME=${OPTARG}
- ;;
- i) INITIAL_PEER=${OPTARG}
- ;;
- d) DEVICE=${OPTARG}
- ;;
- p) SERVER_ID_PATH=${OPTARG}
- ;;
- b) BLOCK_IDS=${OPTARG}
- ;;
- a) HOST_MADDR=${OPTARG} # TODO: allow several maddrs
- ;;
- t) RUN_LOCAL_TESTS=true
- ;;
- \?) instructions
- ;;
- esac
- done
- echo "=========="
- echo "= Config ="
- echo "=========="
- echo "Model name: ${MODEL_NAME}"
- echo "Initial peer: ${INITIAL_PEER}"
- echo "Device: ${DEVICE}"
- echo "Server name: ${SERVER_ID_PATH}"
- echo "Server address: ${HOST_MADDR}"
- echo "Bloom blocks: ${BLOCK_IDS}"
- ###########################
- # Install or activate env #
- ###########################
- # TODO fix bug with self calling
- source ~/miniconda3/etc/profile.d/conda.sh
- if conda env list | grep ".*bloom-demo.*" >/dev/null 2>/dev/null; then
- conda activate bloom-demo
- else
- conda create -y --name bloom-demo python=3.8.12 pip
- conda activate bloom-demo
- conda install -y -c conda-forge cudatoolkit-dev==11.3.1 cudatoolkit==11.3.1 cudnn==8.2.1.32
- pip install -i https://pypi.org/simple torch==1.12.0+cu113 -f https://download.pytorch.org/whl/torch_stable.html
- pip install -i https://pypi.org/simple -r requirements.txt
- fi
- ##############
- # Run server #
- ##############
- # [('NONE', 0),
- # ('MEANSTD_16BIT', 1),
- # ('FLOAT16', 2),
- # ('QUANTILE_8BIT', 3),
- # ('UNIFORM_8BIT', 4),
- # ('BLOCKWISE_8BIT', 5)]
- export OMP_NUM_THREADS=16
- CUDA_VISIBLE_DEVICES=${DEVICE} python -m cli.run_server --converted_model_name_or_path ${MODEL_NAME} --torch_dtype float16 --initial_peer ${INITIAL_PEER} --cache_dir '/extra_disk_1/dbaranchuk/test-bloomd' \
- --block_indices ${BLOCK_IDS} --compression BLOCKWISE_8BIT --identity_path ${SERVER_ID_PATH} --host_maddrs ${HOST_MADDR} --load_in_8bit #&> logs/${SERVER_ID_PATH}.log
|