Spaces:
Runtime error
Runtime error
| TOT_CUDA="0,1,2,3" #Upgrade bitsandbytes to the latest version to enable balanced loading of multiple GPUs | |
| BASE_MODEL="yahma/llama-7b-hf" | |
| LORA_PATH="Chinese-Vicuna/Chinese-Vicuna-lora-7b-chatv1" | |
| INT8=1 | |
| SHOW_BEAM=0 # 是否显示全部的beam生成效果 | |
| if [[ $DEBUG -eq 1 ]] | |
| then | |
| CUDA_VISIBLE_DEVICES=${TOT_CUDA} jurigged -v chat.py --model_path $BASE_MODEL --lora_path $LORA_PATH\ | |
| --int8 $INT8\ | |
| --use_typewriter 1 \ | |
| --show_beam $SHOW_BEAM \ | |
| --prompt_type "chat" \ | |
| --share_link 0 | |
| else | |
| CUDA_VISIBLE_DEVICES=${TOT_CUDA} python chat.py --model_path $BASE_MODEL --lora_path $LORA_PATH\ | |
| --int8 $INT8\ | |
| --use_typewriter 1 \ | |
| --show_beam $SHOW_BEAM \ | |
| --prompt_type "chat" \ | |
| --share_link 0 | |
| fi |