1. 租GPU
2. 安装 docker
bash -c "$(curl -L https://github.com/initialencounter/mydocker/raw/main/utils/nvidia-container.sh)"
3. Start the container (host port 3389 is mapped to port 7860 inside the container)
docker run -it -p 3389:7860 --gpus 0 initialencounter/fish-speech
4. Start the API service (run these commands inside the container; the server listens on port 7860)
cd /app/fish-speech
HF_ENDPOINT=https://hf-mirror.com python -m zibai tools.api_server:app --listen 0.0.0.0:7860
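5. Load the model with a PUT request to /v1/models/default (run on the host; port 3389 is forwarded to the service on port 7860)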
curl -X 'PUT' \
'http://localhost:3389/v1/models/default' \
-H 'accept: application/json' \
-H 'Content-Type: application/json' \
-d '{
"device": "cuda",
"llama": {
"config_name": "text2semantic_finetune",
"checkpoint_path": "../text2semantic-400m-v0.2-4k.pth",
"precision": "bfloat16",
"tokenizer": "fishaudio/speech-lm-v1",
"compile": true
},
"vqgan": {
"config_name": "vqgan_pretrain",
"checkpoint_path": "../vqgan-v1.pth"
}
}'