|
@@ -61,7 +61,7 @@
|
|
|
"# !set HF_ENDPOINT=https://hf-mirror.com\n",
|
|
"# !set HF_ENDPOINT=https://hf-mirror.com\n",
|
|
|
"# !export HF_ENDPOINT=https://hf-mirror.com \n",
|
|
"# !export HF_ENDPOINT=https://hf-mirror.com \n",
|
|
|
"\n",
|
|
"\n",
|
|
|
- "!huggingface-cli download fishaudio/fish-speech-1.2-sft --local-dir checkpoints/fish-speech-1.2-sft/"
|
|
|
|
|
|
|
+ "!huggingface-cli download fishaudio/fish-speech-1.4 --local-dir checkpoints/fish-speech-1.4/"
|
|
|
]
|
|
]
|
|
|
},
|
|
},
|
|
|
{
|
|
{
|
|
@@ -84,8 +84,8 @@
|
|
|
"outputs": [],
|
|
"outputs": [],
|
|
|
"source": [
|
|
"source": [
|
|
|
"!python tools/webui.py \\\n",
|
|
"!python tools/webui.py \\\n",
|
|
|
- " --llama-checkpoint-path checkpoints/fish-speech-1.2-sft \\\n",
|
|
|
|
|
- " --decoder-checkpoint-path checkpoints/fish-speech-1.2-sft/firefly-gan-vq-fsq-4x1024-42hz-generator.pth \\\n",
|
|
|
|
|
|
|
+ " --llama-checkpoint-path checkpoints/fish-speech-1.4 \\\n",
|
|
|
|
|
+ " --decoder-checkpoint-path checkpoints/fish-speech-1.4/firefly-gan-vq-fsq-8x1024-21hz-generator.pth \\\n",
|
|
|
" # --compile"
|
|
" # --compile"
|
|
|
]
|
|
]
|
|
|
},
|
|
},
|
|
@@ -122,7 +122,7 @@
|
|
|
"\n",
|
|
"\n",
|
|
|
"!python tools/vqgan/inference.py \\\n",
|
|
"!python tools/vqgan/inference.py \\\n",
|
|
|
" -i {src_audio} \\\n",
|
|
" -i {src_audio} \\\n",
|
|
|
- " --checkpoint-path \"checkpoints/fish-speech-1.2-sft/firefly-gan-vq-fsq-4x1024-42hz-generator.pth\"\n",
|
|
|
|
|
|
|
+ " --checkpoint-path \"checkpoints/fish-speech-1.4/firefly-gan-vq-fsq-8x1024-21hz-generator.pth\"\n",
|
|
|
"\n",
|
|
"\n",
|
|
|
"from IPython.display import Audio, display\n",
|
|
"from IPython.display import Audio, display\n",
|
|
|
"audio = Audio(filename=\"fake.wav\")\n",
|
|
"audio = Audio(filename=\"fake.wav\")\n",
|
|
@@ -158,7 +158,7 @@
|
|
|
" --text \"hello world\" \\\n",
|
|
" --text \"hello world\" \\\n",
|
|
|
" --prompt-text \"The text corresponding to reference audio\" \\\n",
|
|
" --prompt-text \"The text corresponding to reference audio\" \\\n",
|
|
|
" --prompt-tokens \"fake.npy\" \\\n",
|
|
" --prompt-tokens \"fake.npy\" \\\n",
|
|
|
- " --checkpoint-path \"checkpoints/fish-speech-1.2-sft\" \\\n",
|
|
|
|
|
|
|
+ " --checkpoint-path \"checkpoints/fish-speech-1.4\" \\\n",
|
|
|
" --num-samples 2\n",
|
|
" --num-samples 2\n",
|
|
|
" # --compile"
|
|
" # --compile"
|
|
|
]
|
|
]
|
|
@@ -182,7 +182,7 @@
|
|
|
"source": [
|
|
"source": [
|
|
|
"!python tools/vqgan/inference.py \\\n",
|
|
"!python tools/vqgan/inference.py \\\n",
|
|
|
" -i \"codes_0.npy\" \\\n",
|
|
" -i \"codes_0.npy\" \\\n",
|
|
|
- " --checkpoint-path \"checkpoints/fish-speech-1.2-sft/firefly-gan-vq-fsq-4x1024-42hz-generator.pth\"\n",
|
|
|
|
|
|
|
+ " --checkpoint-path \"checkpoints/fish-speech-1.4/firefly-gan-vq-fsq-8x1024-21hz-generator.pth\"\n",
|
|
|
"\n",
|
|
"\n",
|
|
|
"from IPython.display import Audio, display\n",
|
|
"from IPython.display import Audio, display\n",
|
|
|
"audio = Audio(filename=\"fake.wav\")\n",
|
|
"audio = Audio(filename=\"fake.wav\")\n",
|