Ver Fonte

Update vqgan config & baseline

Lengyue há 2 anos atrás
pai
commit
e596deff1f

+ 1 - 0
fish_speech/configs/vqgan_pretrain.yaml

@@ -126,3 +126,4 @@ callbacks:
       - encoder
       - decoder
       - quantizer
+      - discriminator

+ 8 - 0
fish_speech/models/vqgan/lit_module.py

@@ -213,6 +213,14 @@ class VQGAN(L.LightningModule):
             prog_bar=False,
             logger=True,
         )
+        self.log(
+            "train/generator/loss_adv",
+            loss_adv,
+            on_step=True,
+            on_epoch=False,
+            prog_bar=False,
+            logger=True,
+        )
 
 
         # Generator backward
         optim_g.zero_grad()

+ 2 - 2
tools/vqgan/inference.py

@@ -26,7 +26,7 @@ OmegaConf.register_new_resolver("eval", eval)
 @click.option(
     "--input-path",
     "-i",
-    default="data/sft/Rail_ZH/三月七/1fe0cc6fc3fe3e6d.wav",
+    default="test.wav",
     type=click.Path(exists=True, path_type=Path),
 )
 @click.option(
@@ -36,7 +36,7 @@ OmegaConf.register_new_resolver("eval", eval)
 @click.option(
     "--checkpoint-path",
     "-ckpt",
-    default="results/vq-group-fsq-8x1024-wn-20x512-cond-e009/checkpoints/step_000355000.ckpt",
+    default="checkpoints/vq-gan-group-fsq-8x1024-wn-20x768-30kh.pth",
 )
 def main(input_path, output_path, config_name, checkpoint_path):
     with initialize(version_base="1.3", config_path="../../fish_speech/configs"):