# naive_8_codebook_small.yaml
#
# Model configuration. The top-level `_target_` names the model class and the
# nested `config` mapping names the arguments class plus its field values
# (presumably consumed by Hydra-style `_target_` instantiation -- confirm
# against the loader).
_target_: fish_speech.models.text2semantic.llama.NaiveTransformer
config:
  # NOTE(review): the model class is NaiveTransformer but the arguments class
  # is DualARModelArgs -- confirm this pairing is intentional.
  _target_: fish_speech.models.text2semantic.llama.DualARModelArgs
  # `${max_length}` is an interpolation; `max_length` is not defined in this
  # file and must be supplied by the configuration that includes it.
  max_seq_len: ${max_length}
  vocab_size: 36408
  n_layer: 12
  n_head: 12
  dim: 768
  rope_base: 10000
  # Written with an explicit mantissa dot so that plain YAML 1.1 loaders also
  # read it as a float rather than a string (same value as 1e-5).
  norm_eps: 1.0e-5
  num_codebooks: 8 # number of input/output codebooks
  # NOTE(review): the previous comment read "codebook size 256 + 2 special
  # tokens", which is 258, not 264 -- confirm the intended breakdown
  # (264 = 256 + 8) before relying on it.
  codebook_size: 264