---
# pretrain.yaml
#
# Dataset manifest: `datasets` is a list with one entry per corpus directory.
# Every entry carries the same five keys:
#   root               - directory of the corpus, relative path
#   source             - name of the corpus the entry belongs to
#   languages          - language codes attached to the entry
#                        (NOTE(review): exact use is defined by the consumer)
#   extension          - file suffix to look for under `root`
#                        (NOTE(review): presumably the transcript files - confirm)
#   group_parent_level - how files are grouped (i.e. speaker), see below
datasets:
  - root: data/StarRail/Chinese
    source: StarRail
    languages: [ZH, EN]
    extension: .lab
    # This controls the grouping of the dataset (i.e. speaker)
    # 1 means we use the parent folder of the file as the group name
    group_parent_level: 1

  - root: data/StarRail/English
    source: StarRail
    languages: [EN]
    extension: .lab
    group_parent_level: 1

  - root: data/StarRail/Japanese
    source: StarRail
    languages: [JP, EN]
    extension: .lab
    group_parent_level: 1

  - root: data/Genshin/Chinese
    source: Genshin
    languages: [ZH, EN]
    extension: .lab
    group_parent_level: 1

  - root: data/Genshin/English
    source: Genshin
    languages: [EN]
    extension: .lab
    group_parent_level: 1

  - root: data/Genshin/Japanese
    source: Genshin
    languages: [JP, EN]
    extension: .lab
    group_parent_level: 1

  - root: data/LibriTTS_R
    source: LibriTTS_R
    languages: [EN]
    extension: .normalized.txt
    # NOTE(review): presumably 2 selects the folder two levels above the file
    # as the group name - confirm against the loader.
    group_parent_level: 2

  - root: data/WenetSpeech
    source: WenetSpeech
    languages: [ZH, EN]
    extension: .txt
    group_parent_level: 1