1234567891011121314151617181920212223242526272829303132 |
- import os
def geberateAudioPath(filepath, orifilepath,
                      data_path="/Users/tzld/Downloads/LJSpeech-1.1/wavs/"):
    """Rewrite the audio-path column of a ``|``-separated filelist.

    Each non-blank line of ``orifilepath`` is split at its first ``|``.
    The directory part of the first field is replaced with ``data_path``
    (only the text after the last ``/`` is kept), and everything after
    the first ``|`` is copied through unchanged, including the line
    ending.

    Args:
        filepath: Path of the filelist to write. It is truncated if it
            already exists, so it must not be the same file as
            ``orifilepath``.
        orifilepath: Path of the existing filelist to read.
        data_path: Prefix placed in front of each audio file name. It is
            concatenated as-is, so it should end with a path separator.

    Raises:
        OSError: If either file cannot be opened.
    """
    # Open the input first so that a missing source file does not leave
    # an empty output file behind.
    with open(orifilepath, 'r', encoding='utf-8') as source:
        with open(filepath, 'w', encoding='utf-8') as target:
            for line in source:
                # Blank lines carry no record; skip them instead of
                # failing on the missing fields.
                if not line.strip():
                    continue
                # Split only at the first separator so that every
                # remaining field (and the newline) survives, however
                # many '|' characters the rest of the line contains.
                audio_path, separator, remainder = line.partition('|')
                filename = audio_path.split('/')[-1]
                target.write(data_path + filename + separator + remainder)
if __name__ == '__main__':
    # (existing filelist, rewritten filelist) pairs, handled in order:
    # the training list first, then the validation list.
    filelist_pairs = (
        ('./ljs_audiopaths_text_sid_train_filelist.txt',
         './ljs_audiopaths_text_sid_train_filelist_new.txt'),
        ('./ljs_audiopaths_text_sid_val_filelist.txt',
         './ljs_audiopaths_text_sid_val_filelist_new.txt'),
    )
    for source_list, rewritten_list in filelist_pairs:
        # geberateAudioPath takes the output path first, then the input.
        geberateAudioPath(rewritten_list, source_list)
- #
- #
- # origin_tarin_data_df["ID"] = origin_tarin_data_df.apply(lambda s:data_path + s['ID'].split('/')[-1],axis=1)
- # origin_val_data_df["ID"] = origin_tarin_data_df.apply(lambda s:data_path + s['ID'].split('/')[-1],axis=1)
- #
- # origin_tarin_data_df.to_csv("./ljs_audiopaths_text_sid_train_filelist_new.txt",sep="|",header=False,index=False)
- # origin_val_data_df.to_csv("./ljs_audiopaths_text_sid_val_filelist_new.txt",sep="|",header=False,index=False)
|