|
@@ -11,6 +11,7 @@ from threading import Timer
|
|
from whisper_asr import get_whisper_asr
|
|
from whisper_asr import get_whisper_asr
|
|
from gpt_tag import request_gpt
|
|
from gpt_tag import request_gpt
|
|
from config import set_config
|
|
from config import set_config
|
|
|
|
+from audio_process import get_wav
|
|
from log import Log
|
|
from log import Log
|
|
config_ = set_config()
|
|
config_ = set_config()
|
|
log_ = Log()
|
|
log_ = Log()
|
|
@@ -23,15 +24,16 @@ def get_asr(video_id, download_folder, asr_folder):
|
|
video_type = filename.split('.')[-1]
|
|
video_type = filename.split('.')[-1]
|
|
if video_type in ['mp4', 'm3u8']:
|
|
if video_type in ['mp4', 'm3u8']:
|
|
video_file = os.path.join(video_folder, filename)
|
|
video_file = os.path.join(video_folder, filename)
|
|
|
|
+ audio_path = get_wav(video_file)
|
|
# 1. asr识别
|
|
# 1. asr识别
|
|
- asr_res_initial = get_whisper_asr(video=video_file)
|
|
|
|
|
|
+ asr_res_initial = get_whisper_asr(audio=audio_path)
|
|
print(video_id, asr_res_initial)
|
|
print(video_id, asr_res_initial)
|
|
# 2. 识别结果写入文件
|
|
# 2. 识别结果写入文件
|
|
asr_path = os.path.join(asr_folder, f"{video_id}.txt")
|
|
asr_path = os.path.join(asr_folder, f"{video_id}.txt")
|
|
with open(asr_path, 'w', encoding='utf-8') as wf:
|
|
with open(asr_path, 'w', encoding='utf-8') as wf:
|
|
wf.write(asr_res_initial)
|
|
wf.write(asr_res_initial)
|
|
# 将处理过的视频进行删除
|
|
# 将处理过的视频进行删除
|
|
- shutil.rmtree(os.path.join(download_folder, video_id))
|
|
|
|
|
|
+ # shutil.rmtree(os.path.join(download_folder, video_id))
|
|
break
|
|
break
|
|
|
|
|
|
|
|
|