From abe3d6650b73f3a739c33da7969cf12da37693d3 Mon Sep 17 00:00:00 2001 From: fanpt <320622572@qq.com> Date: Mon, 17 Jun 2024 11:33:52 +0800 Subject: [PATCH] =?UTF-8?q?=E8=AE=B0=E5=BD=95=E7=94=9F=E6=88=90=E8=A7=86?= =?UTF-8?q?=E9=A2=91=E7=9A=84=E8=B7=AF=E5=BE=84?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- image_enhancer.py | 4 ++-- silent_video_record.txt | 1 + text_wav.py | 4 ++-- 3 files changed, 5 insertions(+), 4 deletions(-) create mode 100644 silent_video_record.txt diff --git a/image_enhancer.py b/image_enhancer.py index 8dc2eec..85a7663 100644 --- a/image_enhancer.py +++ b/image_enhancer.py @@ -2,7 +2,7 @@ from PIL import Image, ImageEnhance, ImageFilter # 打开图像文件 -image_path = r'E:\SadTalker\examples\source_image\91a54181-568f-4cda-8f3c-0f2c811eaf20.jpg' +image_path = r'E:\SadTalker\examples\source_image\001.png' image = Image.open(image_path) # 创建ImageEnhance.Color对象 @@ -21,4 +21,4 @@ blurred_image = color_image.filter(ImageFilter.GaussianBlur(1)) blurred_image.show() # 保存图像 -blurred_image.save('path_to_save_image.jpg') +blurred_image.save('test.jpg') diff --git a/silent_video_record.txt b/silent_video_record.txt new file mode 100644 index 0000000..38e3c0b --- /dev/null +++ b/silent_video_record.txt @@ -0,0 +1 @@ +7c7b0b462a5a7d798a5b0950601eafeb results/silent-video\001##silent_audio_enhanced_trimmed.mp4 diff --git a/text_wav.py b/text_wav.py index 2a7d93b..47fb8a2 100644 --- a/text_wav.py +++ b/text_wav.py @@ -13,7 +13,7 @@ def text_to_speech(text, output_file): # 请求参数 request_data = { "text": text, - "spk_id": 0, + "spk_id": 3, # 语速 "speed": 0.87, "volume": 1.0, @@ -43,7 +43,7 @@ statements = [ ] # 保存语音的文件名列表 -output_files = [f"E:\\SadTalker\\temp\\wav\\tts_result_{i}.wav" for i in range(len(statements))] +output_files = [f"E:\\SadTalker\\temp\\wav\\3.wav" for i in range(len(statements))] # 发送每个语句的请求并保存音频文件 for i in range(len(statements)):