EchoMimic

Sleeping

App Files Files Community

fantaxy committed on Jul 29, 2024

Commit

279f990

verified ·

1 Parent(s): 5d91330

Update webgui.py

Browse files

Files changed (1) hide show

webgui.py +17 -6

webgui.py CHANGED Viewed

@@ -28,6 +28,7 @@ import argparse
 import gradio as gr
 import huggingface_hub
 huggingface_hub.snapshot_download(
     repo_id='BadToBest/EchoMimic',
@@ -155,8 +156,8 @@ def select_face(det_bboxes, probs):
     sorted_bboxes = sorted(filtered_bboxes, key=lambda x:(x[3]-x[1]) * (x[2] - x[0]), reverse=True)
     return sorted_bboxes[0]
-def process_video(uploaded_img, uploaded_audio, width, height, length, seed, facemask_dilation_ratio, facecrop_dilation_ratio, context_frames, context_overlap, cfg, steps, sample_rate, fps, device):
     if seed is not None and seed > -1:
         generator = torch.manual_seed(seed)
     else:
@@ -176,7 +177,7 @@ def process_video(uploaded_img, uploaded_audio, width, height, length, seed, fac
         r_pad = int((re - rb) * facemask_dilation_ratio)
         c_pad = int((ce - cb) * facemask_dilation_ratio)
         face_mask[rb - r_pad : re + r_pad, cb - c_pad : ce + c_pad] = 255
         #### face crop
         r_pad_crop = int((re - rb) * facecrop_dilation_ratio)
         c_pad_crop = int((ce - cb) * facecrop_dilation_ratio)
@@ -188,7 +189,7 @@ def process_video(uploaded_img, uploaded_audio, width, height, length, seed, fac
     ref_image_pil = Image.fromarray(face_img[:, :, [2, 1, 0]])
     face_mask_tensor = torch.Tensor(face_mask).to(dtype=weight_dtype, device="cuda").unsqueeze(0).unsqueeze(0).unsqueeze(0) / 255.0
     video = pipe(
         ref_image_pil,
         uploaded_audio,
@@ -212,9 +213,19 @@ def process_video(uploaded_img, uploaded_audio, width, height, length, seed, fac
     video_clip = VideoFileClip(str(output_video_path))
     audio_clip = AudioFileClip(uploaded_audio)
-    final_output_path = save_dir / "output_video_with_audio.mp4"
-    video_clip = video_clip.set_audio(audio_clip)
-    video_clip.write_videofile(str(final_output_path), codec="libx264", audio_codec="aac")
     return final_output_path

 import gradio as gr
 import huggingface_hub
+from moviepy.editor import VideoFileClip, AudioFileClip, ImageClip
 huggingface_hub.snapshot_download(
     repo_id='BadToBest/EchoMimic',
     sorted_bboxes = sorted(filtered_bboxes, key=lambda x:(x[3]-x[1]) * (x[2] - x[0]), reverse=True)
     return sorted_bboxes[0]
+def process_video(uploaded_img, uploaded_audio, width, height, length, seed, facemask_dilation_ratio, facecrop_dilation_ratio, context_frames, context_overlap, cfg, steps, sample_rate, fps, device):
     if seed is not None and seed > -1:
         generator = torch.manual_seed(seed)
     else:
         r_pad = int((re - rb) * facemask_dilation_ratio)
         c_pad = int((ce - cb) * facemask_dilation_ratio)
         face_mask[rb - r_pad : re + r_pad, cb - c_pad : ce + c_pad] = 255
         #### face crop
         r_pad_crop = int((re - rb) * facecrop_dilation_ratio)
         c_pad_crop = int((ce - cb) * facecrop_dilation_ratio)
     ref_image_pil = Image.fromarray(face_img[:, :, [2, 1, 0]])
     face_mask_tensor = torch.Tensor(face_mask).to(dtype=weight_dtype, device="cuda").unsqueeze(0).unsqueeze(0).unsqueeze(0) / 255.0
     video = pipe(
         ref_image_pil,
         uploaded_audio,
     video_clip = VideoFileClip(str(output_video_path))
     audio_clip = AudioFileClip(uploaded_audio)
+    # Load the watermark image and resize it
+    watermark = (ImageClip("watermark.png")  # 워터마크 이미지 경로
+                 .set_duration(video_clip.duration)
+                 .resize(height=50)  # 워터마크 크기 조정
+                 .margin(right=8, bottom=8, opacity=0)  # 마진 및 투명도 설정
+                 .set_pos(("right", "bottom")))  # 위치 설정
+    final_clip = video_clip.set_audio(audio_clip).set_position(("center", "center")).fx(vfx.composite, watermark)
+    # Place the output in the same directory as APP.PY
+    final_output_path = Path(__file__).parent / "output_video_with_audio.mp4"
+    final_clip.write_videofile(str(final_output_path), codec="libx264", audio_codec="aac")
     return final_output_path