Spaces:

VIDraft
/

Portrait-Animation

Runtime error

App Files Community

openfree committed on Feb 10

Commit

244a523

verified ·

1 Parent(s): 729c163

Update app.py

Browse files

Files changed (1) hide show

app.py +10 -13

app.py CHANGED Viewed

@@ -8,7 +8,7 @@ from sonic import Sonic
 from PIL import Image
 import torch
-# Initialize the model
 cmd = (
     'python3 -m pip install "huggingface_hub[cli]"; '
     'huggingface-cli download LeonJoe13/Sonic --local-dir  checkpoints; '
@@ -23,17 +23,15 @@ def get_md5(content):
     md5hash = hashlib.md5(content)
     return md5hash.hexdigest()
-@spaces.GPU(duration=300)  # Increased duration to handle longer videos
 def get_video_res(img_path, audio_path, res_video_path, dynamic_scale=1.0):
     expand_ratio = 0.5
     min_resolution = 512
-    fps = 25  # 원하는 프레임 레이트 설정 (예: 25 fps)
-    # 오디오 파일로부터 실제 오디오 길이를 구하고, 그에 맞춰 추론 단계를 계산합니다.
     audio = AudioSegment.from_file(audio_path)
     duration = len(audio) / 1000.0  # 초 단위
-    # 오디오 길이에 따른 프레임 수 계산 (예: 5초 -> 5*25 = 125 단계)
-    inference_steps = int(duration * fps)
     print(f"Audio duration: {duration} seconds, using inference_steps: {inference_steps}")
     face_info = pipe.preprocess(img_path, expand_ratio=expand_ratio)
@@ -45,16 +43,15 @@ def get_video_res(img_path, audio_path, res_video_path, dynamic_scale=1.0):
         img_path = crop_image_path
         os.makedirs(os.path.dirname(res_video_path), exist_ok=True)
-        # Sonic.process() 호출 시, 동적으로 계산된 inference_steps를 전달합니다.
         pipe.process(
-            img_path,
-            audio_path,
-            res_video_path,
             min_resolution=min_resolution,
             inference_steps=inference_steps,
             dynamic_scale=dynamic_scale
         )
-        # 생성된 비디오 파일 경로 반환
         return res_video_path
     else:
         return -1
@@ -107,7 +104,7 @@ def process_sonic(image, audio, dynamic_scale):
         print(f"Generating new video with dynamic scale: {dynamic_scale}")
         return get_video_res(image_path, audio_path, res_video_path, dynamic_scale)
-# 예시 데이터를 위한 dummy 함수 (필요시 실제 예시 데이터로 수정)
 def get_example():
     return []
@@ -204,5 +201,5 @@ with gr.Blocks(css=css) as demo:
         </div>
     """)
-# 공개 링크를 생성하려면 share=True 옵션 사용
 demo.launch(share=True)

 from PIL import Image
 import torch
+# 모델 초기화
 cmd = (
     'python3 -m pip install "huggingface_hub[cli]"; '
     'huggingface-cli download LeonJoe13/Sonic --local-dir  checkpoints; '
     md5hash = hashlib.md5(content)
     return md5hash.hexdigest()
+@spaces.GPU(duration=300)  # 긴 비디오 처리를 위해 duration 300초로 설정
 def get_video_res(img_path, audio_path, res_video_path, dynamic_scale=1.0):
     expand_ratio = 0.5
     min_resolution = 512
+    inference_steps = 25  # 2초 분량의 비디오(25 프레임)로 고정
+    # 오디오 길이(참고용) 출력
     audio = AudioSegment.from_file(audio_path)
     duration = len(audio) / 1000.0  # 초 단위
     print(f"Audio duration: {duration} seconds, using inference_steps: {inference_steps}")
     face_info = pipe.preprocess(img_path, expand_ratio=expand_ratio)
         img_path = crop_image_path
         os.makedirs(os.path.dirname(res_video_path), exist_ok=True)
+        # 고정된 inference_steps(25)로 비디오 생성
         pipe.process(
+            img_path,
+            audio_path,
+            res_video_path,
             min_resolution=min_resolution,
             inference_steps=inference_steps,
             dynamic_scale=dynamic_scale
         )
         return res_video_path
     else:
         return -1
         print(f"Generating new video with dynamic scale: {dynamic_scale}")
         return get_video_res(image_path, audio_path, res_video_path, dynamic_scale)
+# 예시 데이터를 위한 dummy 함수 (필요시 실제 예시 데이터를 추가하세요)
 def get_example():
     return []
         </div>
     """)
+# 공개 링크 생성: share=True
 demo.launch(share=True)