Spaces:

alexnasa
/

HuMo_local

Running on Zero

App Files Files Community

alex committed on Oct 15

Commit

33e0319

1 Parent(s): e04a1e2

unused parameter removed

Browse files

Files changed (1) hide show

app.py +18 -15

app.py CHANGED Viewed

@@ -114,7 +114,7 @@ def restore_inductor_cache_from_hub(repo_id: str, filename: str = "torch_compile
 # restore_inductor_cache_from_hub("alexnasa/humo-compiled")
-def get_duration(prompt_text, steps, image_file, audio_file_path, tea_cache_l1_thresh, max_duration, session_id):
     return calculate_required_time(steps, max_duration)
@@ -125,7 +125,7 @@ def calculate_required_time(steps, max_duration):
     max_duration_duration_mapping = {
         1: 8,
         2: 8,
-        3: 11,
         4: 20,
     }
     each_step_s = max_duration_duration_mapping[max_duration]
@@ -147,7 +147,7 @@ def update_required_time(steps, max_duration):
     return get_required_time_string(steps, max_duration)
-def generate_scene(prompt_text, steps, image_paths, audio_file_path, tea_cache_l1_thresh, max_duration = 3, session_id = None):
     print(image_paths)
     prompt_text_check = (prompt_text or "").strip()
@@ -157,7 +157,7 @@ def generate_scene(prompt_text, steps, image_paths, audio_file_path, tea_cache_l
     if not audio_file_path and not image_paths:
         raise gr.Error("Please provide a reference image or a lipsync audio.")
-    return run_pipeline(prompt_text, steps, image_paths, audio_file_path, tea_cache_l1_thresh, max_duration, session_id)
 def upload_inductor_cache_to_hub(
     repo_id: str,
@@ -211,7 +211,7 @@ def upload_inductor_cache_to_hub(
 @spaces.GPU(duration=get_duration)
-def run_pipeline(prompt_text, steps, image_paths, audio_file_path, tea_cache_l1_thresh = 0.0, max_duration = 3, session_id = None):
     if session_id is None:
         session_id = uuid.uuid4().hex
@@ -266,7 +266,7 @@ def run_pipeline(prompt_text, steps, image_paths, audio_file_path, tea_cache_l1_
         height,
         steps,
         frames = int(duration_frame_mapping[max_duration]),
-        tea_cache_l1_thresh = tea_cache_l1_thresh,
     )
     # Return resulting video path
@@ -347,7 +347,6 @@ with gr.Blocks(css=css) as demo:
         max_duration = gr.Slider(minimum=2, maximum=4, value=default_max_duration, step=1, label="Max Duration")
         steps_input = gr.Slider(minimum=10, maximum=50, value=default_steps, step=5, label="Diffusion Steps")
-        tea_cache_l1_thresh = gr.Slider(minimum=0.0, maximum=1.0, value=0.0, step=0.01, label="Cache", visible=False)
@@ -386,32 +385,36 @@ with gr.Blocks(css=css) as demo:
                     "A handheld tracking shot follows a female through a science lab. Her determined eyes are locked straight ahead. The clip is in black and white and patchy as she is explaining something to someone standing opposite her",
                     10,
                     ["./examples/naomi.png"],
-                    "./examples/science.wav",
                 ],
                 [
                     "A reddish-brown haired  woman sits pensively against swirling blue-and-white brushstrokes, dressed in a blue coat and dark waistcoat. The artistic backdrop and her thoughtful pose evoke a Post-Impressionist style in a studio-like setting.",
                     10,
                     ["./examples/art.png"],
-                    "./examples/art.wav",
                 ],
                 [
-                    "A handheld tracking shot follows a female warrior walking through a cave. Her determined eyes are locked straight ahead. She speaks with intensity.",
-                    10,
                     ["./examples/naomi.png"],
-                    "./examples/dream.mp3",
                 ],
                 [
                     "A woman with long, wavy dark hair looking at a person sitting opposite her whilst holding a book, wearing a leather jacket, long-sleeved jacket with a semi purple color one seen on a photo. Warm, window-like light bathes her figure, highlighting the outfit's elegant design and her graceful movements.",
                     30,
                     ["./examples/amber.png", "./examples/jacket.png"],
-                    "./examples/fictional.wav",
                 ],
             ],
-            inputs=[prompt_tb, steps_input, img_input, audio_input],
             outputs=[video_output],
             fn=run_pipeline,
             cache_examples=True,
@@ -421,7 +424,7 @@ with gr.Blocks(css=css) as demo:
         run_btn.click(
             fn=generate_scene,
-            inputs=[prompt_tb, steps_input, img_input, audio_input, tea_cache_l1_thresh, max_duration, session_state],
             outputs=[video_output],
         )

 # restore_inductor_cache_from_hub("alexnasa/humo-compiled")
+def get_duration(prompt_text, steps, image_file, audio_file_path, max_duration, session_id):
     return calculate_required_time(steps, max_duration)
     max_duration_duration_mapping = {
         1: 8,
         2: 8,
+        3: 12,
         4: 20,
     }
     each_step_s = max_duration_duration_mapping[max_duration]
     return get_required_time_string(steps, max_duration)
+def generate_scene(prompt_text, steps, image_paths, audio_file_path, max_duration = 3, session_id = None):
     print(image_paths)
     prompt_text_check = (prompt_text or "").strip()
     if not audio_file_path and not image_paths:
         raise gr.Error("Please provide a reference image or a lipsync audio.")
+    return run_pipeline(prompt_text, steps, image_paths, audio_file_path, max_duration, session_id)
 def upload_inductor_cache_to_hub(
     repo_id: str,
 @spaces.GPU(duration=get_duration)
+def run_pipeline(prompt_text, steps, image_paths, audio_file_path, max_duration = 3, session_id = None):
     if session_id is None:
         session_id = uuid.uuid4().hex
         height,
         steps,
         frames = int(duration_frame_mapping[max_duration]),
+        tea_cache_l1_thresh = 0.0,
     )
     # Return resulting video path
         max_duration = gr.Slider(minimum=2, maximum=4, value=default_max_duration, step=1, label="Max Duration")
         steps_input = gr.Slider(minimum=10, maximum=50, value=default_steps, step=5, label="Diffusion Steps")
                     "A handheld tracking shot follows a female through a science lab. Her determined eyes are locked straight ahead. The clip is in black and white and patchy as she is explaining something to someone standing opposite her",
                     10,
                     ["./examples/naomi.png"],
+                    "./examples/science.wav",
+                    3,
                 ],
                 [
                     "A reddish-brown haired  woman sits pensively against swirling blue-and-white brushstrokes, dressed in a blue coat and dark waistcoat. The artistic backdrop and her thoughtful pose evoke a Post-Impressionist style in a studio-like setting.",
                     10,
                     ["./examples/art.png"],
+                    "./examples/art.wav",
+                    2,
                 ],
                 [
+                    "A handheld tracking shot follows a female warrior walking through a cave. Her determined eyes are locked straight ahead as she grips a blazing torch tightly in her hand. She speaks with intensity.",
+                    5,
                     ["./examples/naomi.png"],
+                    "./examples/dream.mp3",
+                    5,
                 ],
                 [
                     "A woman with long, wavy dark hair looking at a person sitting opposite her whilst holding a book, wearing a leather jacket, long-sleeved jacket with a semi purple color one seen on a photo. Warm, window-like light bathes her figure, highlighting the outfit's elegant design and her graceful movements.",
                     30,
                     ["./examples/amber.png", "./examples/jacket.png"],
+                    "./examples/fictional.wav",
+                    5,
                 ],
             ],
+            inputs=[prompt_tb, steps_input, img_input, audio_input, max_duration],
             outputs=[video_output],
             fn=run_pipeline,
             cache_examples=True,
         run_btn.click(
             fn=generate_scene,
+            inputs=[prompt_tb, steps_input, img_input, audio_input, max_duration, session_state],
             outputs=[video_output],
         )