Spaces:

ginigen
/

Nano-Banana-Video

Paused

App Files Files Community

ginipick committed on Aug 28

Commit

e48246c

verified ·

1 Parent(s): cea104c

Update app.py

Browse files

Files changed (1) hide show

app.py +322 -353

app.py CHANGED Viewed

@@ -7,18 +7,12 @@ from io import BytesIO
 import time
 import tempfile
 import base64
 import numpy as np
 import random
 import gc
-# GPU 관련 임포트는 나중에 조건부로 처리
-try:
-    import torch
-    TORCH_AVAILABLE = True
-except ImportError:
-    TORCH_AVAILABLE = False
-    print("Warning: PyTorch not available. Video generation will be disabled.")
 # ===========================
 # Configuration
 # ===========================
@@ -27,51 +21,23 @@ except ImportError:
 os.environ['REPLICATE_API_TOKEN'] = os.getenv('REPLICATE_API_TOKEN')
 # Video Model Configuration
-VIDEO_MODEL_ID = "Wan-AI/Wan2.2-I2V-A14B-Diffusers"
-LANDSCAPE_WIDTH = 832
-LANDSCAPE_HEIGHT = 480
 MAX_SEED = np.iinfo(np.int32).max
-FIXED_FPS = 16
 MIN_FRAMES_MODEL = 8
-MAX_FRAMES_MODEL = 81
-MIN_DURATION = round(MIN_FRAMES_MODEL/FIXED_FPS, 1)
-MAX_DURATION = round(MAX_FRAMES_MODEL/FIXED_FPS, 1)
-default_prompt_i2v = "make this image come alive, cinematic motion, smooth animation"
-default_negative_prompt = "static, still, no motion, frozen"
-# ===========================
-# Initialize Video Pipeline (Lazy Loading)
-# ===========================
-video_pipe = None
-video_pipeline_ready = False
-def lazy_import_video_dependencies():
-    """Lazy import video dependencies only when needed"""
-    global video_pipe, video_pipeline_ready
-    if not TORCH_AVAILABLE:
-        raise gr.Error("PyTorch is not installed. Video generation is not available.")
-    try:
-        # Try to import video pipeline dependencies
-        from diffusers.pipelines.wan.pipeline_wan_i2v import WanImageToVideoPipeline
-        from diffusers.models.transformers.transformer_wan import WanTransformer3DModel
-        from diffusers.utils.export_utils import export_to_video
-        return WanImageToVideoPipeline, WanTransformer3DModel, export_to_video
-    except ImportError as e:
-        print(f"Warning: Video dependencies not available: {e}")
-        return None, None, None
 # ===========================
 # Image Processing Functions
 # ===========================
 def upload_image_to_hosting(image):
-    """Upload image to multiple hosting services with fallback"""
-    # Method 1: Try imgbb.com
     try:
         buffered = BytesIO()
         image.save(buffered, format="PNG")
@@ -84,7 +50,7 @@ def upload_image_to_hosting(image):
                 'key': '6d207e02198a847aa98d0a2a901485a5',
                 'image': img_base64,
             },
-            timeout=10
         )
         if response.status_code == 200:
@@ -92,23 +58,9 @@ def upload_image_to_hosting(image):
             if data.get('success'):
                 return data['data']['url']
     except Exception as e:
-        print(f"imgbb upload failed: {e}")
-    # Method 2: Try 0x0.st
-    try:
-        buffered = BytesIO()
-        image.save(buffered, format="PNG")
-        buffered.seek(0)
-        files = {'file': ('image.png', buffered, 'image/png')}
-        response = requests.post("https://0x0.st", files=files, timeout=10)
-        if response.status_code == 200:
-            return response.text.strip()
-    except Exception as e:
-        print(f"0x0.st upload failed: {e}")
-    # Method 3: Fallback to base64
     buffered = BytesIO()
     image.save(buffered, format="PNG")
     buffered.seek(0)
@@ -116,193 +68,179 @@ def upload_image_to_hosting(image):
     return f"data:image/png;base64,{img_base64}"
 def process_images(prompt, image1, image2=None):
-    """Process uploaded images with Replicate API"""
     if not image1:
         return None, "Please upload at least one image", None
     if not os.getenv('REPLICATE_API_TOKEN'):
-        return None, "Please set REPLICATE_API_TOKEN", None
     try:
-        image_urls = []
-        # Upload images
         url1 = upload_image_to_hosting(image1)
-        image_urls.append(url1)
-        if image2:
-            url2 = upload_image_to_hosting(image2)
-            image_urls.append(url2)
-        # Run the model (using a placeholder model name - replace with actual)
-        # Note: "google/nano-banana" doesn't exist - replace with actual model
         output = replicate.run(
             "stability-ai/sdxl:39ed52f2a78e934b3ba6e2a89f5b1c712de7dfea535525255b1aa35c5565e08b",
             input={
-                "prompt": prompt,
-                "image": url1 if len(image_urls) == 1 else None,
                 "width": 1024,
-                "height": 1024
             }
         )
-        if output is None:
-            return None, "No output received", None
-        # Get the generated image
-        img = None
-        # Handle different output formats
-        if isinstance(output, list) and len(output) > 0:
-            output_url = output[0]
-        elif isinstance(output, str):
-            output_url = output
-        else:
-            output_url = str(output)
-        if output_url:
-            response = requests.get(output_url, timeout=30)
             if response.status_code == 200:
                 img = Image.open(BytesIO(response.content))
-        if img:
-            return img, "✨ Image generated successfully!", img
-        else:
-            return None, "Could not process output", None
     except Exception as e:
-        return None, f"Error: {str(e)[:200]}", None
 # ===========================
-# Video Generation Functions (Simplified)
 # ===========================
 def resize_image_for_video(image: Image.Image) -> Image.Image:
     """Resize image for video generation"""
-    target_aspect = LANDSCAPE_WIDTH / LANDSCAPE_HEIGHT
-    width, height = image.size
-    in_aspect = width / height
-    if in_aspect > target_aspect:
-        new_width = round(height * target_aspect)
-        left = (width - new_width) // 2
-        image = image.crop((left, 0, left + new_width, height))
-    else:
-        new_height = round(width / target_aspect)
-        top = (height - new_height) // 2
-        image = image.crop((0, top, width, top + new_height))
-    return image.resize((LANDSCAPE_WIDTH, LANDSCAPE_HEIGHT), Image.LANCZOS)
-def generate_video(
     input_image,
     prompt,
-    steps=4,
     negative_prompt=default_negative_prompt,
-    duration_seconds=1.5,
-    guidance_scale=1,
-    guidance_scale_2=1,
     seed=42,
     randomize_seed=False,
 ):
-    """Generate a video from an input image (simplified version)"""
-    if input_image is None:
-        raise gr.Error("Please generate or upload an image first.")
-    if not TORCH_AVAILABLE:
-        raise gr.Error("Video generation is not available. PyTorch is not installed.")
     try:
-        # Import dependencies
-        video_deps = lazy_import_video_dependencies()
-        if not all(video_deps):
-            raise gr.Error("Video generation dependencies are not available.")
-        WanImageToVideoPipeline, WanTransformer3DModel, export_to_video = video_deps
-        global video_pipe
-        # Simple initialization without complex optimizations
-        if video_pipe is None:
-            print("Initializing video pipeline (simplified)...")
-            # Clear GPU memory first
-            if TORCH_AVAILABLE:
-                torch.cuda.empty_cache()
-                gc.collect()
-            # Basic pipeline loading
-            try:
-                video_pipe = WanImageToVideoPipeline.from_pretrained(
-                    VIDEO_MODEL_ID,
-                    torch_dtype=torch.float16 if TORCH_AVAILABLE else None,
-                    low_cpu_mem_usage=True,
-                    device_map="auto"
-                )
-                print("Video pipeline loaded")
-            except Exception as e:
-                print(f"Failed to load video pipeline: {e}")
-                raise gr.Error("Could not load video model. Please try again later.")
-        # Prepare video generation
-        num_frames = min(17, int(round(duration_seconds * FIXED_FPS)))  # Limit frames
-        num_frames = ((num_frames - 1) // 4) * 4 + 1  # Ensure divisible by 4
-        current_seed = random.randint(0, MAX_SEED) if randomize_seed else int(seed)
         # Resize image
         resized_image = resize_image_for_video(input_image)
-        # Generate video with minimal settings
-        print(f"Generating {num_frames} frames...")
-        if TORCH_AVAILABLE:
-            generator = torch.Generator(device="cuda" if torch.cuda.is_available() else "cpu").manual_seed(current_seed)
-        else:
-            generator = None
-        output_frames_list = video_pipe(
-            image=resized_image,
-            prompt=prompt,
-            negative_prompt=negative_prompt,
-            height=LANDSCAPE_HEIGHT,
-            width=LANDSCAPE_WIDTH,
-            num_frames=num_frames,
-            guidance_scale=float(guidance_scale),
-            num_inference_steps=int(steps),
-            generator=generator,
-        ).frames[0]
-        # Save video
-        with tempfile.NamedTemporaryFile(suffix=".mp4", delete=False) as tmpfile:
-            video_path = tmpfile.name
-        export_to_video(output_frames_list, video_path, fps=FIXED_FPS)
-        return video_path, current_seed, f"🎬 Video generated! ({num_frames} frames)"
     except Exception as e:
-        if TORCH_AVAILABLE:
             torch.cuda.empty_cache()
             gc.collect()
-        error_msg = str(e)[:200]
-        if "out of memory" in error_msg.lower():
-            return None, seed, "GPU memory exceeded. Try reducing duration and steps."
-        return None, seed, f"Error: {error_msg}"
 # ===========================
-# Simple CSS
 # ===========================
 css = """
 .gradio-container {
-    max-width: 1200px;
-    margin: 0 auto;
 }
 .header-container {
-    background: linear-gradient(135deg, #ffd93d 0%, #ffb347 100%);
     padding: 2rem;
-    border-radius: 12px;
     margin-bottom: 2rem;
     text-align: center;
 }
@@ -310,197 +248,228 @@ css = """
     font-size: 2.5rem;
     font-weight: bold;
     color: #2d3436;
-    margin: 0;
 }
 .subtitle {
     color: #2d3436;
-    font-size: 1rem;
     margin-top: 0.5rem;
 }
 """
 # ===========================
-# Gradio Interface (Simplified)
 # ===========================
-def create_demo():
-    with gr.Blocks(css=css, theme=gr.themes.Soft()) as demo:
-        # Shared state
-        generated_image_state = gr.State(None)
-        gr.HTML("""
-            <div class="header-container">
-                <h1 class="logo-text">🍌 Nano Banana + Video</h1>
-                <p class="subtitle">AI-Powered Image Generation with Video Creation</p>
-            </div>
-        """)
-        with gr.Tabs():
-            # Tab 1: Image Generation
-            with gr.TabItem("🎨 Step 1: Generate Image"):
-                with gr.Row():
-                    with gr.Column():
-                        style_prompt = gr.Textbox(
-                            label="Style Description",
-                            placeholder="Describe your style...",
-                            lines=3,
-                            value="A beautiful landscape in anime style"
-                        )
                         image1 = gr.Image(
                             label="Reference Image (Optional)",
-                            type="pil"
                         )
                         image2 = gr.Image(
-                            label="Secondary Image (Optional)",
-                            type="pil"
-                        )
-                        generate_img_btn = gr.Button(
-                            "Generate Image ✨",
-                            variant="primary"
                         )
-                    with gr.Column():
-                        output_image = gr.Image(
-                            label="Generated Result",
-                            type="pil"
-                        )
-                        img_status = gr.Textbox(
-                            label="Status",
-                            interactive=False,
-                            value="Ready..."
-                        )
-                        send_to_video_btn = gr.Button(
-                            "Send to Video Generation →",
-                            variant="secondary",
-                            visible=False
-                        )
-            # Tab 2: Video Generation
-            with gr.TabItem("🎬 Step 2: Generate Video"):
-                with gr.Row():
-                    with gr.Column():
-                        video_input_image = gr.Image(
-                            type="pil",
-                            label="Input Image"
-                        )
-                        video_prompt = gr.Textbox(
-                            label="Animation Prompt",
-                            value=default_prompt_i2v
-                        )
                         duration_input = gr.Slider(
-                            minimum=0.5,
-                            maximum=2.0,
                             step=0.5,
-                            value=1.0,
                             label="Duration (seconds)"
                         )
                         steps_slider = gr.Slider(
-                            minimum=1,
-                            maximum=8,
-                            step=1,
-                            value=4,
-                            label="Inference Steps"
-                        )
-                        generate_video_btn = gr.Button(
-                            "Generate Video 🎬",
-                            variant="primary"
                         )
-                    with gr.Column():
-                        video_output = gr.Video(
-                            label="Generated Video",
-                            autoplay=True
                         )
-                        video_status = gr.Textbox(
-                            label="Status",
-                            interactive=False,
-                            value="Ready..."
                         )
-        # Event Handlers
-        def on_image_generated(prompt, img1, img2):
-            img, status, state_img = process_images(prompt, img1, img2)
-            if img:
-                return img, status, state_img, gr.update(visible=True)
-            return img, status, state_img, gr.update(visible=False)
-        def send_image_to_video(img):
-            if img:
-                return img, "Image loaded!"
-            return None, "No image to send."
-        # Wire up events
-        generate_img_btn.click(
-            fn=on_image_generated,
-            inputs=[style_prompt, image1, image2],
-            outputs=[output_image, img_status, generated_image_state, send_to_video_btn]
-        )
-        send_to_video_btn.click(
-            fn=send_image_to_video,
-            inputs=[generated_image_state],
-            outputs=[video_input_image, video_status]
-        )
-        # Simplified video generation
-        def generate_video_wrapper(img, prompt, duration, steps):
-            if not TORCH_AVAILABLE:
-                return None, "Video generation requires PyTorch. Please install it first."
-            try:
-                video_path, seed, status = generate_video(
-                    img, prompt, steps=steps, duration_seconds=duration
-                )
-                return video_path, status
-            except Exception as e:
-                return None, f"Error: {str(e)[:100]}"
-        generate_video_btn.click(
-            fn=generate_video_wrapper,
-            inputs=[video_input_image, video_prompt, duration_input, steps_slider],
-            outputs=[video_output, video_status]
-        )
-        return demo
-# ===========================
-# Main Launch
-# ===========================
-if __name__ == "__main__":
-    print("=" * 50)
-    print("Starting Nano Banana + Video Application")
-    print("=" * 50)
-    # Check environment
-    if not os.getenv('REPLICATE_API_TOKEN'):
-        print("Warning: REPLICATE_API_TOKEN not set. Image generation may not work.")
-    if not TORCH_AVAILABLE:
-        print("Warning: PyTorch not available. Video generation will be disabled.")
-        print("To enable video generation, install PyTorch: pip install torch")
-    try:
-        # Create and launch demo
-        demo = create_demo()
-        demo.launch(
-            share=False,  # Set to True if you want a public link
-            server_name="0.0.0.0",
-            server_port=7860,
-            show_error=True,
-            debug=False  # Set to True for debugging
-        )
-    except Exception as e:
-        print(f"Failed to launch application: {e}")
-        print("Please check your environment and dependencies.")

 import time
 import tempfile
 import base64
+import spaces
+import torch
 import numpy as np
 import random
 import gc
 # ===========================
 # Configuration
 # ===========================
 # Re-export the Replicate token only when it is actually configured.
 # os.environ accepts str values only, so assigning os.getenv(...) directly
 # raises TypeError at import time whenever the variable is unset, which would
 # stop the app before the "please set REPLICATE_API_TOKEN" checks can run.
 _replicate_api_token = os.getenv('REPLICATE_API_TOKEN')
 if _replicate_api_token:
     os.environ['REPLICATE_API_TOKEN'] = _replicate_api_token
 # Video Model Configuration
 VIDEO_MODEL_ID = "cjwbw/videocrafter2:02e509c789964be7d70de8d8fef3a6dd18f160b37272bcccc742d5adabb9f38f"  # Using public model
 LANDSCAPE_WIDTH = 512  # Reduced for stability
 LANDSCAPE_HEIGHT = 320  # Reduced for stability
 # Largest value representable as a signed 32-bit integer; upper bound for seeds.
 MAX_SEED = np.iinfo(np.int32).max
 FIXED_FPS = 8  # Reduced FPS
 MIN_FRAMES_MODEL = 8
 MAX_FRAMES_MODEL = 32  # Reduced max frames
 # Default prompts pre-filled in the video tab.
 default_prompt_i2v = "make this image come alive, smooth animation"
 default_negative_prompt = "static, still, blurry, low quality"
 # ===========================
 # Image Processing Functions
 # ===========================
 def upload_image_to_hosting(image):
+    """Upload image to hosting service"""
     try:
         buffered = BytesIO()
         image.save(buffered, format="PNG")
                 'key': '6d207e02198a847aa98d0a2a901485a5',
                 'image': img_base64,
             },
+            timeout=30
         )
         if response.status_code == 200:
             if data.get('success'):
                 return data['data']['url']
     except Exception as e:
+        print(f"Upload failed: {e}")
+    # Fallback to base64
     buffered = BytesIO()
     image.save(buffered, format="PNG")
     buffered.seek(0)
     return f"data:image/png;base64,{img_base64}"
 def process_images(prompt, image1, image2=None):
     """Generate an image with the Replicate-hosted SDXL model.

     Args:
         prompt: Text description; quality keywords are appended before it is
             sent to the model.
         image1: Required reference image. It is uploaded to the image host,
             but the resulting URL is not part of the model input.
         image2: Accepted for interface compatibility; not used here.

     Returns:
         ``(image, status_message, image)`` on success, otherwise
         ``(None, status_message, None)``.
     """
     # Guard clauses: both preconditions must hold before any network call.
     if not image1:
         return None, "Please upload at least one image", None
     if not os.getenv('REPLICATE_API_TOKEN'):
         return None, "Please set REPLICATE_API_TOKEN in Space settings", None
     try:
         # The upload still happens, although its URL is not forwarded below.
         url1 = upload_image_to_hosting(image1)
         model_input = {
             "prompt": prompt + ", high quality, detailed",
             "negative_prompt": "low quality, blurry, distorted",
             "width": 1024,
             "height": 1024,
             "num_inference_steps": 25,
         }
         output = replicate.run(
             "stability-ai/sdxl:39ed52f2a78e934b3ba6e2a89f5b1c712de7dfea535525255b1aa35c5565e08b",
             input=model_input,
         )
         # Only a non-empty list result is treated as usable.
         if not (output and isinstance(output, list) and len(output) > 0):
             return None, "Could not process output", None
         response = requests.get(output[0], timeout=30)
         if response.status_code != 200:
             return None, "Could not process output", None
         img = Image.open(BytesIO(response.content))
         return img, "✨ Image generated successfully!", img
     except Exception as exc:
         detail = str(exc)
         # Error messages mentioning "trial" are reported as an API limit.
         if "trial" not in detail.lower():
             return None, f"Error: {detail[:200]}", None
         return None, "Replicate API limit reached. Please try again later.", None
 # ===========================
+# Video Generation Functions
 # ===========================
 def resize_image_for_video(image: Image.Image) -> Image.Image:
     """Return *image* scaled to the fixed video frame size.

     RGBA inputs are first flattened onto a white RGB canvas, using the alpha
     band as the paste mask. The result is then stretched to
     ``(LANDSCAPE_WIDTH, LANDSCAPE_HEIGHT)`` with LANCZOS resampling; the
     source aspect ratio is not preserved.
     """
     if image.mode == 'RGBA':
         alpha_band = image.split()[3]
         canvas = Image.new('RGB', image.size, (255, 255, 255))
         canvas.paste(image, mask=alpha_band)
         image = canvas
     target_size = (LANDSCAPE_WIDTH, LANDSCAPE_HEIGHT)
     return image.resize(target_size, Image.LANCZOS)
def _replicate_output_url(output):
    """Return the download URL carried by a ``replicate.run`` result, or None.

    Handles a plain URL string, an object exposing ``url`` (as an attribute or
    as a zero-argument callable), and a list/tuple of either, in which case
    the first element is used.
    """
    if isinstance(output, (list, tuple)):
        output = output[0] if output else None
    if not output:
        return None
    if isinstance(output, str):
        return output
    url_attr = getattr(output, 'url', None)
    if url_attr is not None:
        # File outputs expose `url` as a plain string attribute; calling it
        # unconditionally raises "'str' object is not callable".
        return url_attr() if callable(url_attr) else url_attr
    return str(output)


# GPU function with proper decorator
@spaces.GPU(duration=60)
def generate_video_gpu(
    input_image,
    prompt,
    steps=25,
    negative_prompt=default_negative_prompt,
    duration_seconds=2.0,
    seed=42,
    randomize_seed=False,
):
    """Generate a short video from an image through the Replicate API.

    Args:
        input_image: PIL image to animate; ``None`` yields an error status.
        prompt: Text description of the desired motion.
        steps: Step count forwarded to the model as an int.
        negative_prompt: Accepted for interface compatibility; it is not
            forwarded to the model.
        duration_seconds: Requested length, capped at 3 seconds.
        seed: Seed used when ``randomize_seed`` is false.
        randomize_seed: When true, draw a seed from ``[0, MAX_SEED]``.

    Returns:
        ``(video_path, seed_used, status_message)`` on success, otherwise
        ``(None, seed, status_message)``.
    """
    if input_image is None:
        return None, seed, "Please provide an input image"
    try:
        # Clear GPU memory
        if torch.cuda.is_available():
            torch.cuda.empty_cache()
            gc.collect()
        # Resize image
        resized_image = resize_image_for_video(input_image)
        # Upload the in-memory image directly. No intermediate PNG is written:
        # nothing ever read that file and it was never removed.
        img_url = upload_image_to_hosting(resized_image)
        current_seed = random.randint(0, MAX_SEED) if randomize_seed else int(seed)
        # Use Replicate for video generation
        print("Generating video with Replicate...")
        # NOTE(review): confirm these input keys against the model's published
        # input schema; they are passed through unchanged.
        output = replicate.run(
            VIDEO_MODEL_ID,
            input={
                "prompt": prompt,
                "image": img_url,
                "steps": int(steps),
                "fps": FIXED_FPS,
                "seconds": min(duration_seconds, 3),  # Limit to 3 seconds
                "seed": current_seed
            }
        )
        video_url = _replicate_output_url(output)
        if video_url:
            # Download video
            response = requests.get(video_url, timeout=60)
            if response.status_code == 200:
                # delete=False: the file must outlive this function so the UI
                # can serve it from the returned path.
                with tempfile.NamedTemporaryFile(suffix=".mp4", delete=False) as tmp_video:
                    tmp_video.write(response.content)
                return tmp_video.name, current_seed, "🎬 Video generated successfully!"
        return None, seed, "Failed to generate video"
    except Exception as e:
        error_msg = str(e)
        if "out of memory" in error_msg.lower():
            torch.cuda.empty_cache()
            gc.collect()
            return None, seed, "GPU memory exceeded. Try reducing duration."
        return None, seed, f"Error: {error_msg[:200]}"
# Entry point wired to the "Generate Video" button
def generate_video(
    input_image,
    prompt,
    steps=25,
    negative_prompt=default_negative_prompt,
    duration_seconds=2.0,
    seed=42,
    randomize_seed=False,
):
    """Check for the Replicate token, then delegate to ``generate_video_gpu``.

    Returns the ``(video_path, seed, status_message)`` tuple produced by
    ``generate_video_gpu``, or ``(None, seed, message)`` when the
    ``REPLICATE_API_TOKEN`` environment variable is missing or empty.
    """
    token_present = bool(os.getenv('REPLICATE_API_TOKEN'))
    if token_present:
        # Arguments are forwarded positionally, in signature order.
        call_args = (
            input_image,
            prompt,
            steps,
            negative_prompt,
            duration_seconds,
            seed,
            randomize_seed,
        )
        return generate_video_gpu(*call_args)
    return None, seed, "Please set REPLICATE_API_TOKEN in Space settings"
# ===========================
# Minimal GPU-decorated stub used at startup
# ===========================
@spaces.GPU(duration=1)
def dummy_gpu_function():
    """Return a fixed status string; performs no work of its own."""
    status = "GPU initialized"
    return status
 # ===========================
+# CSS Styling
 # ===========================
 css = """
 .gradio-container {
+    max-width: 1200px !important;
+    margin: 0 auto !important;
 }
 .header-container {
+    background: linear-gradient(135deg, #ffd93d, #ffb347);
     padding: 2rem;
+    border-radius: 15px;
     margin-bottom: 2rem;
     text-align: center;
 }
     font-size: 2.5rem;
     font-weight: bold;
     color: #2d3436;
 }
 .subtitle {
     color: #2d3436;
+    font-size: 1.1rem;
     margin-top: 0.5rem;
 }
+.gr-button {
+    font-size: 1rem !important;
+    padding: 12px 24px !important;
+}
+.gr-button-primary {
+    background: linear-gradient(135deg, #ffd93d, #ffb347) !important;
+    border: none !important;
+}
+.gr-button-secondary {
+    background: linear-gradient(135deg, #667eea, #764ba2) !important;
+    color: white !important;
+    border: none !important;
+}
 """
 # ===========================
+# Gradio Interface
 # ===========================
with gr.Blocks(theme=gr.themes.Soft(), css=css) as demo:
    # The GPU-decorated stub is called while the layout is being built and its
    # return value is stored in a State component.
    startup_status = gr.State(dummy_gpu_function())
    # Holds the latest generated image so it can be handed to the video tab.
    generated_image_state = gr.State(None)

    gr.HTML("""
        <div class="header-container">
            <h1 class="logo-text">🍌 Nano Banana + Video</h1>
            <p class="subtitle">AI Image Generation with Video Creation</p>
            <p style="color: #636e72; font-size: 0.9rem; margin-top: 10px;">
                ⚠️ Note: Add REPLICATE_API_TOKEN in Space Settings > Repository secrets
            </p>
        </div>
    """)

    with gr.Tabs():
        # ---- Tab 1: image generation ----
        with gr.TabItem("🎨 Step 1: Generate Image"):
            with gr.Row():
                # Left column: prompt, optional reference images, trigger button.
                with gr.Column(scale=1):
                    style_prompt = gr.Textbox(
                        value="A beautiful fantasy landscape with mountains and a river, studio ghibli style",
                        placeholder="Describe what you want to create...",
                        label="Image Description",
                        lines=3,
                    )
                    with gr.Row():
                        image1 = gr.Image(type="pil", height=200, label="Reference Image (Optional)")
                        image2 = gr.Image(type="pil", height=200, label="Style Reference (Optional)")
                    generate_img_btn = gr.Button("🎨 Generate Image", size="lg", variant="primary")
                # Right column: result, status line, hand-off button.
                with gr.Column(scale=1):
                    output_image = gr.Image(type="pil", height=400, label="Generated Result")
                    img_status = gr.Textbox(
                        value="Ready to generate...",
                        interactive=False,
                        label="Status",
                    )
                    # Hidden until an image has been generated successfully.
                    send_to_video_btn = gr.Button(
                        "➡️ Send to Video Generation",
                        visible=False,
                        variant="secondary",
                    )

        # ---- Tab 2: video generation ----
        with gr.TabItem("🎬 Step 2: Generate Video"):
            gr.Markdown("### Transform your image into a video")
            with gr.Row():
                # Left column: source image and generation settings.
                with gr.Column(scale=1):
                    video_input_image = gr.Image(height=300, label="Input Image", type="pil")
                    video_prompt = gr.Textbox(
                        value=default_prompt_i2v,
                        label="Animation Description",
                        lines=2,
                    )
                    with gr.Row():
                        duration_input = gr.Slider(
                            label="Duration (seconds)",
                            value=2.0,
                            minimum=1.0,
                            maximum=3.0,
                            step=0.5,
                        )
                        steps_slider = gr.Slider(
                            label="Quality Steps",
                            value=25,
                            minimum=10,
                            maximum=50,
                            step=5,
                        )
                    with gr.Row():
                        video_seed = gr.Slider(
                            value=42,
                            minimum=0,
                            maximum=MAX_SEED,
                            step=1,
                            label="Seed",
                        )
                        randomize_seed = gr.Checkbox(value=True, label="Random seed")
                    video_negative_prompt = gr.Textbox(
                        value=default_negative_prompt,
                        label="Negative Prompt",
                        lines=2,
                    )
                    generate_video_btn = gr.Button("🎬 Generate Video", size="lg", variant="primary")
                # Right column: rendered video and status line.
                with gr.Column(scale=1):
                    video_output = gr.Video(height=400, autoplay=True, label="Generated Video")
                    video_status = gr.Textbox(
                        value="Ready to generate video...",
                        interactive=False,
                        label="Status",
                    )

    # ---- Event handlers ----
    def on_image_generated(prompt, img1, img2):
        """Run image generation and reveal the hand-off button on success."""
        result_img, message, cached_img = process_images(prompt, img1, img2)
        if not result_img:
            return None, message, None, gr.update(visible=False)
        return result_img, message, cached_img, gr.update(visible=True)

    def send_image_to_video(img):
        """Copy the stored image into the video tab's input, if there is one."""
        return (img, "Image loaded! Ready to generate video.") if img else (None, "No image to send.")

    # ---- Event wiring ----
    generate_img_btn.click(
        fn=on_image_generated,
        inputs=[style_prompt, image1, image2],
        outputs=[output_image, img_status, generated_image_state, send_to_video_btn],
    )
    send_to_video_btn.click(
        fn=send_image_to_video,
        inputs=[generated_image_state],
        outputs=[video_input_image, video_status],
    )
    # Input order must match the positional parameters of generate_video.
    generate_video_btn.click(
        fn=generate_video,
        inputs=[
            video_input_image,
            video_prompt,
            steps_slider,
            video_negative_prompt,
            duration_input,
            video_seed,
            randomize_seed,
        ],
        outputs=[video_output, video_seed, video_status],
    )

    # ---- Example prompts (fill the image description box) ----
    gr.Examples(
        label="Example Prompts",
        inputs=[style_prompt],
        examples=[
            ["A majestic castle on a hilltop at sunset, fantasy art style"],
            ["Cute robot in a flower garden, pixar animation style"],
            ["Northern lights over a frozen lake, photorealistic"],
            ["Ancient temple in a jungle, mysterious atmosphere"],
        ],
    )
# Script entry point: print the startup notes, then serve the UI
if __name__ == "__main__":
    for startup_line in (
        "Starting Nano Banana + Video app...",
        "Make sure to set REPLICATE_API_TOKEN in your Space settings!",
    ):
        print(startup_line)
    demo.launch(show_error=True, share=False)