Spaces:

rambo12
/

text-to-video-generator

Running

File size: 17,325 Bytes

db8251f

import gradio as gr
import logging
import tempfile
import os

# Set up logging
logging.basicConfig(level=logging.INFO)
logger = logging.getLogger(__name__)

class TextToVideoGenerator:
    def __init__(self):
        self.device = "cpu"  # Simplified for testing
        
        # Available models - including the advanced Wan2.1 model
        self.models = {
            "damo-vilab/text-to-video-ms-1.7b": {
                "name": "DAMO Text-to-Video MS-1.7B",
                "description": "Fast and efficient text-to-video model",
                "max_frames": 16,
                "fps": 8,
                "quality": "Good",
                "speed": "Fast"
            },
            "cerspense/zeroscope_v2_XL": {
                "name": "Zeroscope v2 XL",
                "description": "High-quality text-to-video model",
                "max_frames": 24,
                "fps": 6,
                "quality": "Excellent",
                "speed": "Medium"
            },
            "Wan-AI/Wan2.1-T2V-14B": {
                "name": "Wan2.1-T2V-14B (SOTA)",
                "description": "State-of-the-art text-to-video model with 14B parameters",
                "max_frames": 32,
                "fps": 8,
                "quality": "SOTA",
                "speed": "Medium",
                "resolutions": ["480P", "720P"],
                "features": ["Chinese & English text", "High motion dynamics", "Best quality"]
            }
        }
        
        # Voice options (gTTS only supports language, not gender/age)
        self.voices = {
            "Default (English)": "en"
        }
    
    def generate_video(self, prompt, model_id, num_frames=16, fps=8, num_inference_steps=25, guidance_scale=7.5, seed=None, resolution="480P", voice_script="", voice_type="Default (English)", add_voice=True):
        """Generate video from text prompt with optional voice (DEMO VERSION)"""
        try:
            # This is a demo version that simulates video generation
            logger.info(f"DEMO: Would generate video with prompt: {prompt}")
            logger.info(f"DEMO: Model: {model_id}, Frames: {num_frames}, FPS: {fps}")
            
            if add_voice and voice_script.strip():
                logger.info(f"DEMO: Would add voice narration: {voice_script}")
            
            # Create a dummy video file for demonstration
            dummy_video_path = "demo_video.mp4"
            
            # For demo purposes, return a success message
            return dummy_video_path, f"DEMO: Video generation completed! (This is a test version - no actual video generated)"
            
        except Exception as e:
            logger.error(f"Error in demo video generation: {str(e)}")
            return None, f"Demo error: {str(e)}"
    
    def get_available_models(self):
        """Get list of available models"""
        return list(self.models.keys())
    
    def get_model_info(self, model_id):
        """Get information about a specific model"""
        if model_id in self.models:
            return self.models[model_id]
        return None
    
    def get_available_voices(self):
        """Get list of available voices"""
        return list(self.voices.keys())

# Initialize the generator
generator = TextToVideoGenerator()

def create_interface():
    """Create Gradio interface"""
    
    def generate_video_interface(prompt, model_id, num_frames, fps, num_inference_steps, guidance_scale, seed, resolution, voice_script, voice_type, add_voice):
        if not prompt.strip():
            return None, "Please enter a prompt"
        
        return generator.generate_video(
            prompt=prompt,
            model_id=model_id,
            num_frames=num_frames,
            fps=fps,
            num_inference_steps=num_inference_steps,
            guidance_scale=guidance_scale,
            seed=seed,
            resolution=resolution,
            voice_script=voice_script,
            voice_type=voice_type,
            add_voice=add_voice
        )
    
    # Custom CSS for professional styling
    custom_css = """
    .gradio-container {
        max-width: 1200px !important;
        margin: 0 auto !important;
    }
    
    .header {
        text-align: center;
        padding: 2rem 0;
        background: linear-gradient(135deg, #667eea 0%, #764ba2 100%);
        color: white;
        border-radius: 15px;
        margin-bottom: 2rem;
    }
    
    .header h1 {
        font-size: 2.5rem;
        font-weight: 700;
        margin: 0;
        text-shadow: 2px 2px 4px rgba(0,0,0,0.3);
    }
    
    .header p {
        font-size: 1.1rem;
        margin: 0.5rem 0 0 0;
        opacity: 0.9;
    }
    
    .feature-card {
        background: white;
        border-radius: 10px;
        padding: 1.5rem;
        box-shadow: 0 4px 6px rgba(0,0,0,0.1);
        margin-bottom: 1rem;
        border-left: 4px solid #667eea;
    }
    
    .feature-card h3 {
        color: #333;
        margin: 0 0 0.5rem 0;
        font-size: 1.2rem;
    }
    
    .feature-card p {
        color: #666;
        margin: 0;
        font-size: 0.9rem;
    }
    
    .model-info {
        background: #f8f9fa;
        border-radius: 8px;
        padding: 1rem;
        border: 1px solid #e9ecef;
    }
    
    .model-info h4 {
        color: #495057;
        margin: 0 0 0.5rem 0;
        font-size: 1rem;
    }
    
    .model-info p {
        color: #6c757d;
        margin: 0.25rem 0;
        font-size: 0.85rem;
    }
    
    .generate-btn {
        background: linear-gradient(135deg, #667eea 0%, #764ba2 100%) !important;
        border: none !important;
        color: white !important;
        font-weight: 600 !important;
        padding: 1rem 2rem !important;
        border-radius: 10px !important;
        font-size: 1.1rem !important;
        transition: all 0.3s ease !important;
    }
    
    .generate-btn:hover {
        transform: translateY(-2px) !important;
        box-shadow: 0 6px 12px rgba(102, 126, 234, 0.4) !important;
    }
    
    .example-card {
        background: #f8f9fa;
        border-radius: 8px;
        padding: 1rem;
        margin: 0.5rem 0;
        border: 1px solid #e9ecef;
        cursor: pointer;
        transition: all 0.2s ease;
    }
    
    .example-card:hover {
        background: #e9ecef;
        transform: translateX(5px);
    }
    
    .status-box {
        background: #e3f2fd;
        border: 1px solid #2196f3;
        border-radius: 8px;
        padding: 1rem;
    }
    
    .pricing-info {
        background: linear-gradient(135deg, #ffecd2 0%, #fcb69f 100%);
        border-radius: 10px;
        padding: 1rem;
        text-align: center;
        margin: 1rem 0;
    }
    
    .pricing-info h4 {
        color: #d84315;
        margin: 0 0 0.5rem 0;
    }
    
    .pricing-info p {
        color: #bf360c;
        margin: 0;
        font-size: 0.9rem;
    }
    
    .demo-notice {
        background: linear-gradient(135deg, #fff3cd 0%, #ffeaa7 100%);
        border: 1px solid #ffc107;
        border-radius: 8px;
        padding: 1rem;
        margin: 1rem 0;
        text-align: center;
    }
    """
    
    # Create interface
    with gr.Blocks(title="AI Video Creator Pro - DEMO", theme=gr.themes.Soft(), css=custom_css) as interface:
        
        # Professional Header
        with gr.Group(elem_classes="header"):
            gr.Markdown("""
            # 🎬 AI Video Creator Pro
            ### Transform Your Ideas Into Stunning Videos with AI-Powered Generation
            """)
        
        # Demo Notice
        with gr.Group(elem_classes="demo-notice"):
            gr.Markdown("""
            ## 🚧 DEMO VERSION
            This is a demonstration of the professional UI. Video generation is simulated for testing purposes.
            The full version with actual AI video generation will be available once dependencies are resolved.
            """)
        
        with gr.Row():
            with gr.Column(scale=2):
                # Main Input Section
                with gr.Group(elem_classes="feature-card"):
                    gr.Markdown("## 🎯 Video Generation")
                    
                    prompt = gr.Textbox(
                        label="📝 Video Description",
                        placeholder="Describe the video you want to create... (e.g., 'A majestic dragon soaring through a mystical forest with glowing mushrooms')",
                        lines=3,
                        max_lines=5,
                        container=True
                    )
                    
                    with gr.Row():
                        model_id = gr.Dropdown(
                            choices=generator.get_available_models(),
                            value=generator.get_available_models()[0],
                            label="🤖 AI Model",
                            info="Choose the AI model for video generation",
                            container=True
                        )
                        
                        resolution = gr.Dropdown(
                            choices=["480P", "720P"],
                            value="480P",
                            label="📐 Resolution (Wan2.1 only)",
                            info="Select video resolution",
                            visible=False,
                            container=True
                        )
                    
                    with gr.Row():
                        num_frames = gr.Slider(
                            minimum=8,
                            maximum=32,
                            value=16,
                            step=1,
                            label="🎞️ Video Length (Frames)",
                            info="More frames = longer video"
                        )
                        
                        fps = gr.Slider(
                            minimum=4,
                            maximum=12,
                            value=8,
                            step=1,
                            label="⚡ FPS",
                            info="Frames per second"
                        )
                    
                    with gr.Row():
                        num_inference_steps = gr.Slider(
                            minimum=10,
                            maximum=50,
                            value=25,
                            step=1,
                            label="🎨 Quality Steps",
                            info="More steps = better quality but slower"
                        )
                        
                        guidance_scale = gr.Slider(
                            minimum=1.0,
                            maximum=20.0,
                            value=7.5,
                            step=0.5,
                            label="🎯 Guidance Scale",
                            info="Higher values = more prompt adherence"
                        )
                    
                    seed = gr.Number(
                        label="🎲 Seed (Optional)",
                        value=None,
                        info="Set for reproducible results",
                        container=True
                    )
                
                # Voice Section
                with gr.Group(elem_classes="feature-card"):
                    gr.Markdown("## 🎤 Voice & Audio")
                    
                    with gr.Row():
                        add_voice = gr.Checkbox(
                            label="🎵 Add Voice Narration",
                            value=True,
                            info="Enable to add professional voice-over"
                        )
                        
                        voice_type = gr.Dropdown(
                            choices=generator.get_available_voices(),
                            value="Default (English)",
                            label="🗣️ Voice Type",
                            info="Select the voice for narration",
                            container=True
                        )
                    
                    voice_script = gr.Textbox(
                        label="📜 Narration Script (Optional)",
                        placeholder="Enter your narration script here... (Leave blank to use video description)",
                        lines=2,
                        max_lines=3,
                        info="If left blank, the video description will be used as narration",
                        container=True
                    )
                
                # Generate Button
                generate_btn = gr.Button("🚀 Generate Professional Video (DEMO)", variant="primary", size="lg", elem_classes="generate-btn")
                
                # Output Section
                with gr.Group(elem_classes="feature-card"):
                    gr.Markdown("## 📺 Generated Video")
                    status_text = gr.Textbox(label="📊 Status", interactive=False, elem_classes="status-box")
                    video_output = gr.Video(label="🎬 Your Video", elem_classes="status-box")
            
            with gr.Column(scale=1):
                # Model Information
                with gr.Group(elem_classes="model-info"):
                    gr.Markdown("## 🤖 AI Model Details")
                    model_info = gr.JSON(label="Current Model Specifications", elem_classes="model-info")
                
                # Pricing Information
                with gr.Group(elem_classes="pricing-info"):
                    gr.Markdown("## 💰 Pricing")
                    gr.Markdown("""
                    **Free Tier:** 5 videos per day
                    
                    **Pro Plan:** $9.99/month
                    - Unlimited videos
                    - Priority processing
                    - HD quality
                    - Advanced features
                    
                    **Enterprise:** Contact us
                    """)
                
                # Examples
                with gr.Group():
                    gr.Markdown("## 💡 Inspiration Examples")
                    examples = [
                        ["A beautiful sunset over the ocean with waves crashing on the shore"],
                        ["A cat playing with a ball of yarn in a cozy living room"],
                        ["A futuristic city with flying cars and neon lights"],
                        ["A butterfly emerging from a cocoon in a garden"],
                        ["A rocket launching into space with fire and smoke"],
                        ["Two anthropomorphic cats in comfy boxing gear and bright gloves fight intensely on a spotlighted stage"],
                        ["A majestic dragon soaring through a mystical forest with glowing mushrooms"]
                    ]
                    gr.Examples(
                        examples=examples,
                        inputs=prompt,
                        label="Click to try these examples"
                    )
                
                # Features
                with gr.Group():
                    gr.Markdown("## ✨ Features")
                    gr.Markdown("""
                    🎬 **Multiple AI Models**
                    - State-of-the-art video generation
                    - Quality vs speed options
                    
                    🎤 **Professional Voice-Over**
                    - Multiple voice types
                    - Custom narration scripts
                    
                    🎨 **Advanced Controls**
                    - Quality settings
                    - Resolution options
                    - Reproducible results
                    
                    ⚡ **Fast Processing**
                    - GPU acceleration
                    - Optimized pipelines
                    """)
        
        # Event handlers
        generate_btn.click(
            fn=generate_video_interface,
            inputs=[prompt, model_id, num_frames, fps, num_inference_steps, guidance_scale, seed, resolution, voice_script, voice_type, add_voice],
            outputs=[video_output, status_text]
        )
        
        # Update model info when model changes
        def update_model_info(model_id):
            info = generator.get_model_info(model_id)
            return info
        
        # Show/hide resolution selector based on model
        def update_resolution_visibility(model_id):
            if model_id == "Wan-AI/Wan2.1-T2V-14B":
                return gr.Dropdown(visible=True)
            else:
                return gr.Dropdown(visible=False)
        
        model_id.change(
            fn=update_model_info,
            inputs=model_id,
            outputs=model_info
        )
        
        model_id.change(
            fn=update_resolution_visibility,
            inputs=model_id,
            outputs=resolution
        )
        
        # Load initial model info
        interface.load(lambda: generator.get_model_info(generator.get_available_models()[0]), outputs=model_info)
    
    return interface

# Create and launch the interface
interface = create_interface()
interface.launch(
    server_name="0.0.0.0",
    server_port=7861,
    share=True,
    show_error=True
)