Commit · 46c3ea1
Parent(s): acd33ac
Commit message: video

Files changed:
- app.py +1 -1
- cinegen/character_engine.py +18 -8
- cinegen/placeholders.py +13 -4
- cinegen/story_engine.py +10 -5
- cinegen/video_engine.py +29 -26
app.py
CHANGED
@@ -16,7 +16,7 @@ STYLE_CHOICES = [
 ]
 
 VIDEO_MODEL_CHOICES = [
-    ("Wan 2.
+    ("Wan 2.2 TI2V (fal-ai)", "Wan-AI/Wan2.2-TI2V-5B"),
     ("LTX Video 0.9.7", "Lightricks/LTX-Video-0.9.7-distilled"),
     ("Hunyuan Video 1.5", "tencent/HunyuanVideo-1.5"),
     ("CogVideoX 5B", "THUDM/CogVideoX-5b"),
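VIDEO_MODEL_CHOICES pairs a display label with a Hugging Face repo ID. A minimal sketch of how such (label, value) tuples typically feed a dropdown, assuming the Space's UI is Gradio-based; the component below is illustrative, not copied from app.py, and the callback receives the repo ID rather than the label:

import gradio as gr

VIDEO_MODEL_CHOICES = [
    ("Wan 2.2 TI2V (fal-ai)", "Wan-AI/Wan2.2-TI2V-5B"),
    ("LTX Video 0.9.7", "Lightricks/LTX-Video-0.9.7-distilled"),
]

with gr.Blocks() as demo:
    # With (label, value) tuples, Gradio shows the label in the UI and passes
    # the value (the model repo ID) to whatever function the dropdown feeds.
    model_dropdown = gr.Dropdown(
        choices=VIDEO_MODEL_CHOICES,
        value=VIDEO_MODEL_CHOICES[0][1],
        label="Video model",
    )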
cinegen/character_engine.py
CHANGED
@@ -29,16 +29,26 @@ class CharacterDesigner:
     def design(self, storyboard: Storyboard) -> Tuple[List[Tuple[str, str]], Storyboard]:
         gallery: List[Tuple[str, str]] = []
         for character in storyboard.characters:
-            image_path = None
-            if self.client:
-                image_path = self._try_generate(character, storyboard.style)
-            if not image_path:
-                image_path = synthesize_character_card(character, storyboard.style)
-            character.reference_image = image_path
-            caption = f"{character.name} — {character.role}"
-            gallery.append((image_path, caption))
+            gallery.append(self._refresh_reference(character, storyboard.style))
         return gallery, storyboard
 
+    def redesign_character(self, storyboard: Storyboard, character_id: str) -> Tuple[Tuple[str, str], Storyboard]:
+        target = next((char for char in storyboard.characters if char.identifier == character_id), None)
+        if not target:
+            raise ValueError(f"Character {character_id} not found.")
+        card = self._refresh_reference(target, storyboard.style)
+        return card, storyboard
+
+    def _refresh_reference(self, character, style: str) -> Tuple[str, str]:
+        image_path = None
+        if self.client:
+            image_path = self._try_generate(character, style)
+        if not image_path:
+            image_path = synthesize_character_card(character, style)
+        character.reference_image = image_path
+        caption = f"{character.name} — {character.role}"
+        return image_path, caption
+
     def _try_generate(self, character, style: str) -> Optional[str]:  # pragma: no cover
         prompt = (
             f"Create a portrait for {character.name}, a {character.role} in a {style} short film. "
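A hedged usage sketch of the refactor above: design() now builds every card through the shared _refresh_reference helper, and redesign_character re-rolls a single character by its identifier, raising ValueError for an unknown ID. The no-argument construction of CharacterDesigner below is an assumption, as is seeding it with a stub storyboard; without a client it falls back to synthesize_character_card:

from cinegen.character_engine import CharacterDesigner
from cinegen.placeholders import build_stub_storyboard

# Assumed setup: a stub storyboard (identifiers follow the CHAR-<n> pattern)
# and a designer built without any image-generation client.
storyboard = build_stub_storyboard(
    idea="a lighthouse keeper decodes a signal",
    style="Neo-noir",
    scene_count=4,
    inspiration_hint=None,
)
designer = CharacterDesigner()

gallery, storyboard = designer.design(storyboard)                     # one (image_path, caption) per character
card, storyboard = designer.redesign_character(storyboard, "CHAR-1")  # re-roll one character's reference card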
cinegen/placeholders.py
CHANGED
@@ -43,13 +43,22 @@ def _slugify(text: str) -> str:
     return safe or "cinegen"
 
 
+def normalize_scene_count(scene_count: int | float | str | None) -> int:
+    try:
+        value = int(float(scene_count))
+    except (TypeError, ValueError):
+        return 3
+    return max(1, value)
+
+
 def build_stub_storyboard(
     idea: str,
     style: str,
-    scene_count: int,
+    scene_count: int | float | str,
     inspiration_hint: str | None,
 ) -> Storyboard:
-    random.seed(_slugify(idea) + style + str(scene_count))
+    normalized_scenes = normalize_scene_count(scene_count)
+    random.seed(_slugify(idea) + style + str(normalized_scenes))
     title = idea.title() if idea else f"{style} Short"
     synopsis = (
         f"A {style.lower()} short that transforms the idea '{idea or 'mystery cue'}' "
@@ -57,7 +66,7 @@ def build_stub_storyboard(
     )
     characters: List[CharacterSpec] = []
     for idx, (role, desc) in enumerate(CHARACTER_ARCHETYPES):
-        if idx >= 3 and scene_count <= 3:
+        if idx >= 3 and normalized_scenes <= 3:
            break
         identifier = f"CHAR-{idx+1}"
         name = f"{role} {random.choice(string.ascii_uppercase)}"
@@ -75,7 +84,7 @@ def build_stub_storyboard(
     )
 
     scenes: List[SceneBeat] = []
-    for idx in range(scene_count):
+    for idx in range(normalized_scenes):
         label = SCENE_TITLES[idx % len(SCENE_TITLES)]
         scene_id = f"SCENE-{idx+1}"
         visuals = (
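normalize_scene_count is the new guard for UI-supplied scene counts: floats and numeric strings are coerced, missing or unparseable values fall back to 3, and the result is floored at 1. Worked cases, following the function body above:

from cinegen.placeholders import normalize_scene_count

assert normalize_scene_count(5) == 5       # plain int passes through
assert normalize_scene_count(4.7) == 4     # slider-style float is truncated via int(float(...))
assert normalize_scene_count("6") == 6     # numeric strings are accepted
assert normalize_scene_count(None) == 3    # missing value -> default of 3
assert normalize_scene_count("lots") == 3  # unparseable value -> default of 3
assert normalize_scene_count(0) == 1       # clamped to at least one scene
assert normalize_scene_count(-2) == 1      # negative input also clamps to 1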
cinegen/story_engine.py
CHANGED
@@ -5,7 +5,11 @@ import os
 from typing import Any, Dict, Optional
 
 from .models import Storyboard, CharacterSpec, SceneBeat
-from .placeholders import build_stub_storyboard, describe_image_reference
+from .placeholders import (
+    build_stub_storyboard,
+    describe_image_reference,
+    normalize_scene_count,
+)
 
 DEFAULT_STORY_MODEL = os.environ.get("CINEGEN_STORY_MODEL", "gemini-2.5-flash")
 
@@ -32,18 +36,19 @@ class StoryGenerator:
         self,
         idea: str,
         style: str,
-        scene_count: int,
+        scene_count: int | float | str,
         inspiration_path: Optional[str] = None,
     ) -> Storyboard:
+        scene_total = normalize_scene_count(scene_count)
         if not self.client:
             return build_stub_storyboard(
                 idea=idea,
                 style=style,
-                scene_count=scene_count,
+                scene_count=scene_total,
                 inspiration_hint=describe_image_reference(inspiration_path),
             )
 
-        prompt = self._build_prompt(idea, style, scene_count)
+        prompt = self._build_prompt(idea, style, scene_total)
         contents = [prompt]
         parts = self._maybe_add_image_part(inspiration_path)
         contents = parts + contents if parts else contents
@@ -64,7 +69,7 @@ class StoryGenerator:
             return build_stub_storyboard(
                 idea=idea,
                 style=style,
-                scene_count=scene_count,
+                scene_count=scene_total,
                 inspiration_hint=describe_image_reference(inspiration_path),
             )
 
cinegen/video_engine.py
CHANGED
@@ -2,21 +2,28 @@ from __future__ import annotations
 
 import os
 import tempfile
-import time
-from typing import List, Optional, Sequence, Tuple
+from typing import Dict, List, Optional, Sequence, Tuple
 
-import requests
+from huggingface_hub import InferenceClient
 
 from .models import SceneBeat, Storyboard
 from .placeholders import create_placeholder_video
 
 DEFAULT_VIDEO_MODELS = [
-    "Wan-AI/Wan2.
+    "Wan-AI/Wan2.2-TI2V-5B",
     "Lightricks/LTX-Video-0.9.7-distilled",
     "tencent/HunyuanVideo-1.5",
     "THUDM/CogVideoX-5b",
 ]
 
+MODEL_PROVIDER_OVERRIDES: Dict[str, Optional[str]] = {
+    "Wan-AI/Wan2.2-TI2V-5B": "fal-ai",
+}
+
+MIN_FRAMES = 16
+MAX_FRAMES = 240
+FRAMES_PER_SECOND = 8
+
 
 class VideoDirector:
     def __init__(
@@ -59,29 +66,25 @@
     def _call_hf_inference(self, prompt: str, model_id: str, duration: int) -> str:
         if not self.token:
             raise RuntimeError("Missing Hugging Face token")
+        client = self._build_client(model_id)
+        frames = max(MIN_FRAMES, min(MAX_FRAMES, int(duration * FRAMES_PER_SECOND)))
+        video_bytes = client.text_to_video(
+            prompt,
+            model=model_id,
+            num_frames=frames,
+        )
+        tmp_dir = tempfile.mkdtemp(prefix="cinegen-video-")
+        path = os.path.join(tmp_dir, f"{model_id.split('/')[-1]}.mp4")
+        with open(path, "wb") as handle:
+            handle.write(video_bytes)
+        return path
 
-
-
-
-
-
-
-            "inputs": prompt,
-            "parameters": {"duration": duration},
-        }
-        for _ in range(3):
-            response = requests.post(url, headers=headers, json=payload, timeout=600)
-            if response.status_code == 200:
-                tmp_dir = tempfile.mkdtemp(prefix="cinegen-video-")
-                path = os.path.join(tmp_dir, f"{model_id.split('/')[-1]}.mp4")
-                with open(path, "wb") as handle:
-                    handle.write(response.content)
-                return path
-            if response.status_code in (503, 529, 202):
-                time.sleep(5)
-                continue
-            raise RuntimeError(f"{response.status_code}: {response.text[:120]}")
-        raise RuntimeError("Model busy")
+    def _build_client(self, model_id: str) -> InferenceClient:
+        provider = MODEL_PROVIDER_OVERRIDES.get(model_id)
+        kwargs = {"token": self.token}
+        if provider:
+            kwargs["provider"] = provider
+        return InferenceClient(**kwargs)
 
     @staticmethod
     def _compose_prompt(storyboard: Storyboard, scene: SceneBeat) -> str: