mgbam committed on
Commit
e555883
·
verified ·
1 Parent(s): 29c2122

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +245 -218
app.py CHANGED
@@ -3,289 +3,316 @@ import streamlit as st
3
  from core.gemini_handler import GeminiHandler
4
  from core.visual_engine import VisualEngine
5
  from core.prompt_engineering import (
6
- create_story_breakdown_prompt,
7
- create_image_prompt_from_scene_data,
8
- create_narration_script_prompt, # New
9
- create_scene_regeneration_prompt,
10
- create_visual_regeneration_prompt
11
  )
12
  import os
13
 
14
  # --- Configuration & Initialization ---
15
- st.set_page_config(page_title="CineGen AI Ultra", layout="wide", initial_sidebar_state="expanded")
16
 
17
  # --- Global State Variables & API Key Setup ---
18
- # Simplified API Key Loading
19
  def load_api_key(key_name_streamlit, key_name_env):
20
- key = None
21
  try:
22
- if key_name_streamlit in st.secrets: key = st.secrets[key_name_streamlit]
23
- except AttributeError: print(f"st.secrets not available for {key_name_streamlit}.") # Local dev
24
- except Exception as e: print(f"Error accessing st.secrets for {key_name_streamlit}: {e}")
25
  if not key and key_name_env in os.environ: key = os.environ[key_name_env]
26
  return key
27
 
28
- if 'GEMINI_API_KEY' not in st.session_state:
 
29
  st.session_state.GEMINI_API_KEY = load_api_key("GEMINI_API_KEY", "GEMINI_API_KEY")
30
- if not st.session_state.GEMINI_API_KEY: st.error("Gemini API Key missing!"); st.stop()
31
- if 'gemini_handler' not in st.session_state:
 
 
 
 
32
  st.session_state.gemini_handler = GeminiHandler(api_key=st.session_state.GEMINI_API_KEY)
33
-
34
- if 'visual_engine' not in st.session_state:
35
  st.session_state.visual_engine = VisualEngine(output_dir="temp_cinegen_media")
36
- st.session_state.visual_engine.set_openai_api_key(load_api_key("OPENAI_API_KEY", "OPENAI_API_KEY"))
37
- st.session_state.visual_engine.set_elevenlabs_api_key(load_api_key("ELEVENLABS_API_KEY", "ELEVENLABS_API_KEY"))
38
- st.session_state.visual_engine.set_pexels_api_key(load_api_key("PEXELS_API_KEY", "PEXELS_API_KEY"))
 
39
 
40
- # Initialize other session state variables (same as before)
41
  for key, default_val in [
42
- ('story_scenes', []), ('scene_image_prompts', []), ('generated_images_paths', []),
43
- ('video_path', None), ('character_definitions', {}), ('style_reference_description', ""),
44
- ('overall_narration_path', None), ('narration_script_for_display', "")
45
  ]:
46
  if key not in st.session_state: st.session_state[key] = default_val
47
- # --- End State & API Key Setup ---
48
-
49
 
50
- def initialize_new_story(): # Remains same
51
- st.session_state.story_scenes = []
52
- st.session_state.scene_image_prompts = []
53
- st.session_state.generated_images_paths = []
 
54
  st.session_state.video_path = None
55
- st.session_state.overall_narration_path = None
56
- st.session_state.narration_script_for_display = ""
57
 
58
-
59
- def generate_visual_for_scene_wrapper(scene_index, scene_data, is_regeneration=False, version_count=1):
60
- # ... (This helper remains the same, but now `generate_image_visual` in engine has Pexels fallback) ...
61
- # Pass scene_data for Pexels query generation
62
- scene_num_for_log = scene_data.get('scene_number', scene_index + 1)
63
- textual_image_prompt = ""
64
- if is_regeneration and scene_index < len(st.session_state.scene_image_prompts) and st.session_state.scene_image_prompts[scene_index]:
65
- textual_image_prompt = st.session_state.scene_image_prompts[scene_index]
66
- else:
67
- textual_image_prompt = create_image_prompt_from_scene_data(
68
- scene_data, st.session_state.character_definitions, st.session_state.style_reference_description)
69
- if not textual_image_prompt: return False
70
- if scene_index >= len(st.session_state.scene_image_prompts):
71
- while len(st.session_state.scene_image_prompts) <= scene_index: st.session_state.scene_image_prompts.append("")
72
- st.session_state.scene_image_prompts[scene_index] = textual_image_prompt
73
- image_filename = f"scene_{scene_num_for_log}_visual_v{version_count}.png" # DALL-E saves as PNG
74
-
75
- # Pass scene_data to visual engine for Pexels query if DALL-E fails
76
- generated_image_path = st.session_state.visual_engine.generate_image_visual(
77
- textual_image_prompt, scene_data, image_filename
78
  )
79
- while len(st.session_state.generated_images_paths) <= scene_index: st.session_state.generated_images_paths.append(None)
80
- if generated_image_path and os.path.exists(generated_image_path):
81
- st.session_state.generated_images_paths[scene_index] = generated_image_path; return True
 
 
 
 
 
 
 
 
 
 
 
82
  else:
83
- st.session_state.generated_images_paths[scene_index] = None; return False
84
-
85
 
86
  # --- UI Sidebar ---
87
  with st.sidebar:
88
- st.title("🎬 CineGen AI Ultra")
89
- st.markdown("### Creative Controls")
90
- # ... (user_idea, genre, mood, num_scenes - same) ...
91
- user_idea = st.text_area("Core story idea:", "A lone astronaut discovers a glowing alien artifact on Mars, a sense of wonder and slight dread.", height=100, key="user_idea_input")
92
- genre = st.selectbox("Genre:", ["Cyberpunk", "Sci-Fi", "Fantasy", "Noir", "Thriller"], index=0, key="genre_select")
93
- mood = st.selectbox("Mood:", ["Wonder", "Suspenseful", "Mysterious", "Gritty", "Epic"], index=0, key="mood_select")
94
- num_scenes_val = st.slider("Number of Scenes:", 1, 3, 1, key="num_scenes_slider")
95
 
 
 
96
 
97
- if st.button("🚀 Generate Cinematic Masterpiece", type="primary", key="generate_masterpiece_btn", use_container_width=True):
98
- initialize_new_story()
99
- if not user_idea.strip(): st.warning("Please enter a story idea.")
100
  else:
101
- with st.status("Crafting your cinematic vision...", expanded=True) as status_main:
102
- st.write("Phase 1: Gemini is drafting the script... 📜")
103
- # ... (Story generation - same) ...
104
- story_prompt_text = create_story_breakdown_prompt(user_idea, genre, mood, num_scenes_val)
105
  try:
106
- st.session_state.story_scenes = st.session_state.gemini_handler.generate_story_breakdown(story_prompt_text)
107
- status_main.update(label="Script complete! ✅ Generating visuals...", state="running")
108
- num_actual_scenes = len(st.session_state.story_scenes)
109
- st.session_state.scene_image_prompts = [""] * num_actual_scenes
110
- st.session_state.generated_images_paths = [None] * num_actual_scenes
111
- except Exception as e: status_main.update(label=f"Script gen failed: {e}", state="error"); st.stop()
112
-
113
- if st.session_state.story_scenes:
114
- st.write("Phase 2: Creating visuals (DALL-E/Pexels)... 🖼️")
115
- visual_success_count = 0
116
- for i, scene_data in enumerate(st.session_state.story_scenes):
117
- st.write(f" Processing Scene {scene_data.get('scene_number', i + 1)} visuals...")
118
- if generate_visual_for_scene_wrapper(i, scene_data, version_count=1): visual_success_count +=1
119
 
120
- if visual_success_count == 0 :
121
- status_main.update(label="Visual gen failed for all scenes.", state="error", expanded=False); st.stop()
122
 
123
- st.write("Phase 3: Generating narration script with Gemini... 🎀")
124
- narration_prompt = create_narration_script_prompt(st.session_state.story_scenes, mood, genre)
125
- try:
126
- narration_script = st.session_state.gemini_handler.generate_image_prompt(narration_prompt) # Re-use for text gen
127
- st.session_state.narration_script_for_display = narration_script
128
- status_main.update(label="Narration script ready! Generating voice...", state="running")
129
-
130
- st.write("Phase 4: Synthesizing voice with ElevenLabs... 🔊")
131
- st.session_state.overall_narration_path = st.session_state.visual_engine.generate_narration_audio(
132
- narration_script, "overall_narration.mp3"
133
- )
134
- if st.session_state.overall_narration_path:
135
- status_main.update(label="Voiceover generated! ✨", state="running")
136
- else:
137
- status_main.update(label="Voiceover failed, proceeding without.", state="warning")
138
- except Exception as e:
139
- status_main.update(label=f"Narration/Voice gen failed: {e}", state="warning")
140
 
141
- status_main.update(label="All major components generated! Storyboard ready. 🎉", state="complete", expanded=False)
142
 
143
- st.markdown("---") # Advanced Options (Character, Style - same as previous full app.py)
144
- # ... (Character Consistency expander - same)
145
- with st.expander("Character Consistency", expanded=False):
146
- char_name_input = st.text_input("Character Name (e.g., Jax)", key="char_name_adv_input")
147
- char_desc_input = st.text_area("Character Description (e.g., 'male astronaut, rugged, dark short hair, blue eyes, wearing a worn white and orange spacesuit with a cracked visor helmet slung at his hip')", key="char_desc_adv_input", height=120)
148
- if st.button("Add/Update Character", key="add_char_adv_btn"):
149
- if char_name_input and char_desc_input: st.session_state.character_definitions[char_name_input.strip().lower()] = char_desc_input.strip(); st.success(f"Character '{char_name_input.strip()}' defined.")
150
- else: st.warning("Provide both name and description.")
 
 
151
  if st.session_state.character_definitions:
152
- st.caption("Defined Characters:")
153
- for char_key, desc_val in st.session_state.character_definitions.items(): st.markdown(f"**{char_key.title()}:** _{desc_val}_")
154
- # ... (Style Controls expander - same)
155
- with st.expander("Style Controls", expanded=True):
156
- predefined_styles = { "Default (Cinematic Photorealism)": "", "Gritty Neo-Noir": "neo-noir aesthetic, gritty realism, deep shadows...", "Epic Fantasy Matte Painting": "epic fantasy matte painting style...", "Impressionistic Dream": "impressionistic oil painting style...", "Vintage Sci-Fi (70s/80s Film)": "retro sci-fi aesthetic, analog film look...", "Modern Anime Key Visual": "high-detail modern anime key visual style..." }
157
- selected_preset = st.selectbox("Base Style Preset:", options=list(predefined_styles.keys()), key="style_preset_select_adv")
158
- custom_keywords = st.text_area("Add Custom Style Keywords:", key="custom_style_keywords_adv_input", height=80, placeholder="e.g., 'Dutch angle, fisheye lens'")
159
- current_style_desc = st.session_state.style_reference_description
160
- if st.button("Apply & Set Styles", key="apply_styles_adv_btn"):
 
 
161
  final_desc = predefined_styles[selected_preset];
162
  if custom_keywords.strip(): final_desc = f"{final_desc}, {custom_keywords.strip()}" if final_desc else custom_keywords.strip()
163
- st.session_state.style_reference_description = final_desc.strip(); current_style_desc = final_desc.strip()
164
- if current_style_desc: st.success("Styles applied!")
165
- else: st.info("Default style (no specific additions).")
166
- if current_style_desc: st.caption(f"Active style additions: \"{current_style_desc}\"")
167
- else: st.caption("No specific style prompt additions active.")
168
- # Conceptual Voice selection for ElevenLabs
169
  with st.expander("Voice Customization (ElevenLabs)", expanded=False):
170
- # In a real app, you'd fetch voice list from ElevenLabs API if key is present
171
- available_voices_conceptual = ["Rachel", "Adam", "Bella", "Antoni", "Elli", "Josh", "Arnold", "Callum"]
172
- selected_voice = st.selectbox("Choose Narrator Voice:", available_voices_conceptual,
173
- index=available_voices_conceptual.index(st.session_state.visual_engine.elevenlabs_voice_id) if st.session_state.visual_engine.elevenlabs_voice_id in available_voices_conceptual else 0,
174
- key="elevenlabs_voice_select")
175
- if st.button("Set Voice", key="set_voice_btn"):
176
- st.session_state.visual_engine.elevenlabs_voice_id = selected_voice
177
- st.success(f"Narrator voice set to: {selected_voice}")
178
 
179
 
180
  # --- Main Content Area ---
181
- # ... (Header, Scene Iteration, Details, Image Display, Edit Popovers - mostly the same as previous full app.py)
182
- # Key change: Pass character_definitions and style_reference_description to create_visual_regeneration_prompt
183
 
184
- st.header("📝 Cinematic Storyboard")
185
- if st.session_state.narration_script_for_display: # Display narration script if generated
186
- with st.expander("View Generated Narration Script", expanded=False):
187
- st.markdown(st.session_state.narration_script_for_display)
188
 
189
- if not st.session_state.story_scenes:
190
- st.info("Enter your idea in the sidebar and click '🚀 Generate Cinematic Masterpiece' to begin.")
191
  else:
192
- for i, scene_data_display in enumerate(st.session_state.story_scenes):
193
- # ... (scene_num_display, unique_key_part, subheader, columns, Scene Details, Image Display - same as previous)
194
- scene_num_display = scene_data_display.get('scene_number', i + 1); action_summary = scene_data_display.get('key_action', f"scene{i}"); key_part_raw = ''.join(e for e in action_summary if e.isalnum() or e.isspace()); unique_key_part = key_part_raw.replace(" ", "_")[:20]
195
- st.subheader(f"Scene {scene_num_display}: {scene_data_display.get('emotional_beat', 'Untitled Scene')}")
196
- col1, col2 = st.columns([2, 3])
197
- with col1:
198
- with st.expander("Scene Details", expanded=True):
199
- st.markdown(f"**Setting:** {scene_data_display.get('setting_description', 'N/A')}"); st.markdown(f"**Characters:** {', '.join(scene_data_display.get('characters_involved', []))}"); st.markdown(f"**Key Action:** {scene_data_display.get('key_action', 'N/A')}"); st.markdown(f"**Dialogue Snippet:** `\"{scene_data_display.get('dialogue_snippet', '...')}\"`"); st.markdown(f"**Visual Style Suggestion (Gemini):** {scene_data_display.get('visual_style_suggestion', 'N/A')}"); st.markdown(f"**Camera Suggestion (Gemini):** {scene_data_display.get('camera_angle_suggestion', 'N/A')}")
200
- current_textual_prompt = st.session_state.scene_image_prompts[i] if i < len(st.session_state.scene_image_prompts) else None
201
- if current_textual_prompt:
202
- with st.popover("View Full Image Prompt"): st.markdown(f"**Full Textual Prompt Sent to DALL-E:**"); st.code(current_textual_prompt, language='text')
203
- with col2:
204
- current_image_path = st.session_state.generated_images_paths[i] if i < len(st.session_state.generated_images_paths) else None
205
- if current_image_path and os.path.exists(current_image_path): st.image(current_image_path, caption=f"Visual Concept for Scene {scene_num_display}")
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
206
  else:
207
- if st.session_state.story_scenes: st.caption("Visual for this scene is pending or failed.")
208
- with st.popover(f"✏️ Edit Scene {scene_num_display} Script"):
209
- # ... (Script edit logic - same, but uses updated generate_visual_for_scene_wrapper)
210
- feedback_script = st.text_area("Describe script changes:", key=f"script_feedback_{unique_key_part}_{i}", height=100)
211
- if st.button(f"🔄 Update Scene {scene_num_display} Script", key=f"regen_script_btn_{unique_key_part}_{i}"):
212
- if feedback_script:
213
- with st.status(f"Updating Scene {scene_num_display}...", expanded=True) as status_script_regen:
214
- regen_prompt = create_scene_regeneration_prompt(scene_data_display, feedback_script, st.session_state.story_scenes)
 
215
  try:
216
- updated_scene_data = st.session_state.gemini_handler.regenerate_scene_script_details(regen_prompt); st.session_state.story_scenes[i] = updated_scene_data
217
- status_script_regen.update(label="Script updated! Regenerating visual...", state="running")
218
- version = 1
219
- if current_image_path: try: base, _ = os.path.splitext(os.path.basename(current_image_path)); version = int(base.split('_v')[-1]) + 1 if '_v' in base else 2 except: version = 2
220
- if generate_visual_for_scene_wrapper(i, updated_scene_data, is_regeneration=False, version_count=version): status_script_regen.update(label="Scene script & visual updated! 🎉", state="complete", expanded=False)
221
- else: status_script_regen.update(label="Script updated, visual failed.", state="warning", expanded=False)
 
 
 
 
222
  st.rerun()
223
- except Exception as e: status_script_regen.update(label=f"Error: {e}", state="error")
224
- else: st.warning("Please provide feedback.")
225
- with st.popover(f"🎨 Edit Scene {scene_num_display} Visuals"):
226
- # ... (Visual edit logic - same, but passes more context to create_visual_regeneration_prompt)
227
- prompt_for_edit_visuals = st.session_state.scene_image_prompts[i] if i < len(st.session_state.scene_image_prompts) else "No prompt."
228
- st.caption("Current Full Image Prompt:"); st.code(prompt_for_edit_visuals, language='text')
229
- feedback_visual = st.text_area("Describe visual changes for the prompt:", key=f"visual_feedback_{unique_key_part}_{i}", height=100)
230
- if st.button(f"🔄 Update Scene {scene_num_display} Visuals", key=f"regen_visual_btn_{unique_key_part}_{i}"):
231
- if feedback_visual:
232
- with st.status(f"Refining prompt & regenerating visual...", expanded=True) as status_visual_regen:
233
- prompt_refinement_request = create_visual_regeneration_prompt(
234
- prompt_for_edit_visuals, feedback_visual, scene_data_display,
235
- st.session_state.character_definitions, st.session_state.style_reference_description # Pass these
 
236
  )
237
  try:
238
- refined_textual_image_prompt = st.session_state.gemini_handler.regenerate_image_prompt_from_feedback(prompt_refinement_request)
239
- st.session_state.scene_image_prompts[i] = refined_textual_image_prompt
240
- status_visual_regen.update(label="Prompt refined! Regenerating visual...", state="running")
241
- version = 1
242
- if current_image_path: try: base, _ = os.path.splitext(os.path.basename(current_image_path)); version = int(base.split('_v')[-1]) + 1 if '_v' in base else 2 except: version = 2
243
- if generate_visual_for_scene_wrapper(i, scene_data_display, is_regeneration=True, version_count=version): status_visual_regen.update(label="Visual updated! 🎉", state="complete", expanded=False)
244
- else: status_visual_regen.update(label="Prompt refined, visual failed.", state="warning", expanded=False)
 
 
 
245
  st.rerun()
246
- except Exception as e: status_visual_regen.update(label=f"Error: {e}", state="error")
247
- else: st.warning("Please provide feedback.")
248
  st.markdown("---")
249
 
250
- # Video Generation - Pass overall_narration_path
251
- if st.session_state.story_scenes and any(p for p in st.session_state.generated_images_paths if p is not None):
252
- if st.button("🎬 Assemble Narrated Masterpiece", key="assemble_narrated_video_btn", type="primary", use_container_width=True):
253
- with st.status("Assembling narrated animatic video...", expanded=True) as status_video:
254
- image_data_for_video = []
255
- # ... (image_data_for_video assembly - same) ...
256
- for idx, scene_info in enumerate(st.session_state.story_scenes):
257
- img_path = st.session_state.generated_images_paths[idx] if idx < len(st.session_state.generated_images_paths) else None
258
- if img_path and os.path.exists(img_path):
259
- image_data_for_video.append({'path':img_path, 'scene_num':scene_info.get('scene_number',idx+1), 'key_action':scene_info.get('key_action','')})
260
- st.write(f"Adding Scene {scene_info.get('scene_number', idx + 1)} to video.")
 
261
 
262
- if image_data_for_video:
263
- st.write("Calling video engine (with narration if available)...")
264
  st.session_state.video_path = st.session_state.visual_engine.create_video_from_images(
265
- image_data_for_video,
266
- overall_narration_path=st.session_state.overall_narration_path, # Pass narration
267
- output_filename="cinegen_narrated_masterpiece.mp4",
268
- duration_per_image=5, # Longer for narration
269
  fps=24
270
  )
271
  if st.session_state.video_path and os.path.exists(st.session_state.video_path):
272
- status_video.update(label="Narrated masterpiece assembled! 🎉", state="complete", expanded=False); st.balloons()
273
- else: status_video.update(label="Video assembly failed. Check logs.", state="error", expanded=False)
274
- else: status_video.update(label="No valid images to assemble video.", state="error", expanded=False)
275
- elif st.session_state.story_scenes: st.info("Generate visuals for scenes before assembling the video.")
276
 
277
- # Video display and download - (same)
278
  if st.session_state.video_path and os.path.exists(st.session_state.video_path):
279
- st.header("🎬 Generated Narrated Masterpiece")
280
  try:
281
  with open(st.session_state.video_path, 'rb') as vf_obj: video_bytes = vf_obj.read()
282
  st.video(video_bytes, format="video/mp4")
283
  with open(st.session_state.video_path, "rb") as fp_dl:
284
- st.download_button(label="Download Narrated Masterpiece", data=fp_dl,
285
  file_name=os.path.basename(st.session_state.video_path), mime="video/mp4",
286
- use_container_width=True, key="download_narrated_video_btn" )
287
  except Exception as e: st.error(f"Error displaying video: {e}")
288
 
289
  # --- Footer ---
290
  st.sidebar.markdown("---")
291
- st.sidebar.caption("CineGen AI Ultra | Powered by Gemini, DALL-E, ElevenLabs & Streamlit.")
 
3
  from core.gemini_handler import GeminiHandler
4
  from core.visual_engine import VisualEngine
5
  from core.prompt_engineering import (
6
+ create_cinematic_treatment_prompt, # UPDATED
7
+ construct_dalle_prompt, # UPDATED
8
+ create_narration_script_prompt_enhanced, # UPDATED
9
+ create_scene_regeneration_prompt, # UPDATED
10
+ create_visual_regeneration_prompt # UPDATED
11
  )
12
  import os
13
 
14
  # --- Configuration & Initialization ---
15
+ st.set_page_config(page_title="CineGen AI Ultra+", layout="wide", initial_sidebar_state="expanded")
16
 
17
  # --- Global State Variables & API Key Setup ---
 
18
  def load_api_key(key_name_streamlit, key_name_env):
19
+ key = None; secrets_available = hasattr(st, 'secrets')
20
  try:
21
+ if secrets_available and key_name_streamlit in st.secrets: key = st.secrets[key_name_streamlit]
22
+ except Exception: pass # Silently ignore if st.secrets access fails
 
23
  if not key and key_name_env in os.environ: key = os.environ[key_name_env]
24
  return key
25
 
26
+ # Initialize API Keys and handlers once
27
+ if 'keys_loaded' not in st.session_state:
28
  st.session_state.GEMINI_API_KEY = load_api_key("GEMINI_API_KEY", "GEMINI_API_KEY")
29
+ st.session_state.OPENAI_API_KEY = load_api_key("OPENAI_API_KEY", "OPENAI_API_KEY")
30
+ st.session_state.ELEVENLABS_API_KEY = load_api_key("ELEVENLABS_API_KEY", "ELEVENLABS_API_KEY")
31
+ st.session_state.PEXELS_API_KEY = load_api_key("PEXELS_API_KEY", "PEXELS_API_KEY")
32
+
33
+ if not st.session_state.GEMINI_API_KEY: st.error("Gemini API Key is essential and missing!"); st.stop()
34
+
35
  st.session_state.gemini_handler = GeminiHandler(api_key=st.session_state.GEMINI_API_KEY)
 
 
36
  st.session_state.visual_engine = VisualEngine(output_dir="temp_cinegen_media")
37
+ st.session_state.visual_engine.set_openai_api_key(st.session_state.OPENAI_API_KEY)
38
+ st.session_state.visual_engine.set_elevenlabs_api_key(st.session_state.ELEVENLABS_API_KEY)
39
+ st.session_state.visual_engine.set_pexels_api_key(st.session_state.PEXELS_API_KEY)
40
+ st.session_state.keys_loaded = True
41
 
42
+ # Initialize other session state variables
43
  for key, default_val in [
44
+ ('story_treatment_scenes', []), ('scene_dalle_prompts', []), ('generated_visual_paths', []),
45
+ ('video_path', None), ('character_definitions', {}), ('global_style_additions', ""),
46
+ ('overall_narration_audio_path', None), ('narration_script_display', "")
47
  ]:
48
  if key not in st.session_state: st.session_state[key] = default_val
 
 
49
 
50
+ # --- Helper Functions ---
51
+ def initialize_new_project():
52
+ st.session_state.story_treatment_scenes = []
53
+ st.session_state.scene_dalle_prompts = []
54
+ st.session_state.generated_visual_paths = []
55
  st.session_state.video_path = None
56
+ st.session_state.overall_narration_audio_path = None
57
+ st.session_state.narration_script_display = ""
58
 
59
+ def generate_visual_for_scene_core(scene_index, scene_data, version=1):
60
+ # scene_data here is one scene from story_treatment_scenes
61
+ dalle_prompt = construct_dalle_prompt(
62
+ scene_data,
63
+ st.session_state.character_definitions,
64
+ st.session_state.global_style_additions
 
 
 
 
 
 
 
 
 
 
 
 
 
 
65
  )
66
+ if not dalle_prompt: return False
67
+
68
+ # Ensure lists are long enough
69
+ while len(st.session_state.scene_dalle_prompts) <= scene_index: st.session_state.scene_dalle_prompts.append("")
70
+ while len(st.session_state.generated_visual_paths) <= scene_index: st.session_state.generated_visual_paths.append(None)
71
+
72
+ st.session_state.scene_dalle_prompts[scene_index] = dalle_prompt
73
+
74
+ filename = f"scene_{scene_data.get('scene_number', scene_index+1)}_visual_v{version}.png"
75
+ # Pass the full scene_data to visual_engine for Pexels query construction if needed
76
+ img_path = st.session_state.visual_engine.generate_image_visual(dalle_prompt, scene_data, filename)
77
+
78
+ if img_path and os.path.exists(img_path):
79
+ st.session_state.generated_visual_paths[scene_index] = img_path; return True
80
  else:
81
+ st.session_state.generated_visual_paths[scene_index] = None; return False
 
82
 
83
  # --- UI Sidebar ---
84
  with st.sidebar:
85
+ st.title("🎬 CineGen AI Ultra+")
86
+ st.markdown("### Creative Seed")
87
+ user_idea = st.text_area("Core Story Idea / Theme:", "A lone wanderer searches for a mythical oasis in a vast, post-apocalyptic desert, haunted by mirages and mechanical scavengers.", height=120, key="user_idea_main")
88
+ genre = st.selectbox("Primary Genre:", ["Cyberpunk", "Sci-Fi", "Fantasy", "Noir", "Thriller", "Western", "Post-Apocalyptic"], index=6, key="genre_main")
89
+ mood = st.selectbox("Overall Mood:", ["Hopeful yet Desperate", "Mysterious & Eerie", "Gritty & Tense", "Epic & Awe-Inspiring", "Melancholy & Reflective"], index=0, key="mood_main")
90
+ num_scenes = st.slider("Number of Key Scenes:", 1, 4, 2, key="num_scenes_main") # Max 3-4 for API cost/time
 
91
 
92
+ creative_guidance_options = {"Standard": "standard", "More Artistic": "more_artistic", "Experimental Narrative": "experimental_narrative"}
93
+ selected_creative_guidance = st.selectbox("AI Creative Guidance Level:", options=list(creative_guidance_options.keys()), key="creative_guidance_select")
94
 
95
+ if st.button("🌌 Generate Cinematic Treatment", type="primary", key="generate_treatment_btn", use_container_width=True):
96
+ initialize_new_project()
97
+ if not user_idea.strip(): st.warning("Please provide a story idea.")
98
  else:
99
+ with st.status("AI Director is envisioning your masterpiece...", expanded=True) as status:
100
+ status.write("Phase 1: Gemini crafting cinematic treatment (scenes, style, camera, sound)... 📜")
101
+ treatment_prompt = create_cinematic_treatment_prompt(user_idea, genre, mood, num_scenes, creative_guidance_options[selected_creative_guidance])
 
102
  try:
103
+ st.session_state.story_treatment_scenes = st.session_state.gemini_handler.generate_story_breakdown(treatment_prompt) # Re-use for JSON list
104
+ num_gen_scenes = len(st.session_state.story_treatment_scenes)
105
+ st.session_state.scene_dalle_prompts = [""] * num_gen_scenes
106
+ st.session_state.generated_visual_paths = [None] * num_gen_scenes
107
+ status.update(label="Treatment complete! Generating visuals...", state="running")
108
+
109
+ visual_successes = 0
110
+ for i_scene, scene_content in enumerate(st.session_state.story_treatment_scenes):
111
+ status.write(f" Creating visual for Scene {scene_content.get('scene_number', i_scene+1)}: {scene_content.get('scene_title','')}...")
112
+ if generate_visual_for_scene_core(i_scene, scene_content, version=1): visual_successes += 1
 
 
 
113
 
114
+ if visual_successes == 0 and num_gen_scenes > 0:
115
+ status.update(label="Visual generation failed for all scenes. Check API keys/quota.", state="error", expanded=False); st.stop()
116
 
117
+ status.update(label="Visuals ready! Generating narration script...", state="running")
118
+ narration_prompt = create_narration_script_prompt_enhanced(st.session_state.story_treatment_scenes, mood, genre, st.session_state.get("selected_voice_style", "cinematic_trailer"))
119
+ narr_script = st.session_state.gemini_handler.generate_image_prompt(narration_prompt) # generate_image_prompt is just text gen
120
+ st.session_state.narration_script_display = narr_script
121
+ status.update(label="Narration script ready! Synthesizing voice...", state="running")
122
+
123
+ st.session_state.overall_narration_audio_path = st.session_state.visual_engine.generate_narration_audio(narr_script)
124
+ if st.session_state.overall_narration_audio_path: status.update(label="Voiceover ready! ✨", state="running")
125
+ else: status.update(label="Voiceover failed. Video will be silent.", state="warning")
126
+
127
+ status.update(label="All components ready! View storyboard. 🚀", state="complete", expanded=False)
 
 
 
 
 
 
128
 
129
+ except Exception as e: status.update(label=f"Error during generation: {e}", state="error", expanded=True); st.stop()
130
 
131
+ st.markdown("---")
132
+ st.markdown("### Fine-Tuning Options")
133
+ # Character Definitions Expander (same as previous)
134
+ with st.expander("Define Characters", expanded=False):
135
+ # ... (UI for char_name_input, char_desc_input, add button - same as previous, ensure lowercase keys for definitions)
136
+ char_name_input = st.text_input("Character Name", key="char_name_adv_input_ultra")
137
+ char_desc_input = st.text_area("Detailed Visual Description", key="char_desc_adv_input_ultra", height=100, placeholder="e.g., Jax: rugged male astronaut, mid-40s, salt-and-pepper short hair, cybernetic left eye glowing faintly blue, wearing a patched-up crimson flight suit.")
138
+ if st.button("Save Character", key="add_char_adv_btn_ultra"):
139
+ if char_name_input and char_desc_input: st.session_state.character_definitions[char_name_input.strip().lower()] = char_desc_input.strip(); st.success(f"Character '{char_name_input.strip()}' saved.")
140
+ else: st.warning("Provide name and description.")
141
  if st.session_state.character_definitions:
142
+ st.caption("Current Characters:")
143
+ for k,v in st.session_state.character_definitions.items(): st.markdown(f"**{k.title()}:** _{v}_")
144
+
145
+ # Style Controls Expander (same as previous)
146
+ with st.expander("Global Style Overrides", expanded=False):
147
+ # ... (UI for predefined_styles, custom_style_keywords, apply button - same as previous) ...
148
+ predefined_styles = { "Default (Director's Choice)": "", "Hyper-Realistic Gritty Noir": "hyper-realistic gritty neo-noir, extreme detail, deep dynamic shadows, complex reflections on wet surfaces, cinematic film grain, desaturated palette with isolated vibrant neon accents (e.g. red, cyan), anamorphic lens distortion, atmospheric haze.", "Surreal Dreamscape Fantasy": "surreal dreamscape, epic fantasy elements, painterly with photorealistic details, impossible architecture, bioluminescent flora, otherworldly color palette (e.g., magenta skies, turquoise rivers), style of Roger Dean meets Zdzisław Beksiński.", "Vintage Analog Sci-Fi": "70s/80s analog sci-fi film aesthetic, tangible practical effects look, subtle light leaks, lens flares, warm filmic tones mixed with cool blues, detailed retro-futuristic technology with chunky buttons and CRT screens."}
149
+ selected_preset = st.selectbox("Base Style Preset:", options=list(predefined_styles.keys()), key="style_preset_select_adv_ultra")
150
+ custom_keywords = st.text_area("Additional Custom Style Keywords:", key="custom_style_keywords_adv_input_ultra", height=80, placeholder="e.g., 'shot with Arri Alexa, shallow depth of field, golden hour tones'")
151
+ current_style_desc = st.session_state.global_style_additions
152
+ if st.button("Apply Global Styles", key="apply_styles_adv_btn_ultra"):
153
  final_desc = predefined_styles[selected_preset];
154
  if custom_keywords.strip(): final_desc = f"{final_desc}, {custom_keywords.strip()}" if final_desc else custom_keywords.strip()
155
+ st.session_state.global_style_additions = final_desc.strip(); current_style_desc = final_desc.strip()
156
+ if current_style_desc: st.success("Global styles applied!")
157
+ else: st.info("Global style additions cleared (using Director's per-scene choice).")
158
+ if current_style_desc: st.caption(f"Active global style additions: \"{current_style_desc}\"")
159
+
160
# --- Narrator voice selection (ElevenLabs) ---
with st.expander("Voice Customization (ElevenLabs)", expanded=False):
    # Hard-coded placeholder list of voice names; nothing is fetched from the
    # ElevenLabs API here.
    voice_choices = ["Rachel", "Adam", "Bella", "Antoni", "Elli", "Josh", "Arnold", "Domi", "Fin", "Sarah"]

    # Use the engine's current voice when an engine exists in session state,
    # otherwise fall back to "Rachel".
    if hasattr(st.session_state, 'visual_engine'):
        active_voice = st.session_state.visual_engine.elevenlabs_voice_id
    else:
        active_voice = "Rachel"

    # Pre-select the active voice; an unknown voice falls back to the first
    # entry of the list.
    try:
        default_index = voice_choices.index(active_voice)
    except ValueError:
        default_index = 0

    selected_el_voice = st.selectbox(
        "Narrator Voice:",
        voice_choices,
        index=default_index,
        key="el_voice_select_ultra",
    )

    if st.button("Set Narrator Voice", key="set_voice_btn_ultra"):
        if hasattr(st.session_state, 'visual_engine'):
            st.session_state.visual_engine.elevenlabs_voice_id = selected_el_voice
        st.success(f"Narrator voice set to: {selected_el_voice}")
170
 
171
 
172
  # --- Main Content Area ---
173
st.header("🎬 Cinematic Storyboard & Treatment")

# Show the narration script held in session state (if any) in a collapsed
# expander above the storyboard, rendered as an italic block quote.
narration_script_text = st.session_state.narration_script_display
if narration_script_text:
    with st.expander("📜 View Full Narration Script", expanded=False):
        st.markdown(f"> _{narration_script_text}_")
179
 
180
def _next_visual_version(image_path):
    """Return the version number to use when regenerating a scene visual.

    * No existing image path -> 1.
    * Existing file whose name (without extension) contains ``_v`` followed
      by an integer -> that integer + 1.
    * Any other existing file name -> 2.
    """
    if not image_path:
        return 1
    stem, _ = os.path.splitext(os.path.basename(image_path))
    if '_v' not in stem:
        return 2
    try:
        return int(stem.split('_v')[-1]) + 1
    except ValueError:
        # Text after the last "_v" is not a number; treat as a second version.
        return 2


if not st.session_state.story_treatment_scenes:
    st.info("Use the sidebar to generate your cinematic treatment.")
else:
    for i_main, scene_content_display in enumerate(st.session_state.story_treatment_scenes):
        scene_num = scene_content_display.get('scene_number', i_main + 1)
        scene_title = scene_content_display.get('scene_title', 'Untitled Scene')
        # Base for widget keys: scene number plus the alphanumeric characters
        # of the first 10 characters of the title.
        unique_key_base = f"scene_{scene_num}_{''.join(filter(str.isalnum, scene_title[:10]))}"

        st.subheader(f"SCENE {scene_num}: {scene_title.upper()}")

        # Optional director's note attached to the scene.
        if "director_note" in scene_content_display:
            st.info(f"🎬 Director's Note for Scene {scene_num}: {scene_content_display['director_note']}")

        col_details, col_visual = st.columns([0.45, 0.55])

        with col_details:
            with st.expander("📝 Scene Treatment Details", expanded=True):
                # An empty or missing character list is shown as "N/A".
                characters = scene_content_display.get('characters_involved') or ['N/A']
                st.markdown(f"**Emotional Beat:** {scene_content_display.get('emotional_beat', 'N/A')}")
                st.markdown(f"**Setting:** {scene_content_display.get('setting_description', 'N/A')}")
                st.markdown(f"**Characters:** {', '.join(str(c) for c in characters)}")
                st.markdown(f"**Character Focus Moment:** _{scene_content_display.get('character_focus_moment', 'N/A')}_")
                st.markdown(f"**Key Plot Beat:** {scene_content_display.get('key_plot_beat', 'N/A')}")
                st.markdown(f"**Dialogue Hook:** `\"{scene_content_display.get('suggested_dialogue_hook', '...')}\"`")
                st.markdown("---")
                # NOTE(review): the "_감독" suffix (Korean for "director") was
                # restored from mis-encoded text; confirm it matches the keys
                # produced by the story-breakdown prompt.
                st.markdown(f"**🎬 Director's Visual Style:** {scene_content_display.get('PROACTIVE_visual_style_감독', 'N/A')}")
                st.markdown(f"**🎥 Director's Camera Work:** {scene_content_display.get('PROACTIVE_camera_work_감독', 'N/A')}")
                st.markdown(f"**🔊 Director's Sound Design:** {scene_content_display.get('PROACTIVE_sound_design_감독', 'N/A')}")

            current_dalle_prompt = (
                st.session_state.scene_dalle_prompts[i_main]
                if i_main < len(st.session_state.scene_dalle_prompts)
                else None
            )
            if current_dalle_prompt:
                with st.popover("👁️ View DALL-E Prompt"):
                    st.markdown("**Full DALL-E Prompt:**")
                    st.code(current_dalle_prompt, language='text')

            pexels_query_display = scene_content_display.get('pexels_search_query_감독', None)
            if pexels_query_display:
                st.caption(f"Suggested Pexels Query: `{pexels_query_display}`")

        with col_visual:
            current_img_path = (
                st.session_state.generated_visual_paths[i_main]
                if i_main < len(st.session_state.generated_visual_paths)
                else None
            )
            if current_img_path and os.path.exists(current_img_path):
                st.image(current_img_path, caption=f"Visual Concept for Scene {scene_num}: {scene_title}", use_column_width='always')
            else:
                st.caption("Visual concept pending or failed.")

            # --- Edit the scene treatment, then regenerate its visual ---
            with st.popover(f"✏️ Edit Scene {scene_num} Treatment"):
                feedback_script_edit = st.text_area(
                    "Describe changes to treatment details:",
                    key=f"treat_feed_{unique_key_base}",
                    height=150,
                )
                if st.button(f"🔄 Update Scene {scene_num} Treatment", key=f"regen_treat_btn_{unique_key_base}"):
                    if feedback_script_edit:
                        with st.status(f"Updating Scene {scene_num} Treatment...", expanded=True) as status_treat_regen:
                            regen_prompt_text = create_scene_regeneration_prompt(
                                scene_content_display, feedback_script_edit, st.session_state.story_treatment_scenes
                            )
                            try:
                                # Assumed to return a single scene object.
                                updated_scene_data = st.session_state.gemini_handler.regenerate_scene_script_details(regen_prompt_text)
                                st.session_state.story_treatment_scenes[i_main] = updated_scene_data
                                status_treat_regen.update(label="Treatment updated! Regenerating visual & DALL-E prompt...", state="running")
                                version_num = _next_visual_version(current_img_path)

                                # Regenerate the visual for the updated scene data.
                                if generate_visual_for_scene_core(i_main, updated_scene_data, version=version_num):
                                    status_treat_regen.update(label="Scene Treatment & Visual Updated! 🎉", state="complete", expanded=False)
                                else:
                                    # st.status only accepts "running", "complete" or "error".
                                    status_treat_regen.update(label="Treatment updated, visual failed.", state="error", expanded=False)
                            except Exception as e:
                                status_treat_regen.update(label=f"Error: {e}", state="error")
                            else:
                                # Rerun outside the handler's reach so the
                                # refreshed scene data is rendered.
                                st.rerun()
                    else:
                        st.warning("Please provide feedback for treatment regeneration.")

            # --- Edit the DALL-E prompt, then regenerate the visual ---
            with st.popover(f"🎨 Edit Scene {scene_num} Visual Prompt"):
                dalle_prompt_to_edit = (
                    st.session_state.scene_dalle_prompts[i_main]
                    if i_main < len(st.session_state.scene_dalle_prompts)
                    else "No DALL-E prompt."
                )
                st.caption("Current DALL-E Prompt:")
                st.code(dalle_prompt_to_edit, language='text')
                feedback_visual_edit = st.text_area(
                    "Describe changes for the DALL-E prompt:",
                    key=f"visual_feed_{unique_key_base}",
                    height=150,
                )
                if st.button(f"🔄 Update Scene {scene_num} Visual Prompt & Image", key=f"regen_visual_btn_{unique_key_base}"):
                    if feedback_visual_edit:
                        with st.status("Refining DALL-E prompt & regenerating visual...", expanded=True) as status_visual_edit_regen:
                            # Build the request asking Gemini to refine the DALL-E prompt.
                            refinement_req_prompt = create_visual_regeneration_prompt(
                                dalle_prompt_to_edit, feedback_visual_edit, scene_content_display,
                                st.session_state.character_definitions, st.session_state.global_style_additions
                            )
                            try:
                                refined_dalle_prompt = st.session_state.gemini_handler.generate_image_prompt(refinement_req_prompt)
                                # Store the refined prompt for this scene.
                                st.session_state.scene_dalle_prompts[i_main] = refined_dalle_prompt
                                status_visual_edit_regen.update(label="DALL-E prompt refined! Regenerating visual...", state="running")
                                version_num = _next_visual_version(current_img_path)

                                # NOTE(review): only the scene data is passed here, not the
                                # refined prompt; confirm generate_visual_for_scene_core reads
                                # st.session_state.scene_dalle_prompts[i_main] rather than
                                # rebuilding (and overwriting) the prompt.
                                if generate_visual_for_scene_core(i_main, scene_content_display, version=version_num):
                                    status_visual_edit_regen.update(label="Visual Updated! 🎉", state="complete", expanded=False)
                                else:
                                    # st.status only accepts "running", "complete" or "error".
                                    status_visual_edit_regen.update(label="Prompt refined, visual failed.", state="error", expanded=False)
                            except Exception as e:
                                status_visual_edit_regen.update(label=f"Error: {e}", state="error")
                            else:
                                st.rerun()
                    else:
                        st.warning("Please provide feedback for visual prompt regeneration.")

        # Separator between scenes.
        st.markdown("---")
275
 
276
# --- Animatic assembly ---
# The button is offered only when there are scenes and at least one scene has
# a (truthy) visual path; with scenes but no visuals an info hint is shown.
if st.session_state.story_treatment_scenes and any(st.session_state.generated_visual_paths):
    if st.button("🎬 Assemble Narrated Cinematic Animatic", key="assemble_ultra_video_btn", type="primary", use_container_width=True):
        with st.status("Assembling Ultra Animatic...", expanded=True) as status_vid:
            # Collect one entry per scene whose image file exists on disk.
            image_data_for_vid = []
            for i_vid, scene_c in enumerate(st.session_state.story_treatment_scenes):
                img_p = (
                    st.session_state.generated_visual_paths[i_vid]
                    if i_vid < len(st.session_state.generated_visual_paths)
                    else None
                )
                if img_p and os.path.exists(img_p):
                    image_data_for_vid.append({
                        'path': img_p,
                        'scene_num': scene_c.get('scene_number', i_vid + 1),
                        # The scene's key plot beat is passed as 'key_action'.
                        'key_action': scene_c.get('key_plot_beat', ''),
                    })
                    status_vid.write(f"Adding Scene {scene_c.get('scene_number', i_vid + 1)} to video.")

            if image_data_for_vid:
                status_vid.write("Calling video engine...")
                st.session_state.video_path = st.session_state.visual_engine.create_video_from_images(
                    image_data_for_vid,
                    overall_narration_path=st.session_state.overall_narration_audio_path,
                    output_filename="cinegen_ultra_animatic.mp4",
                    # NOTE(review): per-image duration is derived from the overlay
                    # font size (font_size * 0.15); confirm this coupling is intended.
                    duration_per_image=st.session_state.visual_engine.video_overlay_font_size * 0.15,
                    fps=24
                )
                if st.session_state.video_path and os.path.exists(st.session_state.video_path):
                    status_vid.update(label="Ultra animatic assembled! 🎉", state="complete", expanded=False)
                    st.balloons()
                else:
                    status_vid.update(label="Video assembly failed. Check logs.", state="error", expanded=False)
            else:
                status_vid.update(label="No valid images for video.", state="error", expanded=False)
elif st.session_state.story_treatment_scenes:
    st.info("Generate visuals before assembling video.")
303
 
304
# --- Video display and download ---
# Shown only when session state holds a video path that exists on disk.
if st.session_state.video_path and os.path.exists(st.session_state.video_path):
    st.header("🎬 Generated Cinematic Animatic")
    try:
        # Read the file once and reuse the bytes for both the player and the
        # download button, so no file handle outlives this block.
        with open(st.session_state.video_path, 'rb') as vf_obj:
            video_bytes = vf_obj.read()
        st.video(video_bytes, format="video/mp4")
        st.download_button(
            label="Download Ultra Animatic",
            data=video_bytes,
            file_name=os.path.basename(st.session_state.video_path),
            mime="video/mp4",
            use_container_width=True,
            key="download_ultra_video_btn",
        )
    except Exception as e:
        # UI boundary: report the problem in the page instead of crashing.
        st.error(f"Error displaying video: {e}")

# --- Footer ---
st.sidebar.markdown("---")
st.sidebar.caption("CineGen AI Ultra+ | Visionary Cinematic Pre-Production")