Spaces:

drvsbrkcn
/

EceMotion_Pictures

Paused

App Files Community

EceMotion_Pictures / llm_script_generator.py

drvsbrkcn

Upload 3 files

404465b verified 30 days ago

raw

history blame contribute delete

15.1 kB

	"""
	LLM-powered script generation for EceMotion Pictures.
	Generates intelligent, structure-aware commercial scripts with timing markers.
	"""

	import logging
	import random
	import re
	from dataclasses import dataclass
	from typing import Dict, List, Optional, Tuple

	from config import (
	    MODEL_LLM,
	    MODEL_CONFIGS,
	    VOICE_STYLES,
	    STRUCTURE_TEMPLATES,
	    TAGLINES,
	    get_safe_model_name,
	)

	logger = logging.getLogger(__name__)

	@dataclass
	class ScriptSegment:
	    """Represents a segment of the commercial script with timing information.

	    Attributes:
	        text: The spoken copy for this segment.
	        duration_estimate: Estimated duration of the segment, in seconds.
	        segment_type: One of "hook", "flow", "benefit" or "cta".
	        timing_marker: Optional bracketed label such as "[HOOK]"; ``None``
	            when the segment carries no marker.
	    """

	    text: str
	    duration_estimate: float
	    segment_type: str  # "hook", "flow", "benefit", "cta"
	    timing_marker: Optional[str] = None

	@dataclass
	class GeneratedScript:
	    """Complete generated script with all segments and metadata.

	    Attributes:
	        segments: Ordered script segments that make up the commercial.
	        total_duration: Sum of the segments' duration estimates, in seconds.
	        tagline: Closing tagline chosen or extracted for the script.
	        voice_style: Voice style the script was requested with.
	        word_count: Total number of whitespace-separated words across segments.
	        raw_script: Unparsed text the script was built from (the raw model
	            response, or a descriptive placeholder for template scripts).
	    """

	    segments: List[ScriptSegment]
	    total_duration: float
	    tagline: str
	    voice_style: str
	    word_count: int
	    raw_script: str

	class LLMScriptGenerator:
	    """Generates commercial scripts using large language models with fallbacks.

	    On construction the generator tries to load a causal language model via
	    ``transformers``. When loading fails, or the model name is not recognised,
	    ``llm_available`` stays ``False`` and every public method falls back to
	    deterministic template-based generation.
	    """

	    # Speaking rate used to convert a word count into a duration estimate.
	    WORDS_PER_MINUTE = 150

	    # Segment labels the system prompt asks the model to emit. The capture
	    # group makes ``split`` return the labels alongside the text between them.
	    _SEGMENT_MARKER_RE = re.compile(r"\b(HOOK|FLOW|BENEFIT|CTA):")
	    # Text of the CTA section: everything after "CTA:" up to the next marker
	    # or the end of the response.
	    _CTA_SECTION_RE = re.compile(
	        r"\bCTA:(.*?)(?=\b(?:HOOK|FLOW|BENEFIT|CTA):|\Z)", re.DOTALL
	    )
	    _SENTENCE_END_RE = re.compile(r"[.!?]+")

	    # Building blocks for the non-LLM suggestion generator.
	    _IDEA_STYLES = ("infomercial", "mall ad", "late-night", "newsflash", "arcade bumper")
	    _IDEA_SHOTS = ("neon grid", "CRT scanlines", "vaporwave sunset", "shopping mall", "boombox close-up")
	    _IDEA_HOOKS = (
	        "Remember this sound?", "Back to '87.", "Deal of the decade.",
	        "We paused time.", "Be kind, rewind your brand.",
	    )
	    _STRUCTURE_KEYWORDS = (
	        "montage", "testimonial", "news", "unboxing", "before",
	        "after", "countdown", "logo", "cta",
	    )

	    def __init__(self, model_name: str = MODEL_LLM):
	        """Resolve the model name and attempt to load the model.

	        Args:
	            model_name: Requested model identifier; passed through
	                ``get_safe_model_name`` before use.
	        """
	        self.model_name = get_safe_model_name(model_name, "llm")
	        self.model = None
	        self.tokenizer = None
	        self.model_config = MODEL_CONFIGS.get(self.model_name, {})
	        self.llm_available = False

	        # Try to initialize LLM
	        self._try_init_llm()

	    def _try_init_llm(self) -> None:
	        """Try to initialize the LLM model, leaving ``llm_available`` False on failure."""
	        lowered = self.model_name.lower()
	        try:
	            if "dialo" in lowered:
	                self._init_dialogpt()
	            elif "qwen" in lowered:
	                self._init_qwen()
	            else:
	                logger.warning("Unknown LLM model: %s, using fallback", self.model_name)
	                self.llm_available = False
	        except Exception as exc:
	            logger.warning("Failed to initialize LLM %s: %s", self.model_name, exc)
	            self.llm_available = False

	    def _load_model(self, label: str, trust_remote_code: bool = False) -> None:
	        """Load tokenizer and model for ``self.model_name``.

	        Args:
	            label: Human-readable model family name used in log messages.
	            trust_remote_code: When true, ``trust_remote_code=True`` is passed
	                to both ``from_pretrained`` calls.

	        Any exception during loading is logged and leaves the generator in the
	        "LLM unavailable" state with no half-initialised tokenizer or model.
	        """
	        # Only forward the flag when requested so the plain load keeps using
	        # the library defaults.
	        extra = {"trust_remote_code": True} if trust_remote_code else {}
	        try:
	            from transformers import AutoTokenizer, AutoModelForCausalLM

	            tokenizer = AutoTokenizer.from_pretrained(self.model_name, **extra)
	            if tokenizer.pad_token is None:
	                # Needed because the tokenizer is later called with padding=True.
	                tokenizer.pad_token = tokenizer.eos_token

	            model = AutoModelForCausalLM.from_pretrained(
	                self.model_name,
	                torch_dtype="auto",
	                device_map="auto" if self._has_gpu() else "cpu",
	                **extra,
	            )
	        except Exception as exc:
	            logger.error("Failed to load %s: %s", label, exc)
	            self.tokenizer = None
	            self.model = None
	            self.llm_available = False
	            return

	        self.tokenizer = tokenizer
	        self.model = model
	        self.llm_available = True
	        logger.info("%s model %s loaded successfully", label, self.model_name)

	    def _init_dialogpt(self) -> None:
	        """Initialize DialoGPT model."""
	        self._load_model("DialoGPT")

	    def _init_qwen(self) -> None:
	        """Initialize Qwen model (loaded with ``trust_remote_code=True``)."""
	        self._load_model("Qwen", trust_remote_code=True)

	    def _has_gpu(self) -> bool:
	        """Check if GPU is available; False when torch is not installed."""
	        try:
	            import torch
	        except ImportError:
	            return False
	        return torch.cuda.is_available()

	    def _create_system_prompt(self) -> str:
	        """Create system prompt for retro commercial script generation."""
	        # Built from explicit lines so the prompt text does not depend on how
	        # this source file happens to be indented.
	        return "\n".join((
	            "You are a professional copywriter specializing in 1980s-style TV commercials.",
	            "Your task is to create engaging, persuasive commercial scripts that capture the authentic retro aesthetic.",
	            "",
	            "Key requirements:",
	            "- Use 1980s commercial language and style",
	            "- Include clear hooks, benefits, and calls-to-action",
	            "- Keep scripts concise and punchy",
	            "- Use active voice and emotional appeals",
	            "- End with a memorable tagline",
	            "",
	            "Format your response as:",
	            "HOOK: [Opening attention-grabber]",
	            "FLOW: [Main content following the structure]",
	            "BENEFIT: [Key value proposition]",
	            "CTA: [Call to action with tagline]",
	            "",
	            "Keep each segment under 2-3 sentences. Use enthusiastic, confident language typical of 1980s advertising.",
	        ))

	    def _create_user_prompt(self, brand: str, structure: str, script_prompt: str,
	                            duration: int, voice_style: str) -> str:
	        """Create user prompt with specific requirements."""
	        return "\n".join((
	            f"Create a {duration}-second retro commercial script for {brand}.",
	            "",
	            f"Structure: {structure}",
	            f"Script idea: {script_prompt}",
	            f"Voice style: {voice_style}",
	            "",
	            "Make it authentic to 1980s TV commercials with the energy and style of that era.",
	        ))

	    def _parse_script_response(self, response: str) -> List[ScriptSegment]:
	        """Parse LLM response into structured script segments.

	        The response is split on the ``HOOK:``/``FLOW:``/``BENEFIT:``/``CTA:``
	        markers; text before the first marker is ignored and markers followed
	        by no text are skipped.

	        Returns:
	            Segments in the order they appear; empty when no marker is found.
	        """
	        # With a capturing group, split() yields
	        # [preamble, label, text, label, text, ...].
	        pieces = self._SEGMENT_MARKER_RE.split(response or "")

	        segments = []
	        for label, body in zip(pieces[1::2], pieces[2::2]):
	            text = body.strip()
	            if not text:
	                continue

	            # Estimate speaking time from the word count, in seconds.
	            word_count = len(text.split())
	            segments.append(ScriptSegment(
	                text=text,
	                duration_estimate=word_count / self.WORDS_PER_MINUTE * 60,
	                segment_type=label.lower(),
	                timing_marker=f"[{label}]",
	            ))

	        return segments

	    def _extract_tagline(self, response: str) -> str:
	        """Extract tagline from the script response.

	        The last sentence of the CTA section (without its terminating
	        punctuation) is used when it is longer than five characters;
	        otherwise a random entry from ``TAGLINES`` is returned.
	        """
	        cta_match = self._CTA_SECTION_RE.search(response or "")
	        if cta_match:
	            # Splitting on terminators leaves an empty trailing piece after the
	            # final punctuation mark, so drop blanks before picking the last.
	            sentences = [
	                piece.strip()
	                for piece in self._SENTENCE_END_RE.split(cta_match.group(1))
	                if piece.strip()
	            ]
	            if sentences and len(sentences[-1]) > 5:  # Ensure it's substantial
	                return sentences[-1]

	        # Fallback to predefined taglines
	        return random.choice(TAGLINES)

	    def generate_script_with_llm(self, brand: str, structure: str, script_prompt: str,
	                                 duration: int, voice_style: str, seed: int = 42) -> GeneratedScript:
	        """Generate script using LLM.

	        Args:
	            brand: Brand name inserted into the prompt.
	            structure: Structure description inserted into the prompt.
	            script_prompt: Free-form script idea inserted into the prompt.
	            duration: Target length in seconds, mentioned in the prompt.
	            voice_style: Voice style inserted into the prompt and echoed in
	                the result.
	            seed: Seed applied to both ``random`` and torch before sampling.

	        Returns:
	            The parsed script; ``segments`` is empty when the model output
	            contains none of the expected markers.

	        Raises:
	            RuntimeError: If no LLM is loaded.
	        """
	        if not self.llm_available:
	            raise RuntimeError("LLM not available")

	        # Seed both RNGs: `random` drives the tagline fallback, torch drives
	        # the sampling performed by generate().
	        import torch

	        random.seed(seed)
	        torch.manual_seed(seed)

	        system_prompt = self._create_system_prompt()
	        user_prompt = self._create_user_prompt(brand, structure, script_prompt, duration, voice_style)

	        if "dialo" in self.model_name.lower():
	            # DialoGPT format
	            text = f"{user_prompt}\n\nResponse:"
	        else:
	            # Generic format
	            text = f"System: {system_prompt}\n\nUser: {user_prompt}\n\nAssistant:"

	        encoded = self.tokenizer(text, return_tensors="pt", padding=True, truncation=True, max_length=512)

	        # Move inputs to same device as model
	        device = next(self.model.parameters()).device
	        inputs = {key: tensor.to(device) for key, tensor in encoded.items()}

	        self.model.eval()
	        outputs = self.model.generate(
	            **inputs,
	            max_new_tokens=self.model_config.get("max_tokens", 256),
	            temperature=self.model_config.get("temperature", 0.7),
	            top_p=self.model_config.get("top_p", 0.9),
	            do_sample=True,
	            pad_token_id=self.tokenizer.eos_token_id,
	            eos_token_id=self.tokenizer.eos_token_id,
	            num_return_sequences=1,
	        )

	        # The output repeats the prompt tokens; decode only what follows them.
	        prompt_length = inputs["input_ids"].shape[1]
	        response = self.tokenizer.decode(outputs[0][prompt_length:], skip_special_tokens=True)

	        logger.info("Generated script response: %s...", response[:200])

	        segments = self._parse_script_response(response)
	        tagline = self._extract_tagline(response)

	        return GeneratedScript(
	            segments=segments,
	            total_duration=sum(segment.duration_estimate for segment in segments),
	            tagline=tagline,
	            voice_style=voice_style,
	            word_count=sum(len(segment.text.split()) for segment in segments),
	            raw_script=response,
	        )

	    def generate_script_with_template(self, brand: str, structure: str, script_prompt: str,
	                                      duration: int, voice_style: str, seed: int = 42) -> GeneratedScript:
	        """Generate script using template-based approach (fallback).

	        Args:
	            brand: Brand name inserted into the copy.
	            structure: Structure description; a random entry from
	                ``STRUCTURE_TEMPLATES`` is used when empty or ``None``.
	            script_prompt: Used verbatim as the hook when non-empty.
	            duration: Accepted for signature parity with the LLM path; the
	                template uses fixed per-segment durations and ignores it.
	            voice_style: Echoed in the result.
	            seed: Seed for ``random`` so the choices are repeatable.
	        """
	        random.seed(seed)

	        # Tolerate None the same way _fallback_suggestions does.
	        structure_template = (structure or "").strip() or random.choice(STRUCTURE_TEMPLATES)
	        tagline = random.choice(TAGLINES)

	        # (segment type, text, fixed duration in seconds)
	        plan = (
	            ("hook", script_prompt or f"Introducing {brand} - the future is here!", 2.0),
	            ("flow", f"With {structure_template.lower()}, {brand} delivers results like never before.", 3.0),
	            ("benefit", "Faster, simpler, cooler - just like your favorite retro tech.", 2.5),
	            ("cta", f"Try {brand} today. {tagline}", 2.5),
	        )
	        segments = [
	            ScriptSegment(
	                text=text,
	                duration_estimate=seconds,
	                segment_type=kind,
	                timing_marker=f"[{kind.upper()}]",
	            )
	            for kind, text, seconds in plan
	        ]

	        return GeneratedScript(
	            segments=segments,
	            total_duration=sum(segment.duration_estimate for segment in segments),
	            tagline=tagline,
	            voice_style=voice_style,
	            word_count=sum(len(segment.text.split()) for segment in segments),
	            raw_script=f"Template-based script for {brand}",
	        )

	    def generate_script(self, brand: str, structure: str, script_prompt: str,
	                        duration: int, voice_style: str, seed: int = 42) -> GeneratedScript:
	        """
	        Generate a complete commercial script.

	        Uses the LLM when one is loaded. Falls back to the template generator
	        when no LLM is available, when LLM generation raises, or when the LLM
	        output yields no parseable segments.
	        """
	        try:
	            if self.llm_available:
	                script = self.generate_script_with_llm(
	                    brand, structure, script_prompt, duration, voice_style, seed
	                )
	                if script.segments:
	                    return script
	                # An empty script is useless downstream; prefer the template.
	                logger.warning("LLM response contained no script segments")
	                logger.info("Falling back to template-based generation")
	            else:
	                logger.info("Using template-based script generation (LLM not available)")
	        except Exception as exc:
	            logger.error("Script generation failed: %s", exc)
	            logger.info("Falling back to template-based generation")

	        return self.generate_script_with_template(
	            brand, structure, script_prompt, duration, voice_style, seed
	        )

	    def suggest_scripts(self, structure: str, n: int = 6, seed: int = 0) -> List[str]:
	        """
	        Generate multiple script suggestions based on structure.

	        Each suggestion is the first segment of an LLM-generated script. Any
	        slot the LLM cannot fill (no LLM loaded, generation error, or an
	        unparseable response) is filled from the random idea generator.

	        Returns:
	            A list of ``n`` suggestion strings (empty when ``n`` <= 0).
	        """
	        hooks: List[Optional[str]] = [None] * n

	        # The template generator echoes script_prompt back as the hook, so it
	        # is deliberately not used here: it would yield n identical strings.
	        if self.llm_available:
	            try:
	                for offset in range(n):
	                    script = self.generate_script_with_llm(
	                        brand="YourBrand",
	                        structure=structure,
	                        script_prompt="Create an engaging hook",
	                        duration=10,
	                        voice_style="Announcer '80s",
	                        seed=seed + offset,
	                    )
	                    if script.segments:
	                        hooks[offset] = script.segments[0].text
	            except Exception as exc:
	                logger.warning("Script suggestion failed: %s", exc)

	        if any(hook is None for hook in hooks):
	            ideas = self._fallback_suggestions(structure, n, seed)
	            hooks = [
	                idea if hook is None else hook
	                for hook, idea in zip(hooks, ideas)
	            ]

	        return hooks

	    def _fallback_suggestions(self, structure: str, n: int, seed: int) -> List[str]:
	        """Fallback to original random script generation.

	        Builds ``n`` ideas of the form "<hook> <style> with <shot>." and
	        appends " Includes <keyword>." for each known keyword that occurs in
	        ``structure`` but not yet in the idea.
	        """
	        random.seed(seed)

	        base = (structure or "").lower().strip()
	        ideas = []

	        for _ in range(n):
	            # Draw order (style, shot, hook) is kept fixed so a given seed
	            # always produces the same ideas.
	            style = random.choice(self._IDEA_STYLES)
	            shot = random.choice(self._IDEA_SHOTS)
	            hook = random.choice(self._IDEA_HOOKS)
	            idea = f"{hook} {style} with {shot}."

	            # Light correlation with structure
	            for kw in self._STRUCTURE_KEYWORDS:
	                if kw in base and kw not in idea:
	                    idea += f" Includes {kw}."

	            ideas.append(idea)

	        return ideas

	def create_script_generator() -> LLMScriptGenerator:
	    """Factory function to create a script generator.

	    Returns:
	        An ``LLMScriptGenerator`` constructed with its default model name.
	"""
	    return LLMScriptGenerator()