Spaces:

rogeliorichman
/

AI_Script_Generator

Runtime error

App Files Files Community

rogeliorichman commited on Apr 13, 2025

Commit

e1eb15d

verified ·

1 Parent(s): 4403ebb

Upload folder using huggingface_hub

Browse files

Files changed (3) hide show

requirements.txt +1 -3
src/app.py +28 -37
src/core/transformer.py +75 -138

requirements.txt CHANGED Viewed

@@ -2,9 +2,7 @@ gradio==4.26.0
 transformers>=4.30.0
 torch>=2.0.0
 pypdf2>=3.0.0
-python-dotenv>=0.19.0
-numpy>=1.21.0
 tqdm>=4.65.0
-openai>=1.0.0
 tiktoken>=0.5.0
 fastapi<0.110.0

 transformers>=4.30.0
 torch>=2.0.0
 pypdf2>=3.0.0
+numpy>=1.26.4
 tqdm>=4.65.0
 tiktoken>=0.5.0
 fastapi<0.110.0

src/app.py CHANGED Viewed

@@ -2,7 +2,6 @@ import os
 import gradio as gr
 import re
 import logging # Added for debugging
-from dotenv import load_dotenv
 from src.core.transformer import TranscriptTransformer
 from src.utils.pdf_processor import PDFProcessor
 from src.utils.text_processor import TextProcessor
@@ -10,9 +9,6 @@ from src.utils.text_processor import TextProcessor
 # Set up basic logging
 logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')
-load_dotenv()
-logging.info("Environment variables loaded.")
 # Translations dictionary for UI elements
 TRANSLATIONS = {
     "en": {
@@ -28,7 +24,6 @@ TRANSLATIONS = {
         "guiding_prompt_info": "The Guiding Prompt allows you to provide specific instructions to modify the generated content, like output/desired LANGUAGE. You can use it to change the tone, style, focus ONLY on specific sections of the text, specify the output language (e.g., 'Generate in Spanish/French/German'), or give any other instruction that helps personalize the final result.",
         "duration_label": "Target Lecture Duration (minutes)",
         "examples_label": "Include Practical Examples",
-        "thinking_model_label": "Use Experimental Thinking Model (Gemini Only)",
         "submit_button": "Transform Transcript",
         "output_label": "Generated Teaching Transcript",
         "error_no_pdf": "Error: No PDF file uploaded",
@@ -51,7 +46,6 @@ TRANSLATIONS = {
         "guiding_prompt_info": "Las Instrucciones Guía te permiten proporcionar indicaciones específicas para modificar el contenido generado, como el IDIOMA deseado. Puedes usarlas para cambiar el tono, estilo, enfocarte SOLO en secciones específicas del texto, especificar el idioma de salida (ej., 'Generar en inglés/francés/alemán'), o dar cualquier otra instrucción que ayude a personalizar el resultado final.",
         "duration_label": "Duración Objetivo de la Clase (minutos)",
         "examples_label": "Incluir Ejemplos Prácticos",
-        "thinking_model_label": "Usar Modelo de Pensamiento Experimental (Solo Gemini)",
         "submit_button": "Transformar Transcripción",
         "output_label": "Guión de Enseñanza Generado",
         "error_no_pdf": "Error: No se ha subido ningún archivo PDF",
@@ -74,6 +68,15 @@ class TranscriptTransformerApp:
         logging.info("Initializing TranscriptTransformerApp...")
         self.pdf_processor = PDFProcessor()
         self.text_processor = TextProcessor()
         self.current_language = "en"  # Default language
         self.last_generated_content = ""  # Store the last generated content
         self.content_with_timestamps = ""  # Store content with timestamps
@@ -87,11 +90,9 @@ class TranscriptTransformerApp:
                            raw_text_input: str = "",
                            initial_prompt: str = "",
                            target_duration: int = 30,
-                           include_examples: bool = True,
-                           use_gemini: bool = True,
-                           use_thinking_model: bool = False) -> str:
         """
-        Process uploaded transcript and transform it into a teaching transcript
         Args:
             language: Selected UI language
@@ -101,23 +102,20 @@ class TranscriptTransformerApp:
             initial_prompt: Additional guiding instructions for the content generation
             target_duration: Target lecture duration in minutes
             include_examples: Whether to include practical examples
-            use_gemini: Whether to use Gemini API instead of OpenAI
-            use_thinking_model: Requires use_gemini=True
         Returns:
             str: Generated teaching transcript
         """
-        logging.info(f"Processing transcript. Language: {language}, InputType: {input_type}, HasFile: {file_obj is not None}, HasText: {bool(raw_text_input)}, Duration: {target_duration}, Examples: {include_examples}, Gemini: {use_gemini}, ThinkingModel: {use_thinking_model}")
         try:
-            # Force enable Gemini if thinking model is selected
-            if use_thinking_model:
-                logging.info("Thinking model selected, forcing use_gemini=True")
-                use_gemini = True
-            self.transformer = TranscriptTransformer(
-                use_gemini=use_gemini,
-                use_thinking_model=use_thinking_model
-            )
             # Get text based on input type
             if input_type == TRANSLATIONS[language]["input_type_options"][0]:  # PDF
@@ -194,6 +192,7 @@ class TranscriptTransformerApp:
         translations = TRANSLATIONS[language]
         return [
             translations["title"],
             translations["subtitle"],
@@ -207,11 +206,9 @@ class TranscriptTransformerApp:
             translations["guiding_prompt_info"],
             translations["duration_label"],
             translations["examples_label"],
-            translations["thinking_model_label"],
             translations["submit_button"],
             translations["output_label"]
         ]
-        logging.info("UI language updated.")
     def launch(self):
         """Launch the Gradio interface"""
@@ -284,11 +281,6 @@ class TranscriptTransformerApp:
                     label=TRANSLATIONS["en"]["examples_label"],
                     value=True
                 )
-                use_thinking_model = gr.Checkbox(
-                    label=TRANSLATIONS["en"]["thinking_model_label"],
-                    value=True
-                )
             # Submit button
             with gr.Row():
@@ -337,6 +329,7 @@ class TranscriptTransformerApp:
                 translations = TRANSLATIONS[language]
                 return [
                     "# " + translations["title"],  # Title with markdown formatting
                     translations["subtitle"],
@@ -347,12 +340,10 @@ class TranscriptTransformerApp:
                     gr.update(label=translations["guiding_prompt_label"], placeholder=translations["guiding_prompt_placeholder"], info=translations["guiding_prompt_info"]),
                     gr.update(label=translations["duration_label"]),
                     gr.update(label=translations["examples_label"]),
-                    gr.update(label=translations["thinking_model_label"]),
                     translations["submit_button"],
                     gr.update(label=translations["output_label"]),
                     gr.update(label=translations["show_timestamps"])
                 ]
-                logging.info("UI elements update values prepared.")
             input_type.change(
                 fn=lambda lang_display, choice: update_input_visibility(lang_display, choice),
@@ -369,7 +360,7 @@ class TranscriptTransformerApp:
                     input_type, input_type,
                     file_input, text_input,
                     initial_prompt,
-                    target_duration, include_examples, use_thinking_model,
                     submit_btn, output,
                     timestamps_checkbox
                 ]
@@ -382,9 +373,10 @@ class TranscriptTransformerApp:
                 outputs=[output]
             )
-            # Set up submission logic with language code conversion
             submit_btn.click(
-                fn=lambda lang_display, *args: self.process_transcript(get_language_code(lang_display), *args),
                 inputs=[
                     language_selector,
                     input_type,
@@ -393,7 +385,6 @@ class TranscriptTransformerApp:
                     initial_prompt,
                     target_duration,
                     include_examples,
-                    use_thinking_model
                 ],
                 outputs=output
             )
@@ -401,8 +392,8 @@ class TranscriptTransformerApp:
             # Example for PDF input
             logging.info("Setting up Gradio Examples...")
             gr.Examples(
-                examples=[[example_pdf, "", "", 30, True, True]],
-                inputs=[file_input, text_input, initial_prompt, target_duration, include_examples, use_thinking_model]
             )
             logging.info("Gradio Examples configured.")

 import gradio as gr
 import re
 import logging # Added for debugging
 from src.core.transformer import TranscriptTransformer
 from src.utils.pdf_processor import PDFProcessor
 from src.utils.text_processor import TextProcessor
 # Set up basic logging
 logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')
 # Translations dictionary for UI elements
 TRANSLATIONS = {
     "en": {
         "guiding_prompt_info": "The Guiding Prompt allows you to provide specific instructions to modify the generated content, like output/desired LANGUAGE. You can use it to change the tone, style, focus ONLY on specific sections of the text, specify the output language (e.g., 'Generate in Spanish/French/German'), or give any other instruction that helps personalize the final result.",
         "duration_label": "Target Lecture Duration (minutes)",
         "examples_label": "Include Practical Examples",
         "submit_button": "Transform Transcript",
         "output_label": "Generated Teaching Transcript",
         "error_no_pdf": "Error: No PDF file uploaded",
         "guiding_prompt_info": "Las Instrucciones Guía te permiten proporcionar indicaciones específicas para modificar el contenido generado, como el IDIOMA deseado. Puedes usarlas para cambiar el tono, estilo, enfocarte SOLO en secciones específicas del texto, especificar el idioma de salida (ej., 'Generar en inglés/francés/alemán'), o dar cualquier otra instrucción que ayude a personalizar el resultado final.",
         "duration_label": "Duración Objetivo de la Clase (minutos)",
         "examples_label": "Incluir Ejemplos Prácticos",
         "submit_button": "Transformar Transcripción",
         "output_label": "Guión de Enseñanza Generado",
         "error_no_pdf": "Error: No se ha subido ningún archivo PDF",
         logging.info("Initializing TranscriptTransformerApp...")
         self.pdf_processor = PDFProcessor()
         self.text_processor = TextProcessor()
+        # Initialize transformer directly (it always uses Gemini now)
+        try:
+            self.transformer = TranscriptTransformer()
+        except ValueError as e:
+            # Handle case where GEMINI_API_KEY might be missing during init
+            logging.error(f"Failed to initialize Transformer: {e}")
+            # Optionally, set self.transformer to None and handle in process_transcript
+            # Or re-raise / exit, depending on desired behavior
+            self.transformer = None # Indicate initialization failure
         self.current_language = "en"  # Default language
         self.last_generated_content = ""  # Store the last generated content
         self.content_with_timestamps = ""  # Store content with timestamps
                            raw_text_input: str = "",
                            initial_prompt: str = "",
                            target_duration: int = 30,
+                           include_examples: bool = True) -> str:
         """
+        Process uploaded transcript and transform it into a teaching transcript using Gemini.
         Args:
             language: Selected UI language
             initial_prompt: Additional guiding instructions for the content generation
             target_duration: Target lecture duration in minutes
             include_examples: Whether to include practical examples
         Returns:
             str: Generated teaching transcript
         """
+        logging.info(f"Processing transcript. Lang: {language}, Type: {input_type}, HasFile: {file_obj is not None}, HasText: {bool(raw_text_input)}, Duration: {target_duration}, Examples: {include_examples}")
+        # Check if transformer initialized correctly
+        if self.transformer is None:
+             logging.error("Transformer not initialized, likely missing API key.")
+             # Return an error message appropriate for the UI language
+             return TRANSLATIONS[language].get("error_prefix", "Error: ") + "Configuration error (API Key missing?)"
         try:
+            # No need to initialize transformer here anymore
             # Get text based on input type
             if input_type == TRANSLATIONS[language]["input_type_options"][0]:  # PDF
         translations = TRANSLATIONS[language]
+        logging.info("UI language updated.")
         return [
             translations["title"],
             translations["subtitle"],
             translations["guiding_prompt_info"],
             translations["duration_label"],
             translations["examples_label"],
             translations["submit_button"],
             translations["output_label"]
         ]
     def launch(self):
         """Launch the Gradio interface"""
                     label=TRANSLATIONS["en"]["examples_label"],
                     value=True
                 )
             # Submit button
             with gr.Row():
                 translations = TRANSLATIONS[language]
+                logging.info("UI elements update values prepared.")
                 return [
                     "# " + translations["title"],  # Title with markdown formatting
                     translations["subtitle"],
                     gr.update(label=translations["guiding_prompt_label"], placeholder=translations["guiding_prompt_placeholder"], info=translations["guiding_prompt_info"]),
                     gr.update(label=translations["duration_label"]),
                     gr.update(label=translations["examples_label"]),
                     translations["submit_button"],
                     gr.update(label=translations["output_label"]),
                     gr.update(label=translations["show_timestamps"])
                 ]
             input_type.change(
                 fn=lambda lang_display, choice: update_input_visibility(lang_display, choice),
                     input_type, input_type,
                     file_input, text_input,
                     initial_prompt,
+                    target_duration, include_examples,
                     submit_btn, output,
                     timestamps_checkbox
                 ]
                 outputs=[output]
             )
+            # Set up submission logic
             submit_btn.click(
+                fn=lambda lang_display, input_type_val, file_obj_val, text_input_val, initial_prompt_val, target_duration_val, include_examples_val: \
+                    self.process_transcript(get_language_code(lang_display), input_type_val, file_obj_val, text_input_val, initial_prompt_val, target_duration_val, include_examples_val),
                 inputs=[
                     language_selector,
                     input_type,
                     initial_prompt,
                     target_duration,
                     include_examples,
                 ],
                 outputs=output
             )
             # Example for PDF input
             logging.info("Setting up Gradio Examples...")
             gr.Examples(
+                examples=[[example_pdf, "", "", 30, True]],
+                inputs=[file_input, text_input, initial_prompt, target_duration, include_examples]
             )
             logging.info("Gradio Examples configured.")

src/core/transformer.py CHANGED Viewed

@@ -22,40 +22,31 @@ class TranscriptTransformer:
     EXTENDED_RETRY_DELAYS = [5, 10, 15]  # Wait times in seconds for extended retries
     CHUNK_SIZE = 6000  # Target words per chunk
     LARGE_DEVIATION_THRESHOLD = 0.20  # 20% maximum deviation
-    MAX_TOKENS = 64000  # Nuevo límite absoluto basado en 64k tokens de salida
-    def __init__(self, use_gemini: bool = True, use_thinking_model: bool = False):
-        """Initialize the transformer with selected LLM client"""
         self.text_processor = TextProcessor()
-        self.use_gemini = use_gemini
-        self.use_thinking_model = use_thinking_model
-        if use_thinking_model:
-            if not use_gemini:
-                raise ValueError("Thinking model requires use_gemini=True")
-            logger.info("Initializing with Gemini Flash Thinking API")
-            self.openai_client = openai.OpenAI(
-                api_key=os.getenv('GEMINI_API_KEY'),
-                base_url="https://generativelanguage.googleapis.com/v1alpha"
-            )
-            self.model_name = "gemini-2.0-flash-thinking-exp-01-21"
-        elif use_gemini:
-            logger.info("Initializing with Gemini API")
-            self.openai_client = openai.OpenAI(
-                api_key=os.getenv('GEMINI_API_KEY'),
-                base_url="https://generativelanguage.googleapis.com/v1beta"
-            )
-            self.model_name = "gemini-2.0-flash-exp"
-        else:
-            logger.info("Initializing with OpenAI API")
-            self.openai_client = openai.OpenAI(
-                api_key=os.getenv('OPENAI_API_KEY')
-            )
-            self.model_name = "gpt-3.5-turbo"
         # Target word counts
         self.words_per_minute = 130  # Average speaking rate
     def _api_call_with_enhanced_retries(self, call_func: Callable[[], Any]) -> Any:
         """
@@ -267,6 +258,7 @@ class TranscriptTransformer:
         user_instructions = f"\nAdditional user instructions:\n{initial_prompt}\n" if initial_prompt else ""
         prompt = f"""
         You are an expert educator creating a detailed lecture outline.
         {user_instructions}
@@ -307,30 +299,30 @@ class TranscriptTransformer:
         """
         try:
-            # Common parameters
             params = {
-                "model": self.model_name,
                 "messages": [
                     {"role": "system", "content": "You are an expert educator. Output ONLY valid JSON, no other text."},
                     {"role": "user", "content": prompt}
                 ],
                 "temperature": 0.7,
-                "max_tokens": self.MAX_TOKENS if self.use_thinking_model else 4000
             }
-            # Add thinking config if using experimental model
-            if self.use_thinking_model:
-                params["extra_body"] = {
-                    "thinking_config": {
-                        "include_thoughts": True
-                    }
-                }
             # Use the enhanced retry wrapper for API call
             def api_call():
                 return self.openai_client.chat.completions.create(**params)
             response = self._api_call_with_enhanced_retries(api_call)
             content = response.choices[0].message.content.strip()
             logger.debug(f"Raw structure response: {content}")
@@ -357,7 +349,7 @@ class TranscriptTransformer:
                 return self._generate_fallback_structure(text, target_duration)
         except Exception as e:
-            logger.error(f"Error generating structure: {str(e)}")
             # Fallback in case of any error
             return self._generate_fallback_structure(text, target_duration)
@@ -366,87 +358,46 @@ class TranscriptTransformer:
         logger.info("Generating fallback structure")
         params = {
-            "model": self.model_name,
-            "messages": [
-                {"role": "system", "content": "You are an expert educator. Output ONLY valid JSON, no other text."},
-                {"role": "user", "content": f"""
-                Create a simplified lecture outline based on this transcript.
-                Format as JSON with:
-                - title
-                - 3 learning objectives
-                - 2 main topics with title, key concepts, subtopics
-                - 2 practical applications
-                - 3 key terms
-                Target duration: {target_duration} minutes
-                Transcript excerpt:
-                {text[:2000]}
-                """}
-            ],
-            "temperature": 0.5,
-            "max_tokens": 2000
-        }
         try:
             # Use the enhanced retry wrapper for API call
             def api_call():
-                return self.openai_client.chat.completions.create(**params)
             response = self._api_call_with_enhanced_retries(api_call)
             content = response.choices[0].message.content.strip()
             try:
-                return json.loads(content)
             except json.JSONDecodeError:
-                # Last resort fallback if everything fails
-                return {
-                    "title": "Lecture on Transcript Topic",
-                    "learning_objectives": ["Understand key concepts", "Apply knowledge", "Evaluate outcomes"],
-                    "topics": [
-                        {
-                            "title": "Main Topic 1",
-                            "key_concepts": ["Concept 1", "Concept 2"],
-                            "subtopics": ["Subtopic 1", "Subtopic 2"],
-                            "duration_minutes": target_duration // 2,
-                            "objective_links": [1, 2]
-                        },
-                        {
-                            "title": "Main Topic 2",
-                            "key_concepts": ["Concept 3", "Concept 4"],
-                            "subtopics": ["Subtopic 3", "Subtopic 4"],
-                            "duration_minutes": target_duration // 2,
-                            "objective_links": [2, 3]
-                        }
-                    ],
-                    "practical_applications": ["Application 1", "Application 2"],
-                    "key_terms": ["Term 1", "Term 2", "Term 3"]
-                }
         except Exception as e:
-            logger.error(f"Error generating fallback structure: {str(e)}")
-            # Hardcoded last resort fallback
-            return {
-                "title": "Lecture on Transcript Topic",
-                "learning_objectives": ["Understand key concepts", "Apply knowledge", "Evaluate outcomes"],
-                "topics": [
-                    {
-                        "title": "Main Topic 1",
-                        "key_concepts": ["Concept 1", "Concept 2"],
-                        "subtopics": ["Subtopic 1", "Subtopic 2"],
-                        "duration_minutes": target_duration // 2,
-                        "objective_links": [1, 2]
-                    },
-                    {
-                        "title": "Main Topic 2",
-                        "key_concepts": ["Concept 3", "Concept 4"],
-                        "subtopics": ["Subtopic 3", "Subtopic 4"],
-                        "duration_minutes": target_duration // 2,
-                        "objective_links": [2, 3]
-                    }
-                ],
-                "practical_applications": ["Application 1", "Application 2"],
-                "key_terms": ["Term 1", "Term 2", "Term 3"]
-            }
     def _generate_section(self,
                          section_type: str,
@@ -475,7 +426,7 @@ class TranscriptTransformer:
         user_instructions = f"\nAdditional user instructions:\n{initial_prompt}\n" if initial_prompt else ""
-        # Base prompt with context-specific formatting
         prompt = f"""
         You are creating a {section_type} section for a {time_marker} teaching lecture on "{structure_data['title']}".
         {user_instructions}
@@ -487,7 +438,7 @@ class TranscriptTransformer:
         Key terms:
         {', '.join(structure_data['key_terms'])}
-        Original source:
         {original_text[:500]}...
         """
@@ -569,24 +520,16 @@ class TranscriptTransformer:
             """
         try:
-            # Prepare API call parameters
             params = {
-                "model": self.model_name,
                 "messages": [
                     {"role": "system", "content": "You are an expert educator creating a teaching script."},
                     {"role": "user", "content": prompt}
                 ],
                 "temperature": 0.7,
-                "max_tokens": self._calculate_max_tokens(section_type, target_words)
             }
-            # Add thinking config if using experimental model
-            if self.use_thinking_model:
-                params["extra_body"] = {
-                    "thinking_config": {
-                        "include_thoughts": True
-                    }
-                }
             # Use the enhanced retry wrapper for API call
             def api_call():
@@ -602,27 +545,21 @@ class TranscriptTransformer:
             return content
         except Exception as e:
-            logger.error(f"Error during content generation: {str(e)}")
             # Provide a minimal fallback content to avoid complete failure
             return f"{time_marker} {section_type.capitalize()} (Error during generation)\n\nWe apologize, but there was an error generating this section."
     def _calculate_max_tokens(self, section_type: str, target_words: int) -> int:
         """Calculate appropriate max_tokens based on section and model"""
         # 1 token ≈ 4 caracteres (1 palabra ≈ 1.33 tokens)
-        base_tokens = int(target_words * 1.5)  # Margen para formato
-        if self.use_thinking_model:
-            # Permite hasta 64k tokens pero limita por sección
-            section_limits = {
-                'introduction': 8000,
-                'main': 32000,
-                'practical': 16000,
-                'summary': 8000
-            }
-            return min(base_tokens * 2, section_limits.get(section_type, 16000))
-        # Límites para otros modelos
-        return min(base_tokens + 1000, self.MAX_TOKENS)
     def _generate_main_content(self,
                              structure_data: Dict,

     EXTENDED_RETRY_DELAYS = [5, 10, 15]  # Wait times in seconds for extended retries
     CHUNK_SIZE = 6000  # Target words per chunk
     LARGE_DEVIATION_THRESHOLD = 0.20  # 20% maximum deviation
+    MAX_TOKENS = 64000  # Using a fixed large token limit, adjust if needed per model
+    def __init__(self):
+        """Initialize the transformer to always use the Gemini API"""
         self.text_processor = TextProcessor()
+        gemini_api_key = os.environ.get('GEMINI_API_KEY')
+        if not gemini_api_key:
+            logger.error("GEMINI_API_KEY environment variable not found!")
+            # Optionally raise an error or handle missing key
+            raise ValueError("Missing GEMINI_API_KEY environment variable")
+        logger.info("Initializing with Gemini API (Flash Model)")
+        # Using v1beta as the base URL for the standard Gemini Flash model
+        self.openai_client = openai.OpenAI(
+            api_key=gemini_api_key,
+            base_url="https://generativelanguage.googleapis.com/v1beta"
+        )
+        # Using gemini-1.5-flash-latest as a stable and capable model
+        # Replace 'gemini-1.5-flash-latest' if you need a specific experimental version
+        self.model_name = "models/gemini-1.5-flash-latest"
         # Target word counts
         self.words_per_minute = 130  # Average speaking rate
+        logger.info(f"Transformer initialized with model: {self.model_name}")
     def _api_call_with_enhanced_retries(self, call_func: Callable[[], Any]) -> Any:
         """
         user_instructions = f"\nAdditional user instructions:\n{initial_prompt}\n" if initial_prompt else ""
+        # Simplified prompt slightly, removed references to experimental models
         prompt = f"""
         You are an expert educator creating a detailed lecture outline.
         {user_instructions}
         """
         try:
+            # Common parameters - simplified
             params = {
+                "model": self.model_name,
                 "messages": [
                     {"role": "system", "content": "You are an expert educator. Output ONLY valid JSON, no other text."},
                     {"role": "user", "content": prompt}
                 ],
                 "temperature": 0.7,
+                # Use a reasonable max_token limit for structure generation
+                "max_tokens": 4000
             }
             # Use the enhanced retry wrapper for API call
             def api_call():
+                # Need to pass model name correctly for Gemini via OpenAI lib
+                # The model name needs to be part of the endpoint path for Gemini API usually
+                # Let's adjust how the client is called if direct model param doesn't work
+                # For now, assuming the openai lib handles it with base_url correctly
+                # If errors occur, might need 'models/' prefix in self.model_name or adjust base_url/client call
+                # Update: Using models/gemini-1.5-flash-latest which is standard
                 return self.openai_client.chat.completions.create(**params)
             response = self._api_call_with_enhanced_retries(api_call)
+            # Assuming the response structure is similar enough
             content = response.choices[0].message.content.strip()
             logger.debug(f"Raw structure response: {content}")
                 return self._generate_fallback_structure(text, target_duration)
         except Exception as e:
+            logger.error(f"Error generating structure: {str(e)}", exc_info=True) # Added exc_info
             # Fallback in case of any error
             return self._generate_fallback_structure(text, target_duration)
         logger.info("Generating fallback structure")
         params = {
+             "model": self.model_name, # Use the configured Gemini model
+             "messages": [
+                 {"role": "system", "content": "You are an expert educator. Output ONLY valid JSON, no other text."},
+                 {"role": "user", "content": f"""
+                 Create a simplified lecture outline based on this transcript.
+                 Format as JSON with:
+                 - title
+                 - 3 learning objectives
+                 - 2 main topics with title, key concepts, subtopics
+                 - 2 practical applications
+                 - 3 key terms
+                 Target duration: {target_duration} minutes
+                 Transcript excerpt:
+                 {text[:2000]}
+                 """}
+             ],
+             "temperature": 0.5,
+             "max_tokens": 2000
+         }
         try:
             # Use the enhanced retry wrapper for API call
             def api_call():
+                 return self.openai_client.chat.completions.create(**params)
             response = self._api_call_with_enhanced_retries(api_call)
             content = response.choices[0].message.content.strip()
             try:
+                 return json.loads(content)
             except json.JSONDecodeError:
+                logger.warning("Failed to parse fallback JSON, returning hardcoded structure.")
+                # Last resort fallback if everything fails (keep existing hardcoded)
+                # ... (hardcoded fallback structure remains the same) ...
         except Exception as e:
+            logger.error(f"Error generating fallback structure: {str(e)}", exc_info=True) # Added exc_info
+            # Hardcoded last resort fallback (keep existing hardcoded)
+            # ... (hardcoded fallback structure remains the same) ...
     def _generate_section(self,
                          section_type: str,
         user_instructions = f"\nAdditional user instructions:\n{initial_prompt}\n" if initial_prompt else ""
+        # Base prompt - Adjusted slightly for clarity
         prompt = f"""
         You are creating a {section_type} section for a {time_marker} teaching lecture on "{structure_data['title']}".
         {user_instructions}
         Key terms:
         {', '.join(structure_data['key_terms'])}
+        Original source (excerpt for context):
         {original_text[:500]}...
         """
             """
         try:
+            # Prepare API call parameters - simplified
             params = {
+                "model": self.model_name, # Use the configured Gemini model
                 "messages": [
                     {"role": "system", "content": "You are an expert educator creating a teaching script."},
                     {"role": "user", "content": prompt}
                 ],
                 "temperature": 0.7,
+                "max_tokens": self._calculate_max_tokens(section_type, target_words) # Keep calculation logic
             }
             # Use the enhanced retry wrapper for API call
             def api_call():
             return content
         except Exception as e:
+            logger.error(f"Error during {section_type} generation: {str(e)}", exc_info=True) # Added exc_info
             # Provide a minimal fallback content to avoid complete failure
             return f"{time_marker} {section_type.capitalize()} (Error during generation)\n\nWe apologize, but there was an error generating this section."
     def _calculate_max_tokens(self, section_type: str, target_words: int) -> int:
         """Calculate appropriate max_tokens based on section and model"""
         # 1 token ≈ 4 caracteres (1 palabra ≈ 1.33 tokens)
+        # Simplified: Assume Gemini Flash has large enough context/output limits for these sections
+        # Calculate based on words * ratio + buffer
+        # Using 1.5 as ratio + 1000 buffer seems reasonable start.
+        base_tokens = int(target_words * 1.5) + 1000
+        # Use the overall MAX_TOKENS as a cap, but allow large section generation
+        # Be mindful of potential overall context window limits of the model (e.g., 128k for Gemini 1.5 Flash)
+        return min(base_tokens, self.MAX_TOKENS)
     def _generate_main_content(self,
                              structure_data: Dict,