Spaces:

renesistech
/

Notes

Build error

File size: 31,774 Bytes

8aab118
 
 
 
 
 
bf21cca
8aab118
d3a14d0
8aab118
 
 
d3a14d0
 
08d62e8
 
8aab118
d3a14d0
8aab118
d3a14d0
 
8aab118
 
fce9899
8aab118
 
 
 
8e14ee9
e93bec0
 
 
 
8aab118
 
 
 
e637f4b
 
d3a14d0
ed5865d
d3a14d0
8aab118
6d1370d
 
08d62e8
97c9b4f
 
6d1370d
 
 
 
8aab118
 
 
fce9899
d3a14d0
 
 
 
 
 
e637f4b
 
 
d3a14d0
e637f4b
d3a14d0
 
e93bec0
d3a14d0
 
e637f4b
d3a14d0
 
 
 
 
 
2f296a0
e637f4b
 
d3a14d0
 
 
 
 
 
 
 
 
8aab118
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6af84c5
8aab118
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
fce9899
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6d1370d
 
fce9899
 
 
 
d3a14d0
 
ebc9357
8aab118
d3a14d0
 
8aab118
d3a14d0
 
8aab118
d3a14d0
 
 
 
e637f4b
d3a14d0
8aab118
 
d3a14d0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
8aab118
d3a14d0
 
ebc9357
d3a14d0
ebc9357
e637f4b
8aab118
ebc9357
8aab118
 
d3a14d0
 
 
 
 
 
 
 
 
 
 
8aab118
d3a14d0
8aab118
d3a14d0
 
 
 
 
 
 
 
 
 
 
 
 
 
8aab118
ebc9357
8aab118
 
e637f4b
 
8aab118
 
 
 
bf21cca
2f4c18b
 
8aab118
 
bf21cca
 
 
2f4c18b
 
8aab118
 
 
2f4c18b
08d62e8
8aab118
 
 
6d1370d
08d62e8
2f4c18b
8aab118
2f4c18b
 
 
 
 
 
 
 
 
 
 
 
 
 
 
8aab118
 
2f4c18b
8aab118
2f4c18b
8aab118
 
 
 
2f4c18b
8aab118
 
 
2f4c18b
 
 
8aab118
 
 
 
2f4c18b
8aab118
2f4c18b
 
 
 
 
 
8aab118
 
 
2f4c18b
8aab118
 
2f4c18b
8aab118
2f4c18b
8aab118
 
 
 
 
 
e637f4b
8aab118
 
2f4c18b
8aab118
 
 
 
 
 
 
 
 
 
 
 
 
 
bf21cca
 
2f4c18b
 
 
 
bf21cca
8aab118
bf21cca
8aab118
bf21cca
 
 
 
 
 
2f4c18b
 
8aab118
 
 
 
 
 
 
 
 
 
2f4c18b
8aab118
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2f4c18b
8aab118
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
08d62e8
 
8aab118
fce9899
 
 
 
 
8aab118
 
e637f4b
 
 
fce9899
e637f4b
 
 
fce9899
e637f4b
 
8aab118
 
 
 
d3a14d0
 
8aab118
d3a14d0
 
8aab118
d3a14d0
 
 
 
8aab118
d3a14d0
 
8aab118
d3a14d0
 
6d1370d
d3a14d0
 
 
 
 
8aab118
d3a14d0
 
 
 
08d62e8
d3a14d0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
8aab118
 
d3a14d0
 
 
 
 
8aab118
 
 
 
 
 
 
 
 
 
 
 
 
 
d3a14d0
 
 
6d1370d
d3a14d0
 
 
 
 
8aab118
d3a14d0
 
 
08d62e8
d3a14d0
8aab118
d3a14d0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
fce9899
d3a14d0
 
8aab118
 
d3a14d0
 
 
 
8aab118
 
 
d3a14d0
 
 
8aab118
 
 
 
 
 
 
 
6d1370d
d3a14d0
 
 
 
 
 
 
 
8aab118
08d62e8
d3a14d0
8aab118
d3a14d0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
8aab118
 
 
 
 
 
 
 
 
 
d3a14d0
 
 
 
 
8aab118
 
 
 
 
08d62e8
8aab118

import functools
import json
import os
import tempfile
import time
from datetime import datetime
from io import BytesIO
from typing import Any, Dict, Optional

import numpy as np
import requests
import streamlit as st
from dotenv import load_dotenv
from groq import Groq
from md2pdf.core import md2pdf
from requests.exceptions import RequestException
from st_audiorec import st_audiorec  # Import the audio recorder component

from download import download_video_audio, delete_download

# Upper bound for audio sent to transcription: 40 MiB, expressed in bytes
MAX_FILE_SIZE = 40 * 1024 * 1024
# User-facing text for the oversized-download error path
FILE_TOO_LARGE_MESSAGE = "File too large. Maximum size is 40MB."

# Load variables from a local .env file (if one exists) into the process environment.
# NOTE(review): Hugging Face Space secrets are presumably already exposed as
# environment variables, in which case os.environ below picks them up - confirm.
load_dotenv()

# Initialize session states (each key is created once per browser session)
if 'api_key' not in st.session_state:
    st.session_state.api_key = os.environ.get("GROQ_API_KEY", "")
    if not st.session_state.api_key:
        # Fall back to Streamlit's secrets store. Reading st.secrets raises when
        # no secrets file is configured; that must not crash the script here,
        # because main() reports a missing key with a friendlier message.
        try:
            if "GROQ_API_KEY" in st.secrets:
                st.session_state.api_key = st.secrets["GROQ_API_KEY"]
        except FileNotFoundError:
            pass

if 'transcript' not in st.session_state:
    st.session_state.transcript = ""

if 'groq_client' not in st.session_state:
    st.session_state.groq_client = None

if 'transcription_error' not in st.session_state:
    st.session_state.transcription_error = None

# Set page configuration
st.set_page_config(
    page_title="NoteME",
    page_icon="🧙‍♂️",
    layout="wide",
    initial_sidebar_state="expanded"
)

# Fixed model selections
# Chat-completion model id passed to Groq when generating notes
LLM_MODEL: str = "deepseek-r1-distill-llama-70b"

# Configure retry parameters without backoff library
# These are the defaults of retry_with_exponential_backoff(); waits are in seconds.
MAX_RETRIES: int = 5      # maximum number of attempts (default for max_tries)
INITIAL_WAIT: float = 0.5  # starting backoff delay (default for initial_wait)
MAX_WAIT: int = 30        # ceiling for the backoff delay (default for max_wait)

# Build and validate the Groq client used by the rest of the app
def initialize_groq_client(api_key: str) -> Optional[Groq]:
    """Create a Groq client and verify the key with a model-listing call.

    Args:
        api_key: Groq API key; an empty value short-circuits to ``None``.

    Returns:
        The ready-to-use client, or ``None`` when the key is empty or the
        validation call fails (the failure is shown via ``st.error``).
    """
    if not api_key:
        return None

    try:
        groq_client = Groq(api_key=api_key)
        # Listing models is a cheap request that fails fast on a bad key
        groq_client.models.list()
        return groq_client
    except Exception as exc:
        details = str(exc)
        # The status code is recognised by looking for it in the error text
        if "401" in details:
            user_message = "❌ Invalid API key: Authentication failed"
        elif "403" in details:
            user_message = "❌ API key doesn't have permission to access Groq API"
        else:
            user_message = f"❌ Failed to initialize Groq client: {details}"
        st.error(user_message)
        return None

# Application-level error type for failures talking to Groq
class GroqAPIError(Exception):
    """Raised for Groq API failures.

    Attributes:
        message: Human-readable description (also the exception's only arg).
        status_code: HTTP status associated with the failure, if known.
        response: Raw response object associated with the failure, if any.
    """

    def __init__(self, message, status_code=None, response=None):
        super().__init__(message)
        self.message, self.status_code, self.response = message, status_code, response

class GenerationStatistics:
    """Timing and token counters for one (or several accumulated) generations.

    All values are supplied by the caller; times are in seconds. ``__str__``
    renders the counters as a markdown summary table.
    """

    # Numeric fields that add() accumulates (model_name is intentionally excluded)
    _ADDITIVE_FIELDS = ("input_time", "output_time", "input_tokens", "output_tokens", "total_time")

    def __init__(self, input_time=0, output_time=0, input_tokens=0, output_tokens=0, total_time=0, model_name=LLM_MODEL):
        self.input_time = input_time
        self.output_time = output_time
        self.input_tokens = input_tokens
        self.output_tokens = output_tokens
        self.total_time = total_time
        self.model_name = model_name

    def get_input_speed(self):
        """Return input tokens per second, or 0 when no input time was recorded."""
        return self.input_tokens / self.input_time if self.input_time != 0 else 0

    def get_output_speed(self):
        """Return output tokens per second, or 0 when no output time was recorded."""
        return self.output_tokens / self.output_time if self.output_time != 0 else 0

    def add(self, other):
        """Accumulate the counters of another GenerationStatistics into this one.

        Raises:
            TypeError: If ``other`` is not a GenerationStatistics.
        """
        if not isinstance(other, GenerationStatistics):
            raise TypeError("Can only add GenerationStatistics objects")
        for field in self._ADDITIVE_FIELDS:
            setattr(self, field, getattr(self, field) + getattr(other, field))

    def __str__(self):
        token_sum = self.input_tokens + self.output_tokens
        overall_speed = token_sum / self.total_time if self.total_time != 0 else 0
        rows = [
            "",  # the rendered text starts with a blank line
            f"## {self.get_output_speed():.2f} T/s ⚡",
            f"Round trip time: {self.total_time:.2f}s Model: {self.model_name}",
            "",
            "| Metric | Input | Output | Total |",
            "|-----------------|----------------|-----------------|----------------|",
            f"| Speed (T/s) | {self.get_input_speed():.2f} | {self.get_output_speed():.2f} | {overall_speed:.2f} |",
            f"| Tokens | {self.input_tokens} | {self.output_tokens} | {token_sum} |",
            f"| Inference Time (s) | {self.input_time:.2f} | {self.output_time:.2f} | {self.total_time:.2f} |",
        ]
        return "\n".join(rows)

class NoteSection:
    """Holds the text of each note section and the Streamlit slots that show it.

    ``structure`` is a (possibly nested) dict whose keys are section titles;
    a dict value denotes sub-sections. Every title, at any depth, gets an
    entry in ``contents`` (its text) and ``placeholders`` (an ``st.empty()``).
    """

    def __init__(self, structure, transcript):
        self.structure = structure
        titles = self.flatten_structure(structure)
        self.contents = dict.fromkeys(titles, "")
        # One placeholder per title, created in document order
        self.placeholders = {title: st.empty() for title in titles}

        with st.expander("Raw Transcript", expanded=False):
            st.markdown(transcript)

    def flatten_structure(self, structure):
        """Return all titles in depth-first order (parent before its children)."""
        titles = []
        for heading, children in structure.items():
            titles.append(heading)
            if isinstance(children, dict):
                titles += self.flatten_structure(children)
        return titles

    def update_content(self, title, new_content):
        """Append text to a section and refresh its placeholder."""
        try:
            self.contents[title] = self.contents[title] + new_content
            self.display_content(title)
        except TypeError as err:
            st.error(f"Error updating content: {err}")

    def display_content(self, title):
        """Render a section into its placeholder unless its text is blank."""
        body = self.contents[title]
        if not body.strip():
            return
        self.placeholders[title].markdown(f"## {title}\n{body}")

    def return_existing_contents(self, level=1) -> str:
        """Return the non-blank sections as markdown, top level at ``level`` hashes."""
        # Same traversal as get_markdown_content, rooted at the full structure
        return self.get_markdown_content(self.structure, level)

    def display_structure(self, structure=None, level=1):
        """Render every non-blank section, with heading depth following nesting."""
        nodes = self.structure if structure is None else structure
        for heading, children in nodes.items():
            body = self.contents[heading]
            if body.strip():
                st.markdown(f"{'#' * level} {heading}")
                self.placeholders[heading].markdown(body)
            if isinstance(children, dict):
                self.display_structure(children, level + 1)

    def display_toc(self, structure, columns, level=1, col_index=0):
        """Write titles as a bulleted list, cycling through ``columns``.

        Returns:
            The column index to use for the next entry.
        """
        column_count = len(columns)
        for heading, children in structure.items():
            with columns[col_index % column_count]:
                st.markdown(f"{' ' * (level-1) * 2}- {heading}")
            col_index += 1
            if isinstance(children, dict):
                col_index = self.display_toc(children, columns, level + 1, col_index)
        return col_index

    def get_markdown_content(self, structure=None, level=1):
        """Return the non-blank sections of ``structure`` as one markdown string."""
        nodes = self.structure if structure is None else structure
        pieces = []
        for heading, children in nodes.items():
            body = self.contents[heading]
            if body.strip():
                pieces.append(f"{'#' * level} {heading}\n{body}\n\n")
            if isinstance(children, dict):
                pieces.append(self.get_markdown_content(children, level + 1))
        return "".join(pieces)

# Manual implementation of retry logic (replacing backoff library)

# Statuses for which repeating the identical request cannot succeed
# (bad request, auth/permission failure, not found, payload too large, unprocessable)
_NON_RETRYABLE_STATUS_CODES = frozenset({400, 401, 403, 404, 413, 422})


def retry_with_exponential_backoff(max_tries=MAX_RETRIES, initial_wait=INITIAL_WAIT, max_wait=MAX_WAIT):
    """Build a decorator that retries a call with exponential backoff and jitter.

    Only ``RequestException`` and ``GroqAPIError`` trigger a retry; any other
    exception propagates immediately. An error that carries a ``status_code``
    listed in ``_NON_RETRYABLE_STATUS_CODES`` is re-raised without retrying.

    Args:
        max_tries: Maximum number of attempts. With a value below 1 the
            wrapped function is never called and the wrapper returns ``None``.
        initial_wait: Delay in seconds before the first retry.
        max_wait: Upper bound in seconds for the (pre-jitter) delay.

    Returns:
        A decorator; the decorated function returns whatever the wrapped
        function returns, or re-raises the last error once attempts run out.
    """
    def decorator(func):
        @functools.wraps(func)  # keep the wrapped function's name and docstring
        def wrapper(*args, **kwargs):
            wait = min(initial_wait, max_wait)

            for attempt in range(1, max_tries + 1):
                try:
                    return func(*args, **kwargs)
                except (RequestException, GroqAPIError) as e:
                    status_code = getattr(e, "status_code", None)
                    if attempt == max_tries or status_code in _NON_RETRYABLE_STATUS_CODES:
                        raise

                    # Add some jitter (±20%)
                    jitter = wait * 0.4 * (np.random.random() - 0.5)

                    # Inform user of retry attempt
                    st.info(f"Retrying transcription... (Attempt {attempt}/{max_tries})")
                    time.sleep(wait + jitter)

                    # Double the delay for the next round, capped at max_wait
                    wait = min(wait * 2, max_wait)

            return None  # Only reachable when max_tries < 1
        return wrapper
    return decorator

def _to_groq_api_error(exc):
    """Translate an arbitrary failure of the transcription call into a GroqAPIError.

    An integer ``status_code`` attribute on ``exc`` is used when present;
    otherwise the known status codes are searched for in the error text.
    """
    error_msg = str(exc)
    status_code = getattr(exc, "status_code", None)
    if not isinstance(status_code, int):
        # Fallback: same codes, same precedence as the message-based checks
        status_code = next(
            (code for code in (401, 429, 413, 500, 502, 503, 504) if str(code) in error_msg),
            None,
        )

    if status_code == 401:
        return GroqAPIError("Authentication failed. Please check your API key.", 401)
    if status_code == 429:
        return GroqAPIError("Rate limit exceeded. Please try again later.", 429)
    if status_code == 413:
        return GroqAPIError("Audio file too large for processing.", 413)
    if status_code in (500, 502, 503, 504):
        return GroqAPIError("Groq server error. Please try again later.", status_code)
    # Anything else is reported verbatim for consistent handling by callers
    return GroqAPIError(f"Error transcribing audio: {error_msg}", status_code)


@retry_with_exponential_backoff()
def transcribe_audio_with_groq(audio_data) -> str:
    """
    Transcribe audio using Groq's whisper-large-v3-turbo model

    Args:
        audio_data: Either file path string or binary audio data. Binary data
            is written to a temporary ``.wav`` file for the duration of the call.

    Returns:
        Transcribed text

    Raises:
        GroqAPIError: For API-related errors (including an empty transcription)
        ValueError: For invalid input (no client, missing file, file over the
            size limit)
    """
    if not st.session_state.groq_client:
        raise ValueError("Groq client is not initialized. Please check your API key.")

    temp_path = None              # set only when this call created a temp file
    progress_placeholder = None   # set once the progress message is shown
    try:
        # Save audio data to a temporary file if it's binary data
        if isinstance(audio_data, bytes):
            with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as tmp_file:
                temp_path = tmp_file.name
                tmp_file.write(audio_data)
            audio_file_path = temp_path
        else:
            # Assume it's a file path
            audio_file_path = audio_data
            if not os.path.exists(audio_file_path):
                raise ValueError(f"Audio file not found: {audio_file_path}")

        # Check file size before sending
        file_size = os.path.getsize(audio_file_path)
        if file_size > MAX_FILE_SIZE:
            raise ValueError(f"Audio file size ({file_size/1048576:.2f}MB) exceeds 40MB limit")

        with open(audio_file_path, "rb") as file:
            audio_bytes = file.read()

        # Display a progress message since transcription can take time
        progress_placeholder = st.empty()
        progress_placeholder.info("Processing audio with whisper-large-v3-turbo...")

        transcription = st.session_state.groq_client.audio.transcriptions.create(
            file=(audio_file_path, audio_bytes),
            model="whisper-large-v3-turbo",
            response_format="verbose_json"
        )

        if not getattr(transcription, "text", None):
            raise GroqAPIError("Empty transcription result returned")

        return transcription.text

    except (ValueError, GroqAPIError):
        # Already in the form callers expect; do not re-wrap
        raise
    except Exception as e:
        raise _to_groq_api_error(e) from e
    finally:
        # Runs on success and failure alike so nothing is left behind
        if progress_placeholder is not None:
            progress_placeholder.empty()
        if temp_path is not None and os.path.exists(temp_path):
            os.unlink(temp_path)


def _match_section_heading(line, known_titles):
    """Return the known section title named by a markdown heading line, else None.

    A line counts as a heading when it starts with ``#`` (after stripping
    whitespace). Surrounding ``*`` emphasis and a trailing ``:`` are ignored,
    so ``## **Next Steps:**`` matches the title ``Next Steps``.
    """
    stripped = line.strip()
    if not stripped.startswith("#"):
        return None
    candidate = stripped.lstrip("#").strip().strip("*").rstrip(":").strip()
    return candidate if candidate in known_titles else None


def _route_note_line(note_section, line, target, known_titles, container_titles):
    """File one line of model output and return the section that is now active.

    A heading that names a known section switches the active section and is
    not stored (the title is re-added when notes are rendered). A heading for
    a container section (one that only holds sub-sections) leaves no section
    active. Any other line is appended to the active section, if there is one.
    """
    heading = _match_section_heading(line, known_titles)
    if heading is None:
        if target is not None:
            note_section.update_content(target, line)
        return target
    return None if heading in container_titles else heading


def process_transcript(transcript):
    """Process transcript with Groq's DeepSeek model for highly structured notes

    The model's streamed answer is split into lines; each line is filed under
    the section named by the most recent recognised heading. Text that arrives
    before the first recognised heading is discarded. Sections refresh on
    screen once per completed line.

    Args:
        transcript: Text to turn into notes; embedded verbatim in the prompt.

    Returns:
        The populated NoteSection, or None when no Groq client is available
        or the request fails (the problem is reported via ``st.error``).
    """
    if not st.session_state.groq_client:
        st.error("Groq client is not initialized. Please check your API key.")
        return None
    
    # Enhanced structure for better organization
    structure = {
        "Executive Summary": "",
        "Main Agenda": "",
        "Points Discussed": "",
        "Key Insights": "",
        "Questions & Considerations": "",
        "Detailed Analysis": {
            "Context & Background": "",
            "Supporting Evidence": "",
        },
        "Next Steps": ""
    }
    
    prompt = f"""
    You are an expert meeting notes organizer with exceptional skills in creating structured, clear, and comprehensive notes.
    Please analyze the following transcript and transform it into organized meeting notes in the same language as the Transcript ensuring Clarity:

    ```
    {transcript}
    ```
    
    Create a professional meeting notes document with the following specific sections:

    # Executive Summary
    - Provide a concise 3-5 sentence overview of the meeting purpose and key outcomes
    - Use clear, direct language focused on the most important takeaways
    
    # Main Agenda
    - Extract and list the primary agenda items that were discussed in the meeting
    - Format as a numbered or bulleted list
    - Include time allocations or priority levels if mentioned in the transcript
    
    # Points Discussed
    - Provide a comprehensive breakdown of what was discussed for each agenda item
    - Use subheadings for each major topic
    - Include who raised specific points when identifiable
    - Organize chronologically as they appeared in the discussion
    
    # Key Insights
    - Extract 5-7 critical insights as bullet points
    - Each insight should be **bolded** and followed by 1-2 supporting sentences
    - Organize these insights in order of importance
    
    # Questions & Considerations
    - List all questions raised during the discussion
    - Include concerns or areas needing further exploration
    - For each question, provide brief context explaining why it matters
    
    # Detailed Analysis
    
    ## Context & Background
    - Summarize relevant background information necessary to understand the discussion
    - Explain the context in which the meeting took place
    - Include references to prior meetings or decisions if mentioned
    
    ## Supporting Evidence
    - Create a table summarizing any data, evidence, or examples mentioned
    - Include source information when available
    - Format data clearly using markdown tables when appropriate
    
    # Next Steps
    - Create a table with these columns: Action | Owner/Responsible Party | Timeline | Priority
    - List all tasks, assignments, follow-up items, and decisions made
    - If information is not explicitly stated, indicate with "Not specified"
    - Include any deadlines or important dates mentioned
    - This section should be comprehensive, capturing ALL action items from the meeting

    Make extensive use of markdown formatting:
    - Use tables for structured information
    - Use **bold** for emphasis on important points
    - Use bullet points and numbered lists for clarity
    - Use headings and subheadings to organize content
    - Include blockquotes for direct citations with > symbol

    Your notes should be professional, comprehensive yet concise, focusing on extracting the maximum value from the transcript.
    """
    
    try:
        stats = GenerationStatistics(model_name=LLM_MODEL)
        start_time = time.time()
        
        response = st.session_state.groq_client.chat.completions.create(
            messages=[{"role": "user", "content": prompt}],
            model=LLM_MODEL,
            temperature=0.2,  # Slightly lower temperature for more consistent structure
            max_tokens=4096,
            top_p=0.95,
            stream=True
        )
        
        # Time until the stream object is returned
        input_time = time.time() - start_time
        stats.input_time = input_time
        
        note_section = NoteSection(structure, transcript)
        known_titles = set(note_section.contents)
        # Top-level sections that only group sub-sections take no text themselves
        container_titles = {
            title for title, children in structure.items() if isinstance(children, dict)
        }
        
        target = None   # section currently receiving text
        pending = ""    # trailing text of the stream that has no newline yet
        
        for chunk in response:
            if not chunk.choices:
                continue  # nothing to read from a chunk without choices
            content = getattr(chunk.choices[0].delta, "content", None)
            if content is None:
                continue
            
            # Work on whole lines so a heading split across chunks is seen intact
            pending += content
            *complete_lines, pending = pending.split("\n")
            for line in complete_lines:
                target = _route_note_line(
                    note_section, line + "\n", target, known_titles, container_titles
                )
        
        # The last line of the answer may not end with a newline
        if pending:
            _route_note_line(note_section, pending, target, known_titles, container_titles)
        
        output_time = time.time() - start_time - input_time
        stats.output_time = output_time
        stats.total_time = time.time() - start_time
        
        # Display statistics in expandable section
        with st.expander("Generation Statistics", expanded=False):
            st.markdown(str(stats))
        
        return note_section
        
    except Exception as e:
        # UI boundary: report the failure instead of crashing the page
        st.error(f"Error processing transcript: {e}")
        return None


def export_notes(notes, format="markdown"):
    """Offer the notes as a download in the requested format.

    Args:
        notes: Object exposing ``get_markdown_content()``.
        format: ``"markdown"`` or ``"pdf"``; any other value does nothing.
    """
    if format == "markdown":
        payload = notes.get_markdown_content()
        label, extension, mime = "Download Markdown", "md", "text/markdown"
    elif format == "pdf":
        markdown_text = notes.get_markdown_content()
        # Render the markdown into an in-memory PDF and rewind it for reading
        payload = BytesIO()
        md2pdf(payload, markdown_text)
        payload.seek(0)
        label, extension, mime = "Download PDF", "pdf", "application/pdf"
    else:
        return

    # File name carries a timestamp taken when the download button is created
    stamp = datetime.now().strftime('%Y%m%d_%H%M%S')
    st.download_button(
        label=label,
        data=payload,
        file_name=f"notes_{stamp}.{extension}",
        mime=mime
    )

def _show_transcription_hint(error_text):
    """Show a follow-up tip for the transcription errors that have a known remedy."""
    if "Audio file too large" in error_text or "exceeds" in error_text:
        st.info("💡 Try trimming your audio file or uploading a shorter segment.")
    elif "API key" in error_text or "Authentication" in error_text:
        st.info("💡 Check that your Groq API key is correct in your Hugging Face Space settings.")
    elif "Rate limit" in error_text:
        st.info("💡 You've hit Groq's rate limits. Please wait a few minutes before trying again.")


def _transcribe_and_store(audio, source):
    """Transcribe audio, show the transcript, and remember it in session state.

    Args:
        audio: File path or raw bytes, passed to ``transcribe_audio_with_groq``.
        source: Input method that produced the audio; stored next to the
            transcript so later reruns know which tab it belongs to.

    Returns:
        The transcript, or None when transcription failed or was empty
        (failures are reported in the UI).
    """
    # Reset any previous transcription errors
    st.session_state.transcription_error = None

    with st.spinner("Transcribing audio with Groq..."):
        try:
            transcript = transcribe_audio_with_groq(audio)
        except (ValueError, GroqAPIError) as e:
            st.session_state.transcription_error = str(e)
            st.error(f"❌ Transcription failed: {str(e)}")
            _show_transcription_hint(str(e))
            return None

    if not transcript:
        return None

    st.session_state.transcript = transcript
    st.session_state["transcript_source"] = source
    st.success("✅ Transcription complete!")
    with st.expander("View Transcript", expanded=True):
        st.markdown(transcript)
    return transcript


def _generate_and_store_notes(transcript, source):
    """Generate notes and keep them in session state so they survive reruns.

    Returns:
        True when notes were produced during this run, otherwise False.
    """
    with st.spinner("Creating structured notes..."):
        notes = process_transcript(transcript)

    if not notes:
        return False

    st.session_state["notes"] = notes
    st.session_state["notes_source"] = source
    st.success("Notes generated successfully!")
    return True


def _render_export_controls(notes):
    """Show the two export buttons; a click reveals the matching download button."""
    col1, col2 = st.columns(2)
    with col1:
        if st.button("Export as Markdown", key="export_md"):
            export_notes(notes, "markdown")
    with col2:
        if st.button("Export as PDF", key="export_pdf"):
            export_notes(notes, "pdf")


def main():
    """Render the page: pick an input method, transcribe, generate and export notes.

    A Streamlit button is only "pressed" during the single rerun caused by its
    click, so follow-up buttons must not live inside another button's branch.
    Transcript and notes are therefore kept in ``st.session_state`` and the
    follow-up controls are drawn from that state on every run.
    """
    st.title("🧙‍♂️ Note")
    st.markdown("Transform speech into structured notes")
    
    # Initialize API key from environment (Hugging Face secrets)
    if st.session_state.api_key and not st.session_state.groq_client:
        st.session_state.groq_client = initialize_groq_client(st.session_state.api_key)
    
    # Display model info in the sidebar
    with st.sidebar:
        st.info("Using DeepSeek-R1-Distill-Llama-70B model for note generation and Whisper Large v3 Turbo for transcription")
    
    # Check if API key is valid before proceeding
    if not st.session_state.api_key:
        st.error("❌ No API key found. Please set the GROQ_API_KEY secret in your Hugging Face Space settings.")
        st.stop()
    
    if not st.session_state.groq_client:
        st.error("❌ Failed to initialize Groq client. Please check your API key secret in Hugging Face Space settings.")
        st.stop()
    
    # Input methods tabs
    input_method = st.radio("Choose input method:", ["Live Recording", "Upload Audio", "YouTube URL", "Text Input"])
    
    # True only in the run that streamed fresh notes to the page; used to
    # avoid drawing the same notes a second time from session state
    notes_generated_now = False
    
    if input_method == "Live Recording":
        st.markdown("### Record Audio")
        st.markdown("Click the microphone button below to start recording. Click it again to stop.")
        
        # Use the streamlit-audiorec component for recording
        wav_audio_data = st_audiorec()
        transcribed_now = False
        
        if wav_audio_data is not None:
            st.audio(wav_audio_data, format='audio/wav')
            
            if st.button("Transcribe Recording", key="transcribe_rec"):
                transcribed_now = _transcribe_and_store(wav_audio_data, input_method) is not None
        
        # Offer note generation for a transcript produced in this tab, whether
        # it was created in this run or an earlier one
        live_transcript = ""
        if st.session_state.get("transcript_source") == input_method:
            live_transcript = st.session_state.transcript
        
        if live_transcript:
            if not transcribed_now:
                with st.expander("View Transcript", expanded=True):
                    st.markdown(live_transcript)
            
            if st.button("Generate Structured Notes", key="generate_live"):
                notes_generated_now = _generate_and_store_notes(live_transcript, input_method)
    
    elif input_method == "Upload Audio":
        uploaded_file = st.file_uploader(
            "Upload an audio file (max 40MB)", 
            type=["mp3", "wav", "m4a", "ogg"],
            help="Supported formats: MP3, WAV, M4A, OGG. Maximum size: 40MB"
        )
        
        if uploaded_file:
            file_size = uploaded_file.size
            if file_size > MAX_FILE_SIZE:
                st.error(f"File size ({file_size/1048576:.2f}MB) exceeds the maximum allowed size of 40MB.")
            else:
                st.audio(uploaded_file)
                
                if st.button("Transcribe and Generate Notes", key="transcribe_upload"):
                    # Write the upload to disk only when it is actually needed,
                    # keeping its extension, and remove it afterwards
                    suffix = os.path.splitext(uploaded_file.name)[1]
                    with tempfile.NamedTemporaryFile(delete=False, suffix=suffix) as tmp_file:
                        tmp_file.write(uploaded_file.getvalue())
                        audio_file_path = tmp_file.name
                    
                    try:
                        transcript = _transcribe_and_store(audio_file_path, input_method)
                    finally:
                        if os.path.exists(audio_file_path):
                            os.unlink(audio_file_path)
                    
                    if transcript:
                        notes_generated_now = _generate_and_store_notes(transcript, input_method)
    
    elif input_method == "YouTube URL":
        youtube_url = st.text_input(
            "Enter YouTube URL:",
            help="Enter the full URL of a YouTube video (e.g., https://www.youtube.com/watch?v=example)"
        )
        
        if youtube_url and st.button("Process YouTube Content", key="process_yt"):
            try:
                with st.spinner("Downloading YouTube content..."):
                    audio_path = download_video_audio(youtube_url)
                
                if audio_path:
                    try:
                        st.success("Video downloaded successfully!")
                        st.audio(audio_path)
                        
                        transcript = _transcribe_and_store(audio_path, input_method)
                        if transcript:
                            notes_generated_now = _generate_and_store_notes(transcript, input_method)
                    finally:
                        # Clean up downloaded files even if a step above failed
                        delete_download(audio_path)
            
            except Exception as e:
                if "exceeds maximum allowed size" in str(e):
                    st.error(f"{FILE_TOO_LARGE_MESSAGE} Try a shorter video.")
                else:
                    st.error(f"Error processing YouTube video: {e}")
    
    else:  # Text Input
        transcript = st.text_area(
            "Enter transcript text:", 
            height=300,
            help="Paste or type your transcript text here for generating structured notes"
        )
        
        if transcript:
            st.session_state.transcript = transcript
            st.session_state["transcript_source"] = input_method
            
            if st.button("Generate Structured Notes", key="process_text"):
                notes_generated_now = _generate_and_store_notes(transcript, input_method)
    
    # Notes and export controls for the current tab, drawn from session state
    # so they remain available on the rerun caused by clicking an export button
    stored_notes = st.session_state.get("notes")
    if stored_notes is not None and st.session_state.get("notes_source") == input_method:
        if not notes_generated_now:
            st.markdown(stored_notes.get_markdown_content())
        _render_export_controls(stored_notes)


if __name__ == "__main__":
    main()