Spaces:
Build error
Build error
Update app.py
Browse files
app.py
CHANGED
@@ -16,14 +16,13 @@ from download import download_video_audio, delete_download
|
|
16 |
MAX_FILE_SIZE = 41943040 # 40MB in bytes
|
17 |
FILE_TOO_LARGE_MESSAGE = "File too large. Maximum size is 40MB."
|
18 |
|
19 |
-
# Load environment variables
|
20 |
load_dotenv()
|
21 |
-
GROQ_API_KEY = os.environ.get("GROQ_API_KEY", None)
|
22 |
-
audio_file_path = None
|
23 |
|
24 |
# Initialize session states
|
25 |
if 'api_key' not in st.session_state:
|
26 |
-
|
|
|
27 |
|
28 |
if 'recording' not in st.session_state:
|
29 |
st.session_state.recording = False
|
@@ -34,9 +33,8 @@ if 'audio_data' not in st.session_state:
|
|
34 |
if 'transcript' not in st.session_state:
|
35 |
st.session_state.transcript = ""
|
36 |
|
37 |
-
if '
|
38 |
-
|
39 |
-
st.session_state.groq = Groq(api_key=st.session_state.api_key)
|
40 |
|
41 |
# Set page configuration
|
42 |
st.set_page_config(
|
@@ -50,6 +48,17 @@ st.set_page_config(
|
|
50 |
LLM_MODEL = "deepseek-r1-distill-llama-70b"
|
51 |
TRANSCRIPTION_MODEL = "distil-whisper-large-v3-en"
|
52 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
53 |
class GenerationStatistics:
|
54 |
def __init__(self, input_time=0, output_time=0, input_tokens=0, output_tokens=0, total_time=0, model_name=LLM_MODEL):
|
55 |
self.input_time = input_time
|
@@ -205,15 +214,13 @@ class AudioRecorder:
|
|
205 |
|
206 |
def transcribe_audio_with_groq(audio_file_path):
|
207 |
"""Transcribe audio file using Groq's transcription API"""
|
208 |
-
if not st.session_state.
|
209 |
-
st.error("
|
210 |
return ""
|
211 |
|
212 |
-
client = Groq(api_key=st.session_state.api_key)
|
213 |
-
|
214 |
try:
|
215 |
with open(audio_file_path, "rb") as file:
|
216 |
-
transcription =
|
217 |
file=(audio_file_path, file.read()),
|
218 |
model=TRANSCRIPTION_MODEL,
|
219 |
response_format="verbose_json"
|
@@ -225,12 +232,10 @@ def transcribe_audio_with_groq(audio_file_path):
|
|
225 |
|
226 |
def process_transcript(transcript):
|
227 |
"""Process transcript with Groq's DeepSeek model for highly structured notes"""
|
228 |
-
if not st.session_state.
|
229 |
-
st.error("
|
230 |
return None
|
231 |
|
232 |
-
client = Groq(api_key=st.session_state.api_key)
|
233 |
-
|
234 |
# Enhanced structure for better organization
|
235 |
structure = {
|
236 |
"Executive Summary": "",
|
@@ -309,7 +314,7 @@ def process_transcript(transcript):
|
|
309 |
stats = GenerationStatistics(model_name=LLM_MODEL)
|
310 |
start_time = time.time()
|
311 |
|
312 |
-
response =
|
313 |
messages=[{"role": "user", "content": prompt}],
|
314 |
model=LLM_MODEL,
|
315 |
temperature=0.3, # Lower temperature for more structured output
|
@@ -415,16 +420,55 @@ def main():
|
|
415 |
# Sidebar for configuration
|
416 |
with st.sidebar:
|
417 |
st.header("Configuration")
|
418 |
-
api_key = st.text_input("Groq API Key", value=st.session_state.api_key or "", type="password")
|
419 |
|
420 |
-
|
421 |
-
|
422 |
-
|
423 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
424 |
|
425 |
st.markdown("---")
|
426 |
st.info("Using DeepSeek-R1-Distill-Llama-70B model for note generation and Distil Whisper for transcription")
|
427 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
428 |
# Input methods tabs
|
429 |
input_method = st.radio("Choose input method:", ["Live Recording", "Upload Audio", "YouTube URL", "Text Input"])
|
430 |
|
|
|
16 |
MAX_FILE_SIZE = 41943040 # 40MB in bytes
|
17 |
FILE_TOO_LARGE_MESSAGE = "File too large. Maximum size is 40MB."
|
18 |
|
19 |
+
# Load environment variables in a secure way
|
20 |
load_dotenv()
|
|
|
|
|
21 |
|
22 |
# Initialize session states
|
23 |
if 'api_key' not in st.session_state:
|
24 |
+
# Try to get API key from environment variable first
|
25 |
+
st.session_state.api_key = os.environ.get("GROQ_API_KEY", "")
|
26 |
|
27 |
if 'recording' not in st.session_state:
|
28 |
st.session_state.recording = False
|
|
|
33 |
if 'transcript' not in st.session_state:
|
34 |
st.session_state.transcript = ""
|
35 |
|
36 |
+
if 'groq_client' not in st.session_state:
|
37 |
+
st.session_state.groq_client = None
|
|
|
38 |
|
39 |
# Set page configuration
|
40 |
st.set_page_config(
|
|
|
48 |
LLM_MODEL = "deepseek-r1-distill-llama-70b"
|
49 |
TRANSCRIPTION_MODEL = "distil-whisper-large-v3-en"
|
50 |
|
51 |
+
# Initialize Groq client function
|
52 |
+
def initialize_groq_client(api_key):
|
53 |
+
"""Initialize Groq client with the provided API key"""
|
54 |
+
if not api_key:
|
55 |
+
return None
|
56 |
+
try:
|
57 |
+
return Groq(api_key=api_key)
|
58 |
+
except Exception as e:
|
59 |
+
st.error(f"Failed to initialize Groq client: {e}")
|
60 |
+
return None
|
61 |
+
|
62 |
class GenerationStatistics:
|
63 |
def __init__(self, input_time=0, output_time=0, input_tokens=0, output_tokens=0, total_time=0, model_name=LLM_MODEL):
|
64 |
self.input_time = input_time
|
|
|
214 |
|
215 |
def transcribe_audio_with_groq(audio_file_path):
|
216 |
"""Transcribe audio file using Groq's transcription API"""
|
217 |
+
if not st.session_state.groq_client:
|
218 |
+
st.error("Groq client is not initialized. Please check your API key.")
|
219 |
return ""
|
220 |
|
|
|
|
|
221 |
try:
|
222 |
with open(audio_file_path, "rb") as file:
|
223 |
+
transcription = st.session_state.groq_client.audio.transcriptions.create(
|
224 |
file=(audio_file_path, file.read()),
|
225 |
model=TRANSCRIPTION_MODEL,
|
226 |
response_format="verbose_json"
|
|
|
232 |
|
233 |
def process_transcript(transcript):
|
234 |
"""Process transcript with Groq's DeepSeek model for highly structured notes"""
|
235 |
+
if not st.session_state.groq_client:
|
236 |
+
st.error("Groq client is not initialized. Please check your API key.")
|
237 |
return None
|
238 |
|
|
|
|
|
239 |
# Enhanced structure for better organization
|
240 |
structure = {
|
241 |
"Executive Summary": "",
|
|
|
314 |
stats = GenerationStatistics(model_name=LLM_MODEL)
|
315 |
start_time = time.time()
|
316 |
|
317 |
+
response = st.session_state.groq_client.chat.completions.create(
|
318 |
messages=[{"role": "user", "content": prompt}],
|
319 |
model=LLM_MODEL,
|
320 |
temperature=0.3, # Lower temperature for more structured output
|
|
|
420 |
# Sidebar for configuration
|
421 |
with st.sidebar:
|
422 |
st.header("Configuration")
|
|
|
423 |
|
424 |
+
# Improved API key handling
|
425 |
+
api_key_input = st.text_input(
|
426 |
+
"Groq API Key",
|
427 |
+
value=st.session_state.api_key,
|
428 |
+
type="password",
|
429 |
+
help="Enter your Groq API key. Get one at https://console.groq.com/keys"
|
430 |
+
)
|
431 |
+
|
432 |
+
# Only update if changed
|
433 |
+
if api_key_input != st.session_state.api_key:
|
434 |
+
st.session_state.api_key = api_key_input
|
435 |
+
# Reinitialize client with new key
|
436 |
+
st.session_state.groq_client = initialize_groq_client(api_key_input)
|
437 |
+
|
438 |
+
if st.session_state.groq_client:
|
439 |
+
st.success("✅ API key validated!")
|
440 |
+
|
441 |
+
# Initialize client if not done already
|
442 |
+
if st.session_state.api_key and not st.session_state.groq_client:
|
443 |
+
st.session_state.groq_client = initialize_groq_client(st.session_state.api_key)
|
444 |
+
|
445 |
+
# API key instructions
|
446 |
+
with st.expander("How to get a Groq API key"):
|
447 |
+
st.markdown("""
|
448 |
+
1. Visit [Groq Cloud Console](https://console.groq.com/)
|
449 |
+
2. Sign up or log in to your account
|
450 |
+
3. Navigate to API Keys in the sidebar
|
451 |
+
4. Click "Create API Key" and give it a name
|
452 |
+
5. Copy the generated key (you won't see it again!)
|
453 |
+
|
454 |
+
**Security tip**: For production use, store your API key as an environment variable:
|
455 |
+
```bash
|
456 |
+
export GROQ_API_KEY="your-api-key-here"
|
457 |
+
```
|
458 |
+
""")
|
459 |
|
460 |
st.markdown("---")
|
461 |
st.info("Using DeepSeek-R1-Distill-Llama-70B model for note generation and Distil Whisper for transcription")
|
462 |
+
|
463 |
+
# Check if API key is valid before proceeding
|
464 |
+
if not st.session_state.api_key:
|
465 |
+
st.warning("⚠️ Please enter your Groq API key in the sidebar to use ScribeWizard")
|
466 |
+
st.stop()
|
467 |
+
|
468 |
+
if not st.session_state.groq_client:
|
469 |
+
st.error("❌ Failed to initialize Groq client. Please check your API key.")
|
470 |
+
st.stop()
|
471 |
+
|
472 |
# Input methods tabs
|
473 |
input_method = st.radio("Choose input method:", ["Live Recording", "Upload Audio", "YouTube URL", "Text Input"])
|
474 |
|