Spaces:

kambris
/

EsTu

Sleeping

App Files Files Community

EsTu / app.py

kambris

Update app.py

1fbc1f9 verified 5 months ago

raw

history blame contribute delete

10.2 kB

	import gradio as gr
	import requests
	import os
	from datetime import datetime
	from collections import defaultdict

	# Credentials and model id used by query_model when calling the chat-completions API.
	# HF_TOKEN is None when the HUGGINGFACE_TOKEN environment variable is not set.
	HF_TOKEN = os.environ.get("HUGGINGFACE_TOKEN")
	MODEL = "meta-llama/Llama-3.3-70B-Instruct"

	class LearningTracker:
	    """In-memory record of what has been covered since the object was created.

	    Attributes:
	        vocabulary: Set of distinct words added via ``add_vocabulary``.
	        grammar_points: Set of distinct grammar topics added via ``add_grammar``.
	        error_patterns: Mapping of error label -> number of times it was logged.
	        review_items: List of items awaiting review; no method of this class
	            appends to it, so it stays empty unless a caller mutates it.
	        session_start: Naive local ``datetime`` captured at construction time.
	    """

	    def __init__(self):
	        self.vocabulary = set()
	        self.grammar_points = set()
	        self.error_patterns = defaultdict(int)
	        self.review_items = []
	        self.session_start = datetime.now()

	    def add_vocabulary(self, words):
	        """Add every entry of *words* (an iterable of strings) to the vocabulary.

	        A bare string is treated as one word; passing it straight to
	        ``set.update`` would add its individual characters instead.
	        ``None`` or an empty iterable is a no-op.
	        """
	        if not words:
	            return
	        if isinstance(words, str):
	            words = [words]
	        self.vocabulary.update(words)

	    def add_grammar(self, point):
	        """Record a single grammar topic (duplicates collapse in the set)."""
	        self.grammar_points.add(point)

	    def log_error(self, error_type):
	        """Increment the occurrence counter for *error_type*."""
	        self.error_patterns[error_type] += 1

	    def get_stats(self):
	        """Return a snapshot dict of the current counters.

	        Keys: ``vocabulary_count``, ``grammar_points``, ``errors`` (a plain
	        dict copy of the counters), ``review_queue`` and ``session_minutes``.
	        """
	        elapsed = datetime.now() - self.session_start
	        # total_seconds() includes whole days; timedelta.seconds alone would
	        # wrap back to zero once the session passes 24 hours.
	        session_minutes = int(elapsed.total_seconds() // 60)
	        return {
	            'vocabulary_count': len(self.vocabulary),
	            'grammar_points': len(self.grammar_points),
	            'errors': dict(self.error_patterns),
	            'review_queue': len(self.review_items),
	            'session_minutes': session_minutes,
	        }

	# Single module-level tracker read and updated by get_progress_display,
	# request_review and bot_respond.
	# NOTE(review): as a module global it is presumably shared by every browser
	# session served by this process - confirm whether per-session state is wanted.
	tracker = LearningTracker()

	def build_system_prompt(stats):
	    """Build the tutor's system prompt, tailored with the learner's current stats.

	    Args:
	        stats: Dict with the keys ``errors`` (label -> count),
	            ``vocabulary_count``, ``grammar_points`` and ``review_queue``,
	            as produced by ``LearningTracker.get_stats``.

	    Returns:
	        The prompt text. It asks the model to tag new words, grammar points and
	        errors with ``[VOCAB: ...]``, ``[GRAMMAR: ...]`` and ``[ERROR: ...]`` so
	        that replies can be parsed afterwards.
	    """
	    error_focus = ""
	    if stats['errors']:
	        # Only the three most frequent error labels are surfaced to the model.
	        top_errors = sorted(stats['errors'].items(), key=lambda x: x[1], reverse=True)[:3]
	        error_list = ", ".join(f"{label} ({count}x)" for label, count in top_errors)
	        error_focus = f"\n\nCOMMON ERRORS TO ADDRESS: {error_list}\nGently reinforce these areas in conversation."

	    memory_context = ""
	    # Show progress as soon as anything has been covered, not only vocabulary.
	    if stats['vocabulary_count'] > 0 or stats['grammar_points'] > 0:
	        memory_context = f"\n\nLEARNING PROGRESS:\n- Vocabulary introduced: {stats['vocabulary_count']} words\n- Grammar points covered: {stats['grammar_points']}\n- Items ready for review: {stats['review_queue']}\nReference previous topics naturally in conversation."

	    # The [GRAMMAR: ...] instruction below is required for grammar tracking:
	    # without it the model never emits the tag that the reply parser looks for.
	    return f"""You're tutoring a linguistics PhD student learning Spanish (A2-B1 level). They're fluent in English, French, and Arabic.

	Use B1-level Spanish for all conversation. Adapt to whatever they need - conversation practice, grammar questions, vocabulary building, or scenario practice.

	Balance accessible comparisons with metalinguistic insight:
	- Simple: "Spanish 'he comido' = French 'j'ai mangé' = English 'I have eaten'"
	- Analytical: "Notice the pro-drop here - Spanish allows null subjects unlike French"
	- Pattern recognition: "The subjunctive after 'querer que' works like French 'vouloir que' + subjonctif"

	For grammar questions, give clear side-by-side comparisons with linguistic depth:
	- "Spanish: 'Yo como' / French: 'Je mange' / English: 'I eat' / Arabic: 'آكل' (subject optional in Spanish/Arabic)"
	- Discuss: "Both Spanish and Arabic are pro-drop languages, unlike French and English"
	- Show conjugation patterns across languages, note morphological strategies
	- Note each grammar point you cover by marking it: [GRAMMAR: topic]

	For vocabulary, start with practical comparisons, layer in analysis:
	- Spanish: "almohada" / Arabic: "المخدة" (al-mikhadda) → discuss Arabic substrate
	- Spanish: "importante" / French: "important" / English: "important" → Latin cognates
	- Note each new word you introduce by marking it: [VOCAB: word]

	For errors, gently recast and mark the pattern: [ERROR: ser/estar] or [ERROR: subjunctive] or [ERROR: preterite/imperfect]
	When you see repeated error patterns, address them directly but kindly.{error_focus}{memory_context}

	SPACED REPETITION: Every 5-7 messages, naturally weave in a review question about vocabulary or grammar from earlier in the conversation."""

	def _extract_tagged(text, tag):
	    """Return the stripped contents of every closed ``[TAG: ...]`` marker in *text*."""
	    values = []
	    for segment in text.split(f"[{tag}:")[1:]:
	        value, closing, _ = segment.partition("]")
	        value = value.strip()
	        # Skip unterminated tags (no "]" found, which would otherwise capture
	        # the rest of the text) and tags with nothing inside.
	        if closing and value:
	            values.append(value)
	    return values


	def extract_learning_data(text):
	    """Pull the tutor's inline annotations out of a reply.

	    Args:
	        text: Reply text that may contain ``[VOCAB: ...]``, ``[GRAMMAR: ...]``
	            and ``[ERROR: ...]`` markers. ``None`` or ``""`` yields empty lists.

	    Returns:
	        A ``(vocab, grammar, errors)`` tuple of lists, each in order of
	        appearance. Markers are matched case-sensitively; empty or unclosed
	        markers are ignored.
	    """
	    if not text:
	        return [], [], []
	    return (
	        _extract_tagged(text, "VOCAB"),
	        _extract_tagged(text, "GRAMMAR"),
	        _extract_tagged(text, "ERROR"),
	    )

	def get_progress_display():
	    """Render the module-level tracker's current stats as Markdown text.

	    Returns:
	        A string with the session stats, followed - only when errors have been
	        logged - by an "Error Patterns" list ordered by descending count.
	    """
	    snapshot = tracker.get_stats()

	    header = f"""### 📊 Your Progress

	Session Stats:
	- ⏱️ Time: {snapshot['session_minutes']} minutes
	- 📚 Vocabulary: {snapshot['vocabulary_count']} words
	- 📖 Grammar points: {snapshot['grammar_points']}
	- 🔄 Review queue: {snapshot['review_queue']} items
	"""

	    pieces = [header]
	    error_counts = snapshot['errors']
	    if error_counts:
	        pieces.append("\nError Patterns (focus areas):\n")
	        ranked = sorted(error_counts.items(), key=lambda pair: pair[1], reverse=True)
	        pieces.extend(f"- {label}: {hits}x\n" for label, hits in ranked)

	    return "".join(pieces)

	def query_model(messages, stream=True):
	    """POST a chat-completions request for MODEL and return the raw response.

	    Args:
	        messages: Conversation sent as the payload's ``"messages"`` value.
	        stream: Forwarded both as the payload's ``"stream"`` flag and as the
	            ``stream`` argument of ``requests.post``.

	    Returns:
	        Whatever ``requests.post`` returns; the status code is not checked here,
	        and the caller is responsible for consuming the response.
	    """
	    endpoint = "https://router.huggingface.co/v1/chat/completions"

	    request_headers = {}
	    request_headers["Authorization"] = f"Bearer {HF_TOKEN}"
	    request_headers["Content-Type"] = "application/json"

	    body = {"model": MODEL, "messages": messages}
	    body.update({"max_tokens": 1000, "temperature": 0.7, "stream": stream})

	    return requests.post(
	        endpoint,
	        headers=request_headers,
	        json=body,
	        timeout=120,
	        stream=stream,
	    )

	def request_review(history):
	    """Return *history* extended with a review request as a new pending turn.

	    Args:
	        history: List of ``[user_text, assistant_text]`` pairs, or ``None``
	            (treated as an empty list).

	    Returns:
	        A new list ending in ``[message, None]``. The message depends on whether
	        the tracker reports any review items or vocabulary; in both cases it is
	        placed in the user slot of the pair.
	    """
	    turns = [] if history is None else history

	    snapshot = tracker.get_stats()
	    has_material = snapshot['review_queue'] != 0 or snapshot['vocabulary_count'] != 0

	    if has_material:
	        prompt = "Dame un repaso de lo que hemos aprendido. (Give me a review of what we've learned.)"
	    else:
	        prompt = "No hay nada que revisar todavía. (Nothing to review yet. Keep conversing!)"

	    return turns + [[prompt, None]]

	def _history_to_messages(history, system_prompt):
	    """Convert ``[user, assistant]`` pairs into a chat-completions message list.

	    The last pair is the pending turn, so only its user text is sent.
	    """
	    messages = [{"role": "system", "content": system_prompt}]
	    for user_msg, assistant_msg in history[:-1]:
	        if user_msg:
	            messages.append({"role": "user", "content": user_msg})
	        if assistant_msg:
	            messages.append({"role": "assistant", "content": assistant_msg})
	    messages.append({"role": "user", "content": history[-1][0]})
	    return messages


	def _parse_stream_line(raw_line):
	    """Decode one streamed ``data: ...`` line into ``(content, done)``.

	    ``content`` is the text delta carried by the line ("" when there is none or
	    the line cannot be parsed); ``done`` is True only for the ``[DONE]`` marker.
	    """
	    import json  # local import: the file's top-level imports do not include json

	    if not raw_line:
	        return "", False
	    line = raw_line.decode('utf-8')
	    if not line.startswith('data: '):
	        return "", False
	    data = line[6:]
	    if data.strip() == '[DONE]':
	        return "", True
	    try:
	        chunk = json.loads(data)
	        delta = chunk['choices'][0].get('delta') or {}
	        content = delta.get('content') or ""
	    except (ValueError, LookupError, TypeError, AttributeError):
	        # Malformed or unexpected chunk: skip it, as the stream is best-effort.
	        return "", False
	    if not isinstance(content, str):
	        return "", False
	    return content, False


	# NOTE(review): the Row/Column nesting below is reconstructed from the blank-line
	# grouping of the statements - confirm against the intended layout.
	with gr.Blocks() as demo:
	    gr.Markdown("# 🇪🇸 Spanish Tutor - Advanced Learning System")
	    gr.Markdown("Powered by Llama 3.3 70B with memory, spaced repetition, and progress tracking")

	    with gr.Row():
	        with gr.Column(scale=2):
	            chatbot = gr.Chatbot(height=500)
	            msg = gr.Textbox(label="Message", placeholder="Type in Spanish, English, French, or Arabic...")

	            with gr.Row():
	                send = gr.Button("Send", variant="primary")
	                review = gr.Button("📝 Request Review", variant="secondary")
	                clear = gr.Button("Clear")

	        with gr.Column(scale=1):
	            progress_display = gr.Markdown(get_progress_display())

	            gr.Markdown("""
	### 💡 Tips

	The tutor tracks:
	- New vocabulary you learn
	- Grammar points covered
	- Your common error patterns
	- Items for spaced repetition

	Error patterns help focus practice on:
	- ser/estar confusion
	- subjunctive usage
	- preterite/imperfect
	- gender agreement

	Click Request Review for spaced repetition practice.
	""")

	    def user_submit(user_message, history):
	        """Clear the textbox and append the message as a pending turn."""
	        # Tolerate history=None the same way request_review does.
	        return "", (history or []) + [[user_message, None]]

	    def bot_respond(history):
	        """Stream the model's reply into the last history pair.

	        Generator event handler: each yield is ``(history, progress_markdown)``.
	        After the stream ends, the reply's tagged items are recorded in the
	        tracker and one more update is yielded so the progress panel shows them.
	        Request or stream failures are written into the chat as an error message.
	        """
	        if not history:
	            # This function is a generator, so output must be yielded; a plain
	            # ``return value`` would emit nothing.
	            yield history, get_progress_display()
	            return

	        messages = _history_to_messages(history, build_system_prompt(tracker.get_stats()))

	        response_obj = None
	        try:
	            response_obj = query_model(messages, stream=True)

	            if response_obj.status_code != 200:
	                history[-1][1] = f"Error {response_obj.status_code}: {response_obj.text}"
	                yield history, get_progress_display()
	                return

	            full_response = ""
	            for raw_line in response_obj.iter_lines():
	                content, done = _parse_stream_line(raw_line)
	                if done:
	                    break
	                if content:
	                    full_response += content
	                    history[-1][1] = full_response
	                    # This yield sits outside any catch-all handler so that closing
	                    # the generator (GeneratorExit) is never swallowed.
	                    yield history, get_progress_display()

	            vocab, grammar, errors = extract_learning_data(full_response)
	            tracker.add_vocabulary(vocab)
	            for grammar_point in grammar:
	                tracker.add_grammar(grammar_point)
	            for error_label in errors:
	                tracker.log_error(error_label)

	            # Final update so the panel reflects what was just recorded instead
	            # of lagging one turn behind.
	            yield history, get_progress_display()

	        except Exception as exc:
	            history[-1][1] = f"Error: {str(exc)}"
	            yield history, get_progress_display()
	        finally:
	            # Release the streamed connection on every exit path.
	            if response_obj is not None:
	                response_obj.close()

	    msg.submit(user_submit, [msg, chatbot], [msg, chatbot], queue=False).then(
	        bot_respond, chatbot, [chatbot, progress_display]
	    )
	    send.click(user_submit, [msg, chatbot], [msg, chatbot], queue=False).then(
	        bot_respond, chatbot, [chatbot, progress_display]
	    )

	    review.click(request_review, chatbot, chatbot, queue=False).then(
	        bot_respond, chatbot, [chatbot, progress_display]
	    )
	    # Clears only the chat window; the tracker's counters are left untouched.
	    clear.click(lambda: [], None, chatbot, queue=False)

	if __name__ == "__main__":
	    demo.launch()