Spaces:

shaheerawan3
/

Edu_Slide

Sleeping

App Files Files Community

Edu_Slide / app.py

shaheerawan3

Update app.py

7ed817f verified 9 months ago

raw

history blame contribute delete

13.5 kB

	import streamlit as st
	from transformers import pipeline
	from PIL import Image
	import io
	from pptx import Presentation
	from pptx.util import Inches, Pt
	from pptx.dml.color import RGBColor
	from pptx.enum.text import PP_ALIGN
	import docx
	import PyPDF2
	from pptx import Presentation as PPTXPresentation
	import pandas as pd
	import numpy as np
	from typing import List, Dict, Any, Optional, Tuple
	import time
	import requests
	from bs4 import BeautifulSoup
	import re
	import tempfile
	import logging
	from pathlib import Path
	import json

	# Configure logging
	logging.basicConfig(level=logging.INFO)
	logger = logging.getLogger(__name__)

	# Nutrition-specific knowledge base
	NUTRITION_FIELDS = {
	"Clinical Nutrition": [
	"Medical Nutrition Therapy",
	"Disease-Specific Diets",
	"Nutritional Assessment",
	"Hospital Dietetics",
	"Nutrition Care Process"
	],
	"Sports Nutrition": [
	"Performance Nutrition",
	"Sports Supplements",
	"Hydration Strategies",
	"Pre/Post Workout Nutrition",
	"Recovery Nutrition"
	],
	"Community Nutrition": [
	"Public Health Nutrition",
	"Food Security",
	"Population Health",
	"School Nutrition",
	"Cultural Food Practices"
	],
	"Therapeutic Nutrition": [
	"Diet Therapy",
	"Disease Management",
	"Metabolic Disorders",
	"Diabetes Management",
	"Cardiovascular Nutrition"
	]
	}

	class ContentEnricher:
	@staticmethod
	def fetch_open_images(topic: str) -> Optional[str]:
	"""Fetch free images from Unsplash's public website"""
	try:
	url = f"https://source.unsplash.com/featured/?{topic.replace(' ', ',')}"
	response = requests.get(url, stream=True)
	if response.status_code == 200:
	return url
	except Exception as e:
	logger.warning(f"Error fetching image: {e}")
	return None

	@staticmethod
	def fetch_pubmed_content(topic: str) -> str:
	"""Fetch content from PubMed's public RSS feed"""
	try:
	url = f"https://pubmed.ncbi.nlm.nih.gov/rss/search/1?term={topic.replace(' ', '+')}"
	response = requests.get(url)
	if response.status_code == 200:
	soup = BeautifulSoup(response.content, 'xml')
	items = soup.find_all('item')
	content = []
	for item in items[:3]: # Get first 3 articles
	title = item.title.text
	desc = item.description.text
	content.append(f"{title}\n{desc}")
	return "\n\n".join(content)
	except Exception as e:
	logger.warning(f"Error fetching PubMed content: {e}")
	return ""

	@staticmethod
	def fetch_nutrition_gov(topic: str) -> str:
	"""Fetch content from nutrition.gov public pages"""
	try:
	url = f"https://www.nutrition.gov/search/{topic.replace(' ', '+')}"
	response = requests.get(url)
	if response.status_code == 200:
	soup = BeautifulSoup(response.content, 'html.parser')
	content = []
	for p in soup.find_all('p')[:5]:
	content.append(p.text.strip())
	return "\n".join(content)
	except Exception as e:
	logger.warning(f"Error fetching Nutrition.gov content: {e}")
	return ""

	class FileProcessor:
	@staticmethod
	def process_txt(file) -> str:
	return file.read().decode('utf-8')

	@staticmethod
	def process_docx(file) -> str:
	doc = docx.Document(file)
	return "\n".join([paragraph.text for paragraph in doc.paragraphs])

	@staticmethod
	def process_pdf(file) -> str:
	pdf_reader = PyPDF2.PdfReader(file)
	return "\n".join([page.extract_text() for page in pdf_reader.pages])

	@staticmethod
	def process_pptx(file) -> str:
	prs = PPTXPresentation(file)
	text_content = []
	for slide in prs.slides:
	for shape in slide.shapes:
	if hasattr(shape, "text"):
	text_content.append(shape.text)
	return "\n".join(text_content)

	class PresentationGenerator:
	def __init__(self):
	self.text_generator = self.load_text_generator()
	self.content_enricher = ContentEnricher()
	self.file_processor = FileProcessor()

	@staticmethod
	@st.cache_resource
	def load_text_generator():
	return pipeline("text-generation", model="gpt2-medium")

	def add_image_to_slide(self, slide, image_url: str):
	try:
	response = requests.get(image_url, stream=True)
	if response.status_code == 200:
	img_path = tempfile.NamedTemporaryFile(delete=False, suffix=".jpg").name
	with open(img_path, "wb") as f:
	f.write(response.content)
	slide.shapes.add_picture(img_path, Inches(1), Inches(1), Inches(4), Inches(3))
	except Exception as e:
	logger.warning(f"Failed to add image to slide: {e}")

	def create_slide(self, prs: Presentation, title: str, points: List[str], image_url: Optional[str], template_style: str) -> None:
	slide = prs.slides.add_slide(prs.slide_layouts[1])

	# Set title
	title_shape = slide.shapes.title
	title_shape.text = title

	# Style based on template
	if template_style == "Professional":
	title_shape.text_frame.paragraphs[0].font.size = Pt(40)
	title_shape.text_frame.paragraphs[0].font.color.rgb = RGBColor(0, 51, 102)

	# Add content
	content_shape = slide.shapes.placeholders[1]
	text_frame = content_shape.text_frame

	for point in points:
	p = text_frame.add_paragraph()
	p.text = "• " + point
	p.font.size = Pt(18)
	p.font.color.rgb = RGBColor(51, 51, 51)

	# Add image if available
	if image_url:
	self.add_image_to_slide(slide, image_url)

	def generate_content(self, topic: str, base_content: str, category: str) -> Dict[str, Any]:
	"""Generate enhanced content with multiple sources"""
	try:
	# Combine content from multiple sources
	pubmed_content = self.content_enricher.fetch_pubmed_content(topic)
	nutrition_gov_content = self.content_enricher.fetch_nutrition_gov(topic)

	combined_content = f"{base_content}\n{pubmed_content}\n{nutrition_gov_content}"

	# Generate with context
	prompt = f"Create educational content about {topic} in {category}:\n{combined_content}"
	generated = self.text_generator(
	prompt,
	max_length=500,
	num_return_sequences=1,
	temperature=0.7
	)[0]['generated_text']

	# Process into sections
	sections = self.process_content(generated)

	return {
	'content': generated,
	'sections': sections,
	'topic': topic,
	'category': category
	}
	except Exception as e:
	logger.error(f"Error generating content: {e}")
	st.error(f"Error generating content: {str(e)}")
	return None

	def process_content(self, content: str, max_points: int = 5) -> List[Dict]:
	"""Process content into well-structured sections"""
	sections = []
	current_section = {'title': '', 'points': []}

	for line in content.split('\n'):
	line = line.strip()
	if not line:
	continue

	if line.endswith(':'):
	if current_section['points']:
	sections.append(current_section)
	current_section = {'title': line.rstrip(':'), 'points': []}
	elif line.startswith(('•', '*', '-')):
	if len(current_section['points']) < max_points:
	current_section['points'].append(line.lstrip('•*- '))
	else:
	sentences = line.split('. ')
	for sentence in sentences[:max_points - len(current_section['points'])]:
	if sentence.strip():
	current_section['points'].append(sentence.strip())

	if current_section['points']:
	sections.append(current_section)

	return sections

	def create_presentation(self, title: str, content: Dict[str, Any],
	template: str) -> Optional[io.BytesIO]:
	try:
	prs = Presentation()

	# Title slide
	title_slide = prs.slides.add_slide(prs.slide_layouts[0])
	title_slide.shapes.title.text = title

	# Process sections
	progress_bar = st.progress(0)
	for idx, section in enumerate(content['sections']):
	image_url = self.content_enricher.fetch_open_images(section['title'])
	self.create_slide(prs, section['title'], section['points'], image_url, template)
	progress_bar.progress((idx + 1) / len(content['sections']))

	# Save
	output = io.BytesIO()
	prs.save(output)
	output.seek(0)
	return output

	except Exception as e:
	logger.error(f"Error creating presentation: {e}")
	st.error(f"Error creating presentation: {str(e)}")
	return None

	def main():
	st.set_page_config(page_title="DietitianSlide AI", layout="wide", page_icon="🥗")

	generator = PresentationGenerator()

	st.title("🥗 DietitianSlide AI - Professional Nutrition Presentations")

	# Sidebar settings
	with st.sidebar:
	category = st.selectbox("Nutrition Field", list(NUTRITION_FIELDS.keys()))
	topic = st.selectbox("Specific Topic", NUTRITION_FIELDS[category])

	template = st.selectbox("Template Style",
	["Professional", "Academic", "Modern", "Clinical"])

	max_points = st.slider("Points per Slide", 3, 8, 5)

	# Main content area
	col1, col2 = st.columns([2, 1])

	with col1:
	st.subheader("Content Input")
	content_method = st.radio("Input Method",
	["Write Content", "Upload Files", "Both"])

	user_content = ""
	if content_method in ["Write Content", "Both"]:
	user_content = st.text_area("Enter your content", height=150)

	if content_method in ["Upload Files", "Both"]:
	uploaded_file = st.file_uploader(
	"Upload File",
	type=["txt", "docx", "pdf", "pptx"]
	)

	if uploaded_file:
	file_content = ""
	if uploaded_file.type == "text/plain":
	file_content = generator.file_processor.process_txt(uploaded_file)
	elif uploaded_file.type == "application/vnd.openxmlformats-officedocument.wordprocessingml.document":
	file_content = generator.file_processor.process_docx(uploaded_file)
	elif uploaded_file.type == "application/pdf":
	file_content = generator.file_processor.process_pdf(uploaded_file)
	elif uploaded_file.type == "application/vnd.openxmlformats-officedocument.presentationml.presentation":
	file_content = generator.file_processor.process_pptx(uploaded_file)

	if file_content:
	st.text_area("Extracted Content", file_content, height=100)
	user_content = f"{user_content}\n{file_content}" if user_content else file_content

	with col2:
	st.subheader("Preview & Generate")
	if st.button("Generate Presentation", type="primary"):
	if not user_content:
	st.error("Please provide some content!")
	return

	with st.spinner("Generating your presentation..."):
	content = generator.generate_content(topic, user_content, category)

	if content:
	output = generator.create_presentation(
	f"{category}: {topic}",
	content,
	template
	)

	if output:
	st.success("Presentation generated successfully!")
	st.download_button(
	"📥 Download Presentation",
	output,
	f"nutrition_{topic.lower().replace(' ', '_')}.pptx",
	"application/vnd.openxmlformats-officedocument.presentationml.presentation"
	)

	# Preview content
	st.subheader("Content Preview")
	for section in content['sections']:
	st.write(f"{section['title']}")
	for point in section['points']:
	st.write(f"• {point}")

	if __name__ == "__main__":
	main()