| | """ |
| | Main Streamlit Application - GEO SEO AI Optimizer |
| | Entry point for the application with UI components |
| | """ |
| |
|
| | import streamlit as st |
| | import os |
| | import tempfile |
| | import json |
| | from typing import Dict, Any, List |
| |
|
| | |
| | from utils.parser import PDFParser, TextParser, WebpageParser |
| | from utils.scorer import GEOScorer |
| | from utils.optimizer import ContentOptimizer |
| | from utils.chunker import VectorChunker |
| | from utils.export import ResultExporter |
| | from utils.lang_utils import detect_language, translate_text |
| |
|
| |
|
| | |
| | from langchain_groq import ChatGroq |
| | from langchain_community.embeddings import HuggingFaceEmbeddings |
| | from langdetect import detect |
| | from deep_translator import GoogleTranslator |
| | def detect_and_translate_to_english(text: str) -> str: |
| | try: |
| | lang = detect(text) |
| | if lang != "en": |
| | st.warning(f"Detected Language: {lang}. Translating to English...") |
| | translated_text = GoogleTranslator(source='auto', target='en').translate(text) |
| | return translated_text |
| | else: |
| | return text |
| | except Exception as e: |
| | st.error(f"Translation failed: {e}") |
| | return text |
| |
|
| |
|
| | class GEOSEOApp: |
| | """Main application class that orchestrates all components""" |
| | |
| | def __init__(self): |
| | self.setup_config() |
| | self.setup_models() |
| | self.setup_parsers() |
| | self.setup_components() |
| | |
| | def setup_config(self): |
| | """Initialize configuration and API keys""" |
| | self.groq_api_key = os.getenv("GROQ_API_KEY", "your-groq-api-key") |
| | self.hf_api_key = os.getenv("HUGGINGFACE_API_KEY", "your-huggingface-api-key") |
| | |
| | |
| | os.makedirs("data/uploaded_files", exist_ok=True) |
| | |
| | def setup_models(self): |
| | """Initialize LLM and embedding models""" |
| | self.llm = ChatGroq( |
| | api_key=self.groq_api_key, |
| | model_name="llama3-8b-8192", |
| | temperature=0.1 |
| | ) |
| | |
| | self.embeddings = HuggingFaceEmbeddings( |
| | model_name="sentence-transformers/all-MiniLM-L6-v2", |
| | cache_folder="./hf_cache", |
| | ) |
| | |
| | def setup_parsers(self): |
| | """Initialize content parsers""" |
| | self.pdf_parser = PDFParser() |
| | self.text_parser = TextParser() |
| | self.webpage_parser = WebpageParser() |
| | |
| | def setup_components(self): |
| | """Initialize processing components""" |
| | self.geo_scorer = GEOScorer(self.llm) |
| | self.content_optimizer = ContentOptimizer(self.llm) |
| | self.vector_chunker = VectorChunker(self.embeddings) |
| | self.result_exporter = ResultExporter() |
| | |
| | def run(self): |
| | """Main application runner""" |
| | st.set_page_config( |
| | page_title="GEO SEO AI Optimizer", |
| | page_icon="π", |
| | layout="wide" |
| | ) |
| | |
| | st.title("π GEO SEO AI Optimizer") |
| | st.markdown("*Optimize your content for AI search engines and LLM systems*") |
| | |
| | |
| | self.render_sidebar() |
| | |
| | |
| | tab1, tab2, tab3,tab4 = st.tabs([ |
| | "π Website GEO Analysis", |
| | "π§ Content Enhancement", |
| | "π Document Q&A", |
| | "π Translation" |
| | ]) |
| | |
| | with tab1: |
| | self.render_website_analysis_tab() |
| | |
| | with tab2: |
| | self.render_content_enhancement_tab() |
| | |
| | with tab3: |
| | self.render_document_qa_tab() |
| | with tab4: |
| | self.render_multilingual_tab() |
| | |
| | def render_sidebar(self): |
| | """Render sidebar with information and controls""" |
| | st.sidebar.title("π οΈ GEO Tools") |
| | st.sidebar.markdown("- π Document Q&A with RAG") |
| | st.sidebar.markdown("- π§ Content Enhancement") |
| | st.sidebar.markdown("- π Website GEO Analysis") |
| | st.sidebar.markdown("- π AI-First SEO Scoring") |
| | |
| | st.sidebar.markdown("---") |
| | st.sidebar.markdown("### π§ Configuration") |
| | st.sidebar.markdown("Set your API keys:") |
| | st.sidebar.code("export GROQ_API_KEY='your-key'") |
| | |
| | st.sidebar.markdown("---") |
| | st.sidebar.markdown("### π GEO Metrics") |
| | st.sidebar.markdown("**AI Search Visibility**: How likely AI engines will surface your content") |
| | st.sidebar.markdown("**Query Intent Matching**: How well content matches user queries") |
| | st.sidebar.markdown("**Conversational Readiness**: Suitability for AI chat responses") |
| | st.sidebar.markdown("**Citation Worthiness**: Probability of being cited by AI") |
| | |
| | st.sidebar.markdown("---") |
| | st.sidebar.markdown("### βΉοΈ Components") |
| | st.sidebar.markdown("- **Parser**: Extract content from various sources") |
| | st.sidebar.markdown("- **Scorer**: Analyze GEO performance") |
| | st.sidebar.markdown("- **Optimizer**: Enhance content for AI") |
| | st.sidebar.markdown("- **Chunker**: Create vector embeddings") |
| | st.sidebar.markdown("- **Exporter**: Generate reports") |
| | |
| | def render_document_qa_tab(self): |
| | """Render Document Q&A tab""" |
| | st.header("π Document Question Answering") |
| | st.markdown("Upload documents or paste text to ask questions using RAG.") |
| | |
| | |
| | uploaded_file = st.file_uploader("Upload a PDF file", type=["pdf"]) |
| | |
| | |
| | pasted_text = st.text_area("Or paste text directly:", height=150) |
| | |
| | |
| | user_query = st.text_input("Ask a question about the content:") |
| | |
| | |
| | if st.button("π Ask Question", key="qa_submit"): |
| | if not user_query.strip(): |
| | st.warning("Please enter a question.") |
| | return |
| | |
| | try: |
| | |
| | documents = [] |
| | |
| | if uploaded_file: |
| | with st.spinner("Processing PDF..."): |
| | temp_path = self.save_uploaded_file(uploaded_file) |
| | documents = self.pdf_parser.parse(temp_path) |
| | os.unlink(temp_path) |
| |
|
| | |
| | for doc in documents: |
| | doc.page_content = detect_and_translate_to_english(doc.page_content) |
| |
|
| | |
| | elif pasted_text.strip(): |
| | with st.spinner("Processing text..."): |
| | translated_text = detect_and_translate_to_english(pasted_text) |
| | documents = self.text_parser.parse(translated_text) |
| |
|
| |
|
| | else: |
| | st.warning("Please upload a PDF or paste some text.") |
| | return |
| | |
| | |
| | with st.spinner("Creating embeddings and searching..."): |
| | qa_chain = self.vector_chunker.create_qa_chain(documents, self.llm) |
| | result = qa_chain({"query": user_query}) |
| | |
| | |
| | st.markdown("### π¬ Answer") |
| | st.write(result["result"]) |
| | |
| | |
| | with st.expander("π Source Documents"): |
| | for i, doc in enumerate(result.get("source_documents", [])): |
| | st.write(f"**Source {i+1}:**") |
| | content = doc.page_content |
| | st.write(content[:500] + "..." if len(content) > 500 else content) |
| | if hasattr(doc, 'metadata') and doc.metadata: |
| | st.write(f"*Metadata: {doc.metadata}*") |
| | st.write("---") |
| | |
| | except Exception as e: |
| | st.error(f"An error occurred: {str(e)}") |
| | |
| | def render_content_enhancement_tab(self): |
| | """Render Content Enhancement tab""" |
| | st.header("π§ Content Enhancement") |
| | st.markdown("Analyze and optimize your content for better AI/LLM performance.") |
| | |
| | |
| | input_text = st.text_area( |
| | "Enter content to analyze and enhance:", |
| | height=200, |
| | key="enhancement_input" |
| | ) |
| | |
| | |
| | col1, col2 = st.columns(2) |
| | with col1: |
| | analyze_only = st.checkbox("Analysis only (no rewriting)", value=False) |
| | with col2: |
| | include_keywords = st.checkbox("Include keyword suggestions", value=True) |
| | |
| | |
| | if st.button("π§ Analyze & Enhance", key="enhancement_submit"): |
| | if not input_text.strip(): |
| | st.warning("Please enter some content to analyze.") |
| | return |
| | |
| | try: |
| | with st.spinner("Analyzing content..."): |
| | |
| | result = self.content_optimizer.optimize_content( |
| | input_text, |
| | analyze_only=analyze_only, |
| | include_keywords=include_keywords |
| | ) |
| | |
| | if result.get("error"): |
| | st.error(f"Analysis failed: {result['error']}") |
| | return |
| | |
| | |
| | if analyze_only: |
| | st.success("Content analysis and enhancement completed successfully!") |
| | st.markdown("### π Analysis Results") |
| | |
| | |
| | scores = result.get("scores", {}) |
| | if scores: |
| | col1, col2, col3 = st.columns(3) |
| |
|
| | with col1: |
| | clarity = scores.get("clarity", 0) |
| | st.metric("Clarity", f"{clarity}/10") |
| |
|
| | with col2: |
| | structure = scores.get("structuredness", 0) |
| | st.metric("Structure", f"{structure}/10") |
| |
|
| | with col3: |
| | answerability = scores.get("answerability", 0) |
| | st.metric("Answerability", f"{answerability}/10") |
| |
|
| | |
| | keywords = result.get("keywords", []) |
| | if keywords: |
| | st.markdown("#### π Key Terms") |
| | st.write(", ".join(keywords)) |
| | |
| | |
| | optimized_text = result.get("optimized_text", "") |
| | |
| | if optimized_text : |
| | st.markdown("#### β¨ Optimized Content") |
| | st.text_area( |
| | "Enhanced version:", |
| | value=optimized_text, |
| | height=200, |
| | key="optimized_output" |
| | ) |
| | |
| | |
| | if st.button("π₯ Export Results"): |
| | export_data = self.result_exporter.export_enhancement_results(result) |
| | st.download_button( |
| | label="Download Analysis Report", |
| | data=json.dumps(export_data, indent=2), |
| | file_name=f"content_analysis_{int(time.time())}.json", |
| | mime="application/json" |
| | ) |
| | |
| | except Exception as e: |
| | st.error(f"An error occurred: {str(e)}") |
| | |
| | def render_website_analysis_tab(self): |
| | """Render Website GEO Analysis tab""" |
| | st.header("π Website GEO Analysis") |
| | st.markdown("Analyze websites for Generative Engine Optimization (GEO) performance.") |
| | |
| | |
| | col1, col2 = st.columns([3, 1]) |
| | |
| | with col1: |
| | website_url = st.text_input( |
| | "Enter website URL:", |
| | placeholder="https://example.com" |
| | ) |
| | |
| | with col2: |
| | max_pages = st.selectbox("Pages to analyze:", [1, 3, 5], index=0) |
| | |
| | |
| | col1, col2 = st.columns(2) |
| | with col1: |
| | include_subpages = st.checkbox("Include subpages", value=False) |
| | with col2: |
| | detailed_analysis = st.checkbox("Detailed analysis", value=True) |
| | |
| | |
| | if st.button("π Analyze Website", key="website_analyze"): |
| | if not website_url.strip(): |
| | st.warning("Please enter a website URL.") |
| | return |
| | |
| | try: |
| | |
| | if not website_url.startswith(('http://', 'https://')): |
| | website_url = 'https://' + website_url |
| | |
| | with st.spinner(f"Analyzing website: {website_url}"): |
| | |
| | pages_data = self.webpage_parser.parse_website( |
| | website_url, |
| | max_pages=max_pages, |
| | include_subpages=include_subpages |
| | ) |
| | |
| | if not pages_data: |
| | st.error("Could not extract content from the website.") |
| | return |
| | |
| | st.success(f"Successfully extracted content from {len(pages_data)} page(s)") |
| | |
| | |
| | with st.spinner("Calculating GEO scores..."): |
| | geo_results = [] |
| | |
| | for i, page_data in enumerate(pages_data): |
| | with st.spinner(f"Analyzing page {i+1}/{len(pages_data)}..."): |
| | analysis = self.geo_scorer.analyze_page_geo( |
| | page_data['content'], |
| | page_data['title'], |
| | detailed=detailed_analysis |
| | ) |
| | |
| | if not analysis.get('error'): |
| | analysis['page_data'] = page_data |
| | geo_results.append(analysis) |
| | else: |
| | st.warning(f"Could not analyze page {i+1}: {analysis['error']}") |
| | |
| | if not geo_results: |
| | st.error("Could not analyze any pages from the website.") |
| | return |
| | |
| | |
| | self.display_geo_results(geo_results, website_url) |
| | |
| | |
| | st.markdown("### π₯ Export Results") |
| | if st.button("π Generate Full Report"): |
| | report_data = self.result_exporter.export_geo_results( |
| | geo_results, |
| | website_url |
| | ) |
| | |
| | st.download_button( |
| | label="Download GEO Report", |
| | data=json.dumps(report_data, indent=2), |
| | file_name=f"geo_analysis_{website_url.replace('https://', '').replace('/', '_')}.json", |
| | mime="application/json" |
| | ) |
| | |
| | except Exception as e: |
| | st.error(f"An error occurred during website analysis: {str(e)}") |
| |
|
| | def render_multilingual_tab(self): |
| | st.markdown("### π Multilingual Translator") |
| | st.write("Detect language and translate text into a target language.") |
| |
|
| | text = st.text_area("Enter text:") |
| | if text: |
| | detected_lang = detect_language(text) |
| | st.write(f"Detected Language: **{detected_lang}**") |
| |
|
| | target = st.selectbox("Select target language", ["en", "fr", "es", "de", "ur", "hi", "zh", "ar", "ru"]) |
| | if st.button("Translate"): |
| | result = translate_text(text, target) |
| | st.success("Translation:") |
| | st.write(result) |
| |
|
| | |
| | def display_geo_results(self, geo_results: List[Dict], website_url: str): |
| | """Display GEO analysis results""" |
| | st.markdown("## π GEO Analysis Results") |
| | |
| | |
| | avg_scores = self.calculate_average_scores(geo_results) |
| | overall_avg = sum(avg_scores.values()) / len(avg_scores) if avg_scores else 0 |
| | |
| | |
| | col1, col2, col3 = st.columns([1, 2, 1]) |
| | with col2: |
| | st.metric( |
| | "Overall GEO Score", |
| | f"{overall_avg:.1f}/10", |
| | delta=f"{overall_avg - 7.0:.1f}" if overall_avg != 7.0 else None |
| | ) |
| | |
| | |
| | st.markdown("### π Detailed GEO Metrics") |
| | |
| | |
| | col1, col2, col3, col4 = st.columns(4) |
| | metrics_row1 = [ |
| | ("AI Search Visibility", "ai_search_visibility"), |
| | ("Query Intent Match", "query_intent_matching"), |
| | ("Factual Accuracy", "factual_accuracy"), |
| | ("Conversational Ready", "conversational_readiness") |
| | ] |
| | |
| | for i, (display_name, key) in enumerate(metrics_row1): |
| | with [col1, col2, col3, col4][i]: |
| | score = avg_scores.get(key, 0) |
| | st.metric(display_name, f"{score:.1f}") |
| | |
| | |
| | col1, col2, col3, col4 = st.columns(4) |
| | metrics_row2 = [ |
| | ("Semantic Richness", "semantic_richness"), |
| | ("Context Complete", "context_completeness"), |
| | ("Citation Worthy", "citation_worthiness"), |
| | ("Multi-Query Cover", "multi_query_coverage") |
| | ] |
| | |
| | for i, (display_name, key) in enumerate(metrics_row2): |
| | with [col1, col2, col3, col4][i]: |
| | score = avg_scores.get(key, 0) |
| | st.metric(display_name, f"{score:.1f}") |
| | |
| | |
| | self.display_recommendations(geo_results) |
| | |
| | |
| | with st.expander("π Detailed Page Analysis"): |
| | for i, analysis in enumerate(geo_results): |
| | page_data = analysis.get('page_data', {}) |
| | st.markdown(f"#### Page {i+1}: {page_data.get('title', 'Unknown Title')}") |
| | st.write(f"**URL**: {page_data.get('url', 'Unknown')}") |
| | st.write(f"**Word Count**: {page_data.get('word_count', 0)}") |
| | |
| | |
| | if 'primary_topics' in analysis: |
| | st.write(f"**Topics**: {', '.join(analysis['primary_topics'])}") |
| | |
| | if 'entities' in analysis: |
| | st.write(f"**Entities**: {', '.join(analysis['entities'])}") |
| | |
| | |
| | if 'geo_scores' in analysis: |
| | scores = analysis['geo_scores'] |
| | score_text = ", ".join([f"{k}: {v:.1f}" for k, v in scores.items()]) |
| | st.write(f"**Scores**: {score_text}") |
| | |
| | st.write("---") |
| | |
| | |
| | def display_recommendations(self, geo_results: List[Dict]): |
| | """Display optimization recommendations""" |
| | st.markdown("### π‘ Optimization Recommendations") |
| | |
| | |
| | all_recommendations = [] |
| | all_opportunities = [] |
| | |
| | for analysis in geo_results: |
| | all_recommendations.extend(analysis.get('recommendations', [])) |
| | all_opportunities.extend(analysis.get('optimization_opportunities', [])) |
| | |
| | |
| | unique_recommendations = list(set(all_recommendations)) |
| | |
| | if unique_recommendations: |
| | for i, rec in enumerate(unique_recommendations[:5], 1): |
| | st.write(f"**{i}.** {rec}") |
| | |
| | |
| | if all_opportunities: |
| | st.markdown("#### π Priority Optimizations") |
| | |
| | high_priority = [opp for opp in all_opportunities if opp.get('priority') == 'high'] |
| | medium_priority = [opp for opp in all_opportunities if opp.get('priority') == 'medium'] |
| | |
| | if high_priority: |
| | st.markdown("##### π΄ High Priority") |
| | for opp in high_priority[:3]: |
| | st.write(f"**{opp.get('type', 'Optimization')}**: {opp.get('description', 'No description')}") |
| | |
| | if medium_priority: |
| | st.markdown("##### π‘ Medium Priority") |
| | for opp in medium_priority[:3]: |
| | st.write(f"**{opp.get('type', 'Optimization')}**: {opp.get('description', 'No description')}") |
| | |
| | def calculate_average_scores(self, geo_results: List[Dict]) -> Dict[str, float]: |
| | """Calculate average GEO scores across all pages""" |
| | if not geo_results: |
| | return {} |
| | |
| | |
| | score_keys = list(geo_results[0].get('geo_scores', {}).keys()) |
| | avg_scores = {} |
| | |
| | for key in score_keys: |
| | scores = [ |
| | result['geo_scores'][key] |
| | for result in geo_results |
| | if 'geo_scores' in result and key in result['geo_scores'] |
| | ] |
| | avg_scores[key] = sum(scores) / len(scores) if scores else 0 |
| | |
| | return avg_scores |
| | |
| | def save_uploaded_file(self, uploaded_file) -> str: |
| | """Save uploaded file to temporary location""" |
| | with tempfile.NamedTemporaryFile(delete=False, suffix=".pdf") as tmp_file: |
| | tmp_file.write(uploaded_file.read()) |
| | return tmp_file.name |
| |
|
| |
|
| | def main(): |
| | """Main entry point""" |
| | app = GEOSEOApp() |
| | app.run() |
| |
|
| |
|
| | if __name__ == "__main__": |
| | main() |