Spaces:

OEvortex
/

Webscout-API

Running

App Files Files Community

Webscout-API / app.py

KingNish

Update app.py

70a0c4d verified 2 months ago

raw

history blame

No virus

16.1 kB

	from fastapi import FastAPI, HTTPException, Query # Make sure Query is imported
	from fastapi.responses import JSONResponse
	from webscout import WEBS, transcriber, LLM
	from typing import Optional, List, Dict, Union # Import List, Dict, Union
	from fastapi.encoders import jsonable_encoder
	from bs4 import BeautifulSoup
	import requests
	import urllib.parse

	app = FastAPI()

	@app.get("/")
	async def root():
	return {"message": "API documentation can be found at /docs"}

	@app.get("/health")
	async def health_check():
	return {"status": "OK"}

	@app.get("/api/search")
	async def search(
	q: str,
	max_results: int = 10,
	timelimit: Optional[str] = None,
	safesearch: str = "moderate",
	region: str = "wt-wt",
	backend: str = "api"
	):
	"""Perform a text search."""
	try:
	with WEBS() as webs:
	results = webs.text(keywords=q, region=region, safesearch=safesearch, timelimit=timelimit, backend=backend, max_results=max_results)
	return JSONResponse(content=jsonable_encoder(results))
	except Exception as e:
	raise HTTPException(status_code=500, detail=f"Error during search: {e}")

	@app.get("/api/images")
	async def images(
	q: str,
	max_results: int = 10,
	safesearch: str = "moderate",
	region: str = "wt-wt",
	timelimit: Optional[str] = None,
	size: Optional[str] = None,
	color: Optional[str] = None,
	type_image: Optional[str] = None,
	layout: Optional[str] = None,
	license_image: Optional[str] = None
	):
	"""Perform an image search."""
	try:
	with WEBS() as webs:
	results = webs.images(keywords=q, region=region, safesearch=safesearch, timelimit=timelimit, size=size, color=color, type_image=type_image, layout=layout, license_image=license_image, max_results=max_results)
	return JSONResponse(content=jsonable_encoder(results))
	except Exception as e:
	raise HTTPException(status_code=500, detail=f"Error during image search: {e}")

	@app.get("/api/videos")
	async def videos(
	q: str,
	max_results: int = 10,
	safesearch: str = "moderate",
	region: str = "wt-wt",
	timelimit: Optional[str] = None,
	resolution: Optional[str] = None,
	duration: Optional[str] = None,
	license_videos: Optional[str] = None
	):
	"""Perform a video search."""
	try:
	with WEBS() as webs:
	results = webs.videos(keywords=q, region=region, safesearch=safesearch, timelimit=timelimit, resolution=resolution, duration=duration, license_videos=license_videos, max_results=max_results)
	return JSONResponse(content=jsonable_encoder(results))
	except Exception as e:
	raise HTTPException(status_code=500, detail=f"Error during video search: {e}")

	@app.get("/api/news")
	async def news(
	q: str,
	max_results: int = 10,
	safesearch: str = "moderate",
	region: str = "wt-wt",
	timelimit: Optional[str] = None
	):
	"""Perform a news search."""
	try:
	with WEBS() as webs:
	results = webs.news(keywords=q, region=region, safesearch=safesearch, timelimit=timelimit, max_results=max_results)
	return JSONResponse(content=jsonable_encoder(results))
	except Exception as e:
	raise HTTPException(status_code=500, detail=f"Error during news search: {e}")

	@app.get("/api/llm")
	async def llm_chat(
	model: str,
	message: str,
	system_prompt: str = Query(None, description="Optional custom system prompt")
	):
	"""Interact with a specified large language model with an optional system prompt."""
	try:
	messages = [{"role": "user", "content": message}]
	if system_prompt:
	messages.insert(0, {"role": "system", "content": system_prompt}) # Add system message at the beginning

	llm = LLM(model=model)
	response = llm.chat(messages=messages)
	return JSONResponse(content={"response": response})
	except Exception as e:
	raise HTTPException(status_code=500, detail=f"Error during LLM chat: {e}")


	@app.get("/api/answers")
	async def answers(q: str):
	"""Get instant answers for a query."""
	try:
	with WEBS() as webs:
	results = webs.answers(keywords=q)
	return JSONResponse(content=jsonable_encoder(results))
	except Exception as e:
	raise HTTPException(status_code=500, detail=f"Error getting instant answers: {e}")

	@app.get("/api/suggestions")
	async def suggestions(q: str, region: str = "wt-wt"):
	"""Get search suggestions for a query."""
	try:
	with WEBS() as webs:
	results = webs.suggestions(keywords=q, region=region)
	return JSONResponse(content=jsonable_encoder(results))
	except Exception as e:
	raise HTTPException(status_code=500, detail=f"Error getting search suggestions: {e}")

	@app.get("/api/chat")
	async def chat(
	q: str,
	model: str = "gpt-3.5"
	):
	"""Perform a text search."""
	try:
	with WEBS() as webs:
	results = webs.chat(keywords=q, model=model)
	return JSONResponse(content=jsonable_encoder(results))
	except Exception as e:
	raise HTTPException(status_code=500, detail=f"Error getting chat results: {e}")

	def extract_text_from_webpage(html_content):
	"""Extracts visible text from HTML content using BeautifulSoup."""
	soup = BeautifulSoup(html_content, "html.parser")
	# Remove unwanted tags
	for tag in soup(["script", "style", "header", "footer", "nav"]):
	tag.extract()
	# Get the remaining visible text
	visible_text = soup.get_text(strip=True)
	return visible_text

	@app.get("/api/web_extract")
	async def web_extract(
	url: str,
	max_chars: int = 12000, # Adjust based on token limit
	):
	"""Extracts text from a given URL."""
	try:
	response = requests.get(url, headers={"User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64; rv:109.0) Gecko/20100101 Firefox/111.0"})
	response.raise_for_status()
	visible_text = extract_text_from_webpage(response.text)
	if len(visible_text) > max_chars:
	visible_text = visible_text[:max_chars] + "..."
	return {"url": url, "text": visible_text}
	except requests.exceptions.RequestException as e:
	raise HTTPException(status_code=500, detail=f"Error fetching or processing URL: {e}")

	@app.get("/api/search-and-extract")
	async def web_search_and_extract(
	q: str,
	max_results: int = 3,
	timelimit: Optional[str] = None,
	safesearch: str = "moderate",
	region: str = "wt-wt",
	backend: str = "api",
	max_chars: int = 6000,
	extract_only: bool = False
	):
	"""
	Searches using WEBS, extracts text from the top results, and returns both.
	"""
	try:
	with WEBS() as webs:
	# Perform WEBS search
	search_results = webs.text(keywords=q, region=region, safesearch=safesearch,
	timelimit=timelimit, backend=backend, max_results=max_results)

	# Extract text from each result's link
	extracted_results = []
	for result in search_results:
	if 'href' in result:
	link = result['href']
	try:
	response = requests.get(link, headers={"User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64; rv:109.0) Gecko/20100101 Firefox/111.0"})
	response.raise_for_status()
	visible_text = extract_text_from_webpage(response.text)
	if len(visible_text) > max_chars:
	visible_text = visible_text[:max_chars] + "..."
	extracted_results.append({"link": link, "text": visible_text})
	except requests.exceptions.RequestException as e:
	print(f"Error fetching or processing {link}: {e}")
	extracted_results.append({"link": link, "text": None})
	else:
	extracted_results.append({"link": None, "text": None})
	if extract_only:
	return JSONResponse(content=jsonable_encoder({extracted_results}))
	else:
	return JSONResponse(content=jsonable_encoder({"search_results": search_results, "extracted_results": extracted_results}))
	except Exception as e:
	raise HTTPException(status_code=500, detail=f"Error during search and extraction: {e}")

	@app.get("/api/adv_web_search")
	async def adv_web_search(
	q: str,
	model: str = "gpt-3.5",
	max_results: int = 3,
	timelimit: Optional[str] = None,
	safesearch: str = "moderate",
	region: str = "wt-wt",
	backend: str = "api",
	max_chars: int = 6000,
	system_prompt: str = Query(None, description="Optional custom system prompt")
	):
	"""
	Combines web search, web extraction, and LLM chat for advanced search.
	"""
	try:
	with WEBS() as webs:
	# 1. Perform the web search
	search_results = webs.text(keywords=q, region=region,
	safesearch=safesearch,
	timelimit=timelimit, backend=backend,
	max_results=max_results)

	# 2. Extract text from top search result URLs
	extracted_text = ""
	for result in search_results:
	if 'href' in result:
	link = result['href']
	try:
	response = requests.get(link, headers={"User-Agent": "Mozilla/5.0"})
	response.raise_for_status()
	visible_text = extract_text_from_webpage(response.text)
	if len(visible_text) > max_chars:
	visible_text = visible_text[:max_chars] + "..."
	extracted_text += f"## Content from: {link}\n\n{visible_text}\n\n"
	except requests.exceptions.RequestException as e:
	print(f"Error fetching or processing {link}: {e}")
	else:
	pass

	# 3. Construct the prompt for the LLM
	llm_prompt = f"Query by user: {q} , Answerthe query asked by user using these search results, Which contains real time data, Try to give best response: {extracted_text}"

	# 4. Get the LLM's response using LLM class (similar to /api/llm)
	messages = [{"role": "user", "content": llm_prompt}]
	if system_prompt:
	messages.insert(0, {"role": "system", "content": system_prompt})

	llm = LLM(model=model)
	llm_response = llm.chat(messages=messages)

	# 5. Return the results
	return JSONResponse(content=jsonable_encoder({ "llm_response": llm_response }))

	except Exception as e:
	raise HTTPException(status_code=500, detail=f"Error during advanced search: {e}")


	@app.get("/api/website_summarizer")
	async def website_summarizer(url: str):
	"""Summarizes the content of a given URL using a chat model."""
	try:
	# Extract text from the given URL
	response = requests.get(url, headers={"User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64; rv:109.0) Gecko/20100101 Firefox/111.0"})
	response.raise_for_status()
	visible_text = extract_text_from_webpage(response.text)
	if len(visible_text) > 7500: # Adjust max_chars based on your needs
	visible_text = visible_text[:7500] + "..."

	# Use chat model to summarize the extracted text
	with WEBS() as webs:
	summary_prompt = f"Summarize this in detail in Paragraph: {visible_text}"
	summary_result = webs.chat(keywords=summary_prompt, model="gpt-3.5")

	# Return the summary result
	return JSONResponse(content=jsonable_encoder({summary_result}))

	except requests.exceptions.RequestException as e:
	raise HTTPException(status_code=500, detail=f"Error fetching or processing URL: {e}")
	except Exception as e:
	raise HTTPException(status_code=500, detail=f"Error during summarization: {e}")

	@app.get("/api/ask_website")
	async def ask_website(url: str, question: str, model: str = "llama-3-70b"):
	"""
	Asks a question about the content of a given website.
	"""
	try:
	# Extract text from the given URL
	response = requests.get(url, headers={"User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64; rv:109.0) Gecko/20100101 Firefox/111.0"})
	response.raise_for_status()
	visible_text = extract_text_from_webpage(response.text)
	if len(visible_text) > 7500: # Adjust max_chars based on your needs
	visible_text = visible_text[:7500] + "..."

	# Construct a prompt for the chat model
	prompt = f"Based on the following text, answer this question in Paragraph: [QUESTION] {question} [TEXT] {visible_text}"

	# Use chat model to get the answer
	with WEBS() as webs:
	answer_result = webs.chat(keywords=prompt, model=model)

	# Return the answer result
	return JSONResponse(content=jsonable_encoder({answer_result}))

	except requests.exceptions.RequestException as e:
	raise HTTPException(status_code=500, detail=f"Error fetching or processing URL: {e}")
	except Exception as e:
	raise HTTPException(status_code=500, detail=f"Error during question answering: {e}")

	@app.get("/api/maps")
	async def maps(
	q: str,
	place: Optional[str] = None,
	street: Optional[str] = None,
	city: Optional[str] = None,
	county: Optional[str] = None,
	state: Optional[str] = None,
	country: Optional[str] = None,
	postalcode: Optional[str] = None,
	latitude: Optional[str] = None,
	longitude: Optional[str] = None,
	radius: int = 0,
	max_results: int = 10
	):
	"""Perform a maps search."""
	try:
	with WEBS() as webs:
	results = webs.maps(keywords=q, place=place, street=street, city=city, county=county, state=state, country=country, postalcode=postalcode, latitude=latitude, longitude=longitude, radius=radius, max_results=max_results)
	return JSONResponse(content=jsonable_encoder(results))
	except Exception as e:
	raise HTTPException(status_code=500, detail=f"Error during maps search: {e}")

	@app.get("/api/translate")
	async def translate(
	q: str,
	from_: Optional[str] = None,
	to: str = "en"
	):
	"""Translate text."""
	try:
	with WEBS() as webs:
	results = webs.translate(keywords=q, from_=from_, to=to)
	return JSONResponse(content=jsonable_encoder(results))
	except Exception as e:
	raise HTTPException(status_code=500, detail=f"Error during translation: {e}")

	@app.get("/api/youtube/transcript")
	async def youtube_transcript(
	video_id: str,
	languages: str = "en",
	preserve_formatting: bool = False
	):
	"""Get the transcript of a YouTube video."""
	try:
	languages_list = languages.split(",")
	transcript = transcriber.get_transcript(video_id, languages=languages_list, preserve_formatting=preserve_formatting)
	return JSONResponse(content=jsonable_encoder(transcript))
	except Exception as e:
	raise HTTPException(status_code=500, detail=f"Error getting YouTube transcript: {e}")

	import requests
	@app.get("/weather/json/{location}")
	def get_weather_json(location: str):
	url = f"https://wttr.in/{location}?format=j1"
	response = requests.get(url)
	if response.status_code == 200:
	return response.json()
	else:
	return {"error": f"Unable to fetch weather data. Status code: {response.status_code}"}

	@app.get("/weather/ascii/{location}")
	def get_ascii_weather(location: str):
	url = f"https://wttr.in/{location}"
	response = requests.get(url, headers={'User-Agent': 'curl'})
	if response.status_code == 200:
	return response.text
	else:
	return {"error": f"Unable to fetch weather data. Status code: {response.status_code}"}

	# Run the API server if this script is executed
	if __name__ == "__main__":
	import uvicorn
	uvicorn.run(app, host="0.0.0.0", port=8083)