import logging
import time
import traceback
from datetime import timedelta

import pandas as pd
import streamlit as st

from output import init_settings as init_output_settings
from output import scan as scan_output
from prompt import init_settings as init_prompt_settings
from prompt import scan as scan_prompt

from llm_guard.vault import Vault
PROMPT = "prompt"
OUTPUT = "output"
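# Shared vault so stateful scanners (e.g. Anonymize on the prompt side and
# Deanonymize on the output side) can pass placeholders between calls.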
vault = Vault()
st.set_page_config(
    page_title="LLM Guard Playground",
    layout="wide",
    initial_sidebar_state="expanded",
    menu_items={
        "About": "https://laiyer-ai.github.io/llm-guard/",
    },
)
logger = logging.getLogger("llm-guard-playground")
logger.setLevel(logging.INFO)
# Sidebar
st.sidebar.header(
    """
Scanning prompt and output using [LLM Guard](https://laiyer-ai.github.io/llm-guard/)
"""
)
scanner_type = st.sidebar.selectbox("Type", [PROMPT, OUTPUT], index=0)
st_fail_fast = st.sidebar.checkbox(
    "Fail fast", value=False, help="Stop scanning after first failure"
)
enabled_scanners = None
settings = None
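# The per-mode helpers render the sidebar controls and return the scanners the
# user enabled together with their per-scanner settings.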
if scanner_type == PROMPT:
    enabled_scanners, settings = init_prompt_settings()
elif scanner_type == OUTPUT:
    enabled_scanners, settings = init_output_settings()
# Main panel
with st.expander("About", expanded=False):
    st.info(
        """LLM-Guard is a comprehensive tool designed to fortify the security of Large Language Models (LLMs).
        \n\n[Code](https://github.com/laiyer-ai/llm-guard) |
        [Documentation](https://laiyer-ai.github.io/llm-guard/)"""
    )

    st.markdown(
        "[![Pypi Downloads](https://img.shields.io/pypi/dm/llm-guard.svg)](https://img.shields.io/pypi/dm/llm-guard.svg)"  # noqa
        "[![MIT license](https://img.shields.io/badge/license-MIT-brightgreen.svg)](https://opensource.org/licenses/MIT)"
        "![GitHub Repo stars](https://img.shields.io/github/stars/laiyer-ai/llm-guard?style=social)"
    )
analyzer_load_state = st.info("Starting LLM Guard...")
analyzer_load_state.empty()
# Read default text
with open("prompt_text.txt") as f:
demo_prompt_text = f.readlines()
with open("output_text.txt") as f:
demo_output_text = f.readlines()
# Before scanning: input area
st.subheader("Guard Prompt" if scanner_type == PROMPT else "Guard Output")
if scanner_type == PROMPT:
    st_prompt_text = st.text_area(
        label="Enter prompt", value="".join(demo_prompt_text), height=200, key="prompt_text_input"
    )
elif scanner_type == OUTPUT:
    col1, col2 = st.columns(2)

    st_prompt_text = col1.text_area(
        label="Enter prompt", value="".join(demo_prompt_text), height=300, key="prompt_text_input"
    )
    st_output_text = col2.text_area(
        label="Enter output", value="".join(demo_output_text), height=300, key="output_text_input"
    )
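# Scan results; populated once the form below is submitted.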
st_result_text = None
st_analysis = None
st_is_valid = None
st_time_delta = None
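# Run the enabled scanners when the form is submitted and collect, per scanner,
# whether the text passed and its risk score.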
try:
    with st.form("text_form", clear_on_submit=False):
        submitted = st.form_submit_button("Process")

        if submitted:
            results_valid = {}
            results_score = {}

            # Time the full scan so the duration can be shown with the results
            start_time = time.monotonic()
            if scanner_type == PROMPT:
                st_result_text, results_valid, results_score = scan_prompt(
                    vault, enabled_scanners, settings, st_prompt_text, st_fail_fast
                )
            elif scanner_type == OUTPUT:
                st_result_text, results_valid, results_score = scan_output(
                    vault, enabled_scanners, settings, st_prompt_text, st_output_text, st_fail_fast
                )
            end_time = time.monotonic()
            st_time_delta = timedelta(seconds=end_time - start_time)

            # The text is valid only if every enabled scanner passed
            st_is_valid = all(results_valid.values())

            # One table row per scanner: name, pass/fail, and risk score
            st_analysis = [
                {"scanner": k, "is valid": results_valid[k], "risk score": results_score[k]}
                for k in results_valid
            ]
except Exception as e:
    logger.error(e)
    traceback.print_exc()
    st.error(e)
# After scanning: results
if st_is_valid is not None:
    st.subheader(
        f"Results - {'valid' if st_is_valid else 'invalid'} ({round(st_time_delta.total_seconds())} seconds)"
    )

    col1, col2 = st.columns(2)
    with col1:
        st.text_area(label="Sanitized text", value=st_result_text, height=400)
    with col2:
        st.table(pd.DataFrame(st_analysis))