"""Streamlit app for browsing proofstep samples from Proof-Pile-V2.

The sidebar selects a proof language and a sample index; the main pane shows
the ``text`` field of the selected record.
"""

import json

import sqlparse
import streamlit as st
from datasets import load_dataset

st.set_page_config(page_title="Proofsteps from Proof-Pile-V2", layout="wide")

# NOTE(review): the heading markup around the titles in this script was lost
# in the copy under review; plain <h1>/<h3> tags are used as a stand-in.
# Restore the original tags/styling if they are known.
st.markdown("<h1>Proofsteps Inspection 🔍</h1>", unsafe_allow_html=True)

st.markdown(
    """
Here you can inspect proofsteps from [Proof-Pile-V2](https://huggingface.co/datasets/EleutherAI/proof-pile-2).
"""
)

# Sidebar label -> split name in the "xu3kev/proof-pile-2-proofsteps" dataset.
# Insertion order is the order the options are shown in the select box.
_SPLIT_BY_LANGUAGE = {
    "Lean Proofsteps": "lean_proofsteps",
    "Isabelle Proofsteps": "isa_proofsteps",
}

# st.cache is deprecated in recent Streamlit releases; st.cache_resource is
# the replacement intended for shared, non-copied objects such as a loaded
# dataset. Fall back to st.cache so older Streamlit versions keep working.
if hasattr(st, "cache_resource"):
    _cache_dataset = st.cache_resource(max_entries=100)
else:
    _cache_dataset = st.cache(max_entries=100)


@_cache_dataset
def load_data(lang):
    """Load the first 5% of the proofsteps split for the given language.

    Args:
        lang: One of the sidebar labels, "Lean Proofsteps" or
            "Isabelle Proofsteps".

    Returns:
        The object returned by ``datasets.load_dataset`` for the slice
        ``"<split>[:5%]"`` of "xu3kev/proof-pile-2-proofsteps".

    Raises:
        ValueError: If ``lang`` is not a known language label.
    """
    try:
        split = _SPLIT_BY_LANGUAGE[lang]
    except KeyError:
        # Previously an unknown label left `split` unassigned and failed with
        # an opaque UnboundLocalError.
        raise ValueError(
            f"Unknown proof language {lang!r}; "
            f"expected one of {list(_SPLIT_BY_LANGUAGE)}"
        ) from None
    return load_dataset("xu3kev/proof-pile-2-proofsteps", split=f"{split}[:5%]")


list_languages = list(_SPLIT_BY_LANGUAGE)
chosen_language = st.sidebar.selectbox(
    label="Select a Proof Language",
    options=list_languages,
    index=0,
)
# Echo the current selection to the server's stdout.
print(chosen_language)

samples = load_data(chosen_language)
num_samples = len(samples)

st.sidebar.header('Sample Selection')
index_example = st.sidebar.number_input(
    f"Choose a sample from the existing {num_samples} samples:",
    min_value=0,
    # Keep the bound valid (>= min_value) even when the split is empty.
    max_value=max(0, num_samples - 1),
    value=0,
    step=1,
)

if num_samples == 0:
    # Indexing an empty split would raise IndexError; tell the user instead.
    st.warning("No samples are available for the selected language.")
    st.stop()

st.markdown('<h3>Content:</h3>', unsafe_allow_html=True)
st.code(samples[index_example]["text"])

# NOTE(review): an earlier, disabled section rendered
# samples[index_example]["meta"] under a "Metadata:" heading. Presumably the
# records carry a "meta" field; confirm before re-enabling it.