import streamlit as st
import json
from datasets import load_dataset
import sqlparse
st.set_page_config(page_title="Proofsteps from Proof-Pile-V2", layout="wide")
st.markdown("
Proofsteps Insepction 🔍
", unsafe_allow_html=True)
st.markdown("""
Here you can inspect proofsteps from [Proof-Pile-V2](https://huggingface.co./datasets/EleutherAI/proof-pile-2).
""")
@st.cache(max_entries=100)
def load_data(lang):
if lang == "Lean Proofsteps":
split = "lean_proofsteps"
elif lang == "Isabelle Proofsteps":
split = "isa_proofsteps"
ds = load_dataset("xu3kev/proof-pile-2-proofsteps", split=f"{split}[:5%]")
return ds
list_languages = ['Lean Proofsteps', 'Isabelle Proofsteps']
chosen_language = st.sidebar.selectbox(
label="Select a Proof Language", options=list_languages, index=0
)
print(chosen_language)
samples = load_data(chosen_language)
st.sidebar.header('Sample Selection')
index_example = st.sidebar.number_input(f"Choose a sample from the existing {len(samples)} samples:", min_value=0, max_value=max(0, len(samples)-1), value=0, step=1)
#db_id = samples[index_example]["db_id"]
#st.markdown(f'{index_example} Question:
', unsafe_allow_html=True)
#st.code(samples[index_example]["question"])
#sql_str = samples[index_example]["SQL"]
#sql_str_pretty = sqlparse.format(sql_str, reindent=True, keyword_case='upper')
#st.markdown(f'SQL:
', unsafe_allow_html=True)
#st.code(sql_str_pretty)
st.markdown(f'Content:
', unsafe_allow_html=True)
st.code(samples[index_example]["text"])
#st.markdown(f'Metadata:
', unsafe_allow_html=True)
#st.code(samples[index_example]["meta"])