Spaces:

XINZHANG-Geotab
/

RelevancyApp

Running

App Files Files Community

RelevancyApp / app.py

XINZHANG-Geotab

added

62c4367 9 months ago

raw

history blame contribute delete

9.3 kB

	from utils import (
	container_emphasis_css,
	container_regular_css,
	question_font,
	modify_sql_guid_injection
	)

	import streamlit as st
	import json
	import pandas as pd
	from datetime import datetime
	from streamlit_extras.stylable_container import stylable_container

	@st.cache_data
	def load_data(file):
	return pd.read_csv(file)

	st.set_page_config(layout="wide", initial_sidebar_state="expanded")
	st.title("Relevancy Compare App")
	st.divider()
	st.markdown(question_font, unsafe_allow_html=True)


	def edit_df_data_change():
	edited_rows: dict = st.session_state.edit_df_data['edited_rows']
	st.session_state.previous_row_index = st.session_state.previous_row_index
	st.session_state.current_row_index = next(iter(edited_rows))
	st.session_state.df = st.session_state.df.assign(selected=False)
	update_dict = {idx: values for idx, values in edited_rows.items()}
	st.session_state.df.update(pd.DataFrame.from_dict(update_dict, orient='index'))


	st.need_rerun = False
	if "df" not in st.session_state:
	role_pick = st.selectbox("You are?", options=["Kyle", "Shadi", "Daniel", "Xin"], index=None, key='role_pick')
	uploaded_file = st.file_uploader("Choose a CSV file", type="csv")
	st.session_state.role = role_pick
	st.need_rerun = True
	else:
	uploaded_file = st.session_state.df
	if uploaded_file is not None and 'role' in st.session_state:
	"You are modifying as :", st.session_state.role
	with st.container():
	if "df" not in st.session_state:
	df = load_data(uploaded_file)
	st.session_state.df_shape = df.shape
	# selected load
	select_values = [False] * len(df)

	if "Comment" not in df.columns:
	comments = [''] * len(df)
	df.insert(0, 'Comment', comments)
	st.session_state.default_row_index = 0

	if "LastModified" not in df.columns:
	modifies = [''] * len(df)
	df.insert(0, 'LastModified', modifies)

	else:
	df['Comment'] = df['Comment'].astype(str)
	df['LastModified'] = df['LastModified'].astype(str)
	comments = [c if c != 'nan' else '' for c in df['Comment'].tolist()]
	modifies = [c if c != 'nan' else '' for c in df['LastModified'].tolist()]
	df['Comment'] = comments
	df['LastModified'] = modifies
	first_nan = 0
	for i, c in enumerate(comments):
	if not c:
	first_nan = i
	break
	st.session_state.default_row_index = first_nan

	st.session_state.current_row_index = st.session_state.default_row_index
	st.session_state.previous_row_index = st.session_state.current_row_index

	df.insert(0, 'Select', select_values)
	df.at[st.session_state.current_row_index, 'Select'] = True
	st.session_state['df'] = df

	df_col, = st.columns(1)

	st.session_state.previous_row_index = st.session_state.current_row_index
	with st.container():
	bcol1, bcol2, _ = st.columns([1, 1, 5])
	with bcol1:
	previous_row = st.button("Prev Row")
	with bcol2:
	next_row = st.button("Next Row")


	if "current_row_index" in st.session_state and previous_row:
	if st.session_state.current_row_index > 0:
	st.session_state.previous_row_index = st.session_state.current_row_index
	st.session_state.current_row_index -= 1

	if "current_row_index" in st.session_state and next_row:
	if st.session_state.current_row_index < st.session_state.df_shape[0] - 1:
	st.session_state.previous_row_index = st.session_state.current_row_index
	st.session_state.current_row_index += 1

	row_index = st.session_state.current_row_index
	row_data = st.session_state.df.loc[row_index]
	question = row_data['question']
	pred_relevant_choice = row_data['pred_relevant_choice']
	correct_response = row_data['correct_response']
	relative_relevancy = json.loads(row_data['relative_relevancy'])
	reason = relative_relevancy['reason']
	most_relevant = relative_relevancy['most_relevant']
	options=['first', 'second', 'both']
	default_index = options.index(most_relevant)
	default_comment = row_data['Comment']
	first_css = container_regular_css
	second_css = container_regular_css
	first_color = ':black'
	second_color = ':black'


	st.write(f"##### Row {row_index}/{st.session_state.df_shape[0]-1}")
	with st.container(border=True):
	# st.write(f"Question: {question}")
	st.markdown(f'<p class="question-font">[Q]: {question}</p>', unsafe_allow_html=True)
	select_by = st.selectbox("Mark By: ", ["pred_relevant_choice", "correct_response"], key='mark_by_dropdown')
	col1_res, col2_res, _ = st.columns([0.2, 0.2, 0.6])
	if select_by == 'pred_relevant_choice':
	col1_res.write(f":blue[pred_relevant_choice: {pred_relevant_choice}]")
	col2_res.write(f"correct_response: {correct_response}")
	else:
	col1_res.write(f"pred_relevant_choice: {pred_relevant_choice}")
	col2_res.write(f":blue[correct_response: {correct_response}]")


	if row_data[select_by].lower() == 'first' or row_data[select_by].lower() == 'both':
	first_css = container_emphasis_css
	first_color = ':blue'

	if row_data[select_by].lower() == 'both':
	second_css = container_emphasis_css
	second_color = ':blue'
	else:
	second_css = container_emphasis_css
	second_color = ':blue'

	col1, col2 = st.columns(2)
	with col1:
	st.write("Target SQL:", use_container_width=True)
	with stylable_container(
	key="first_sql_container",
	css_styles=first_css
	):
	target_sql_text = modify_sql_guid_injection(row_data['target_sql'].strip())
	#st.write(f"{first_color}[{target_sql_text}]", use_container_width=True)
	col1, _ = st.columns([0.99, 0.01])
	with col1:
	st.code(
	target_sql_text,
	language="sql"
	)
	# st.code(
	# "\n".join(
	# tw.wrap(
	# target_sql_text,
	# width=60,
	# )
	# ),
	# language="sql"
	# )

	with col2:
	st.write("Predicted SQL:", use_container_width=True)
	with stylable_container(
	key="second_sql_container",
	css_styles=second_css
	):
	predicted_sql_text = modify_sql_guid_injection(row_data['predicted_sql'].strip())
	# st.write(f"{second_color}[{predicted_sql_text}]")
	col1, _ = st.columns([0.99, 0.01])
	with col1:
	st.code(
	predicted_sql_text,
	language="sql"
	)
	col1_comment, col2_comment = st.columns([1, 1])
	with col1_comment:
	select_most_relevant = st.selectbox("most_relevant", options=options, index=default_index, key='most_relevant_drop_down')
	reason_box = st.text_area("reason", value=reason, key='reason_text')
	with col2_comment:
	comment = st.text_area("Comment", value=default_comment, key='comment_text')

	with st.container():
	bcol1, bcol2, _, _, _, _, _, _, _, _ = st.columns(10)
	with bcol1:
	save = st.button("Save")
	with bcol2:
	download = st.button("Download")

	if save:
	updated_relative_relevancy = json.dumps({'most_relevant': select_most_relevant, "reason": reason_box})
	st.session_state.df.at[row_index, 'Comment'] = comment
	st.session_state.df.at[row_index, 'relative_relevancy'] = updated_relative_relevancy
	st.session_state.df.at[row_index, 'correct_response'] = select_most_relevant
	current_time = datetime.now()
	current_time_str = current_time.strftime("%Y-%m-%d %H:%M:%S")
	st.session_state.df.at[row_index, 'LastModified'] = f"{st.session_state.role}@{current_time_str}"
	df = st.session_state.df.drop('Select', axis=1)
	df.to_csv('modified.csv', index=False)
	st.rerun()

	if download:
	with open('modified.csv') as f:
	st.download_button('Download modified CSV', f, file_name='modified.csv')

	st.session_state.df['Select'] = False
	st.session_state.df.at[st.session_state.current_row_index, 'Select'] = True

	edited_df = df_col.data_editor(st.session_state.df, num_rows="fixed", use_container_width=True, key='edit_df_data', on_change=edit_df_data_change)

	#st.session_state.mannul_select = edited_df[edited_df['Select']].index
	st.session_state.df = edited_df

	if st.need_rerun:
	st.need_rerun = False
	st.rerun()