import os import json import glob from collections import defaultdict import pandas as pd import gradio as gr from content import * from css import * import glob ARC = "arc" HELLASWAG = "hellaswag" MMLU = "mmlu" TRUTHFULQA = "truthfulqa" BENCHMARKS = [ARC, HELLASWAG, MMLU, TRUTHFULQA] METRICS = ["acc_norm", "acc_norm", "acc_norm", "mc2"] LANGS = 'ar,bn,ca,da,de,es,eu,fr,gu,hi,hr,hu,hy,id,it,kn,ml,mr,ne,nl,pt,ro,ru,sk,sr,sv,ta,te,uk,vi,zh'.split(',') LANG_NAME = { 'ar': 'Arabic', 'bn': 'Bengali', 'ca': 'Catalan', 'da': 'Danish', 'de': 'German', 'es': 'Spanish', 'eu': 'Basque', 'fr': 'French', 'gu': 'Gujarati', 'hi': 'Hindi', 'hr': 'Croatian', 'hu': 'Hungarian', 'hy': 'Armenian', 'id': 'Indonesian', 'it': 'Italian', 'kn': 'Kannada', 'ml': 'Malayalam', 'mr': 'Marathi', 'ne': 'Nepali', 'nl': 'Dutch', 'pt': 'Portuguese', 'ro': 'Romanian', 'ru': 'Russian', 'sk': 'Slovak', 'sr': 'Serbian', 'sv': 'Swedish', 'ta': 'Tamil', 'te': 'Telugu', 'uk': 'Ukrainian', 'vi': 'Vietnamese', 'zh': 'Chinese' } NONE_COL = "None" COLS = ["Method", "Model" , "SS Easy", "SS Medium", "SS Hard", "MS Easy", "MS Meduium", "MS Hard", "Overall", NONE_COL] TYPES = ["str", "str", "number", "number", "number", "number", "number", "number", "number", "number" , "number"] df = [] row = ["React", "Qwen-plus" , "10.5", "20.6", "30.4", "10.5", "20.6", "30.4", "20", NONE_COL] df.append(row) df.append(row) df.append(row) df.append(row) df = pd.DataFrame.from_records(df, columns=COLS) df = df.sort_values(by=["Method", "Overall"], ascending=False) df = df[COLS] demo = gr.Blocks(css=CUSTOM_CSS) with demo: gr.HTML(TITLE) gr.Markdown(INTRO_TEXT, elem_classes="markdown-text") gr.Markdown(HOW_TO, elem_classes="markdown-text") print(TYPES) print(df.columns) with gr.Group(): with gr.Tab("Results: Agent"): leaderboard_table_test = gr.components.Dataframe( value=df, datatype=TYPES, interactive=False, column_widths = ["20%"] * len(df.columns) ) with gr.Tab("Results: RAG-system"): leaderboard_table_val = gr.components.Dataframe( value=df, datatype=TYPES, interactive=False, column_widths=["20%"] ) gr.Markdown(CREDIT, elem_classes="markdown-text") gr.Markdown(CITATION, elem_classes="markdown-text") demo.launch(share=True)