File size: 2,763 Bytes
e9f938b
 
 
 
 
 
 
 
 
 
 
 
 
19236c8
e9f938b
19236c8
ddab103
e9f938b
19236c8
e9f938b
 
 
 
 
 
 
 
 
 
c323af3
e9f938b
cc6b025
e9f938b
 
2628b21
e9f938b
 
c323af3
 
 
 
e9f938b
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
e0ed415
e9f938b
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
import gradio as gr
from gradio_leaderboard import Leaderboard, SelectColumns, ColumnFilter
from pathlib import Path

from utils import LLM_BENCHMARKS_ABOUT_TEXT, LLM_BENCHMARKS_SUBMIT_TEXT, custom_css, jsonl_to_dataframe, add_average_column_to_df, apply_markdown_format_for_columns, submit, PART_LOGO, sort_dataframe_by_column



abs_path = Path(__file__).parent

# Any pandas-compatible data
leaderboard_df = jsonl_to_dataframe(str(abs_path / "leaderboard_data.jsonl"))

average_column_name = "Average Accuracy"

all_columns = ["Model", average_column_name, "Precision", "#Params (B)", "Part Multiple Choice", "ARC Easy", "ARC Challenge", "MMLU Pro", "AUT Multiple Choice Persian"]
columns_to_average = ["Part Multiple Choice", "ARC Easy", "ARC Challenge", "MMLU Pro", "AUT Multiple Choice Persian"]



leaderboard_df = add_average_column_to_df(leaderboard_df, columns_to_average, index=3, average_column_name=average_column_name)

leaderboard_df = apply_markdown_format_for_columns(df=leaderboard_df, model_column_name="Model")
leaderboard_df = sort_dataframe_by_column(leaderboard_df, column_name=average_column_name)

columns_data_type = ["markdown" for i in range(len(leaderboard_df.columns))]
# "str", "number", "bool", "date", "markdown"
# columns_data_type[0] = "markdown"

NUM_MODELS=len(leaderboard_df)

with gr.Blocks(css=custom_css,theme=gr.themes.Default(font=["sans-serif","ui-sans-serif","system-ui"], font_mono=["monospace","ui-monospace","Consolas"])) as demo:
    # gr.HTML(PART_LOGO)
    gr.Markdown("""
    # Open Persian LLM Leaderboard
    """)

    gr.Markdown(f"""
    - **Total Models**: {NUM_MODELS}
    """)

    with gr.Tab("πŸŽ–οΈ Persian Leaderboard"):
        Leaderboard(
        value=leaderboard_df,
        datatype=columns_data_type,
        select_columns=SelectColumns(
            default_selection=all_columns,
            cant_deselect=["Model"],
            label="Select Columns to Show",
        ),
        search_columns=["model_name_for_query"],
        hide_columns=["model_name_for_query",],
        filter_columns=["Precision", "#Params (B)"],
    )
    with gr.TabItem("πŸ“ About"):
        gr.Markdown(LLM_BENCHMARKS_ABOUT_TEXT)

    with gr.Tab("βœ‰οΈ Submit"):
        gr.Markdown(LLM_BENCHMARKS_SUBMIT_TEXT)
        model_name = gr.Textbox(label="Model name")
        model_id = gr.Textbox(label="username/space e.g PartAI/Dorna-Llama3-8B-Instruct")
        contact_email = gr.Textbox(label="Contact E-Mail")
        submit_btn = gr.Button("Submit")

        submit_btn.click(submit, inputs=[model_name, model_id, contact_email], outputs=[])

        gr.Markdown("""
        Please find more information about Part DP AI on [partdp.ai](https://partdp.ai)""")

if __name__ == "__main__":
    demo.launch()