ArmBench-LLM / main.py
daniel7an
commit
d21b14f
raw
history blame
1.3 kB
import gradio as gr
import pandas as pd
import plotly.express as px
def display_table(csv_path: str = 'benchmark_results.csv') -> pd.DataFrame:
    """Load the benchmark results CSV into a DataFrame.

    Args:
        csv_path: Location of the results file. Defaults to
            ``'benchmark_results.csv'``; a relative path is resolved
            against the current working directory.

    Returns:
        The file's contents exactly as parsed by ``pd.read_csv``.
    """
    return pd.read_csv(csv_path)
def create_bar_chart(csv_path='benchmark_results.csv', max_score=20):
    """Build a horizontal bar chart of each model's average score.

    The CSV must provide the columns ``model``, ``average_score``,
    ``armenian_language_score``, ``armenian_history_score`` and
    ``mathematics_score``; the three subject scores are shown on hover.

    Args:
        csv_path: Location of the results file. Defaults to
            ``'benchmark_results.csv'``.
        max_score: Upper bound applied to both the x-axis and the colour
            scale, so bar length and bar colour share one scale.
            Defaults to 20.

    Returns:
        The Plotly figure produced by ``px.bar`` with layout tweaks applied.
    """
    # Defined once so the axis range and the colour range cannot drift apart.
    score_range = [0, max_score]
    chart_title = 'Average Score per Model'

    df = pd.read_csv(csv_path)
    fig = px.bar(
        df,
        x='average_score',
        y='model',
        color='average_score',
        color_continuous_scale='tealrose',
        hover_data=[
            'armenian_language_score',
            'armenian_history_score',
            'mathematics_score',
        ],
        labels={'average_score': 'Average Score', 'model': 'Model'},
        title=chart_title,
        orientation='h',
        range_color=score_range,
    )
    fig.update_layout(
        xaxis=dict(range=score_range),
        title=dict(text=chart_title, font=dict(size=16)),
        xaxis_title=dict(font=dict(size=12)),
        yaxis_title=dict(font=dict(size=12)),
        # Plotly lists categories bottom-up by default; reversing the axis
        # puts the first CSV row at the top of the chart.
        yaxis=dict(autorange="reversed"),
        hoverlabel=dict(
            bgcolor="white",
            font_size=12,
            font_family="Arial",
            font_color="black",
        ),
    )
    return fig
# Assemble the leaderboard page: a heading, the results table, and the chart.
with gr.Blocks() as app:
    gr.Markdown("# ArmBench Leaderboard")
    # display_table is called here, so the table is given a DataFrame that
    # was read once while the page layout was being built.
    table_output = gr.DataFrame(display_table())
    # create_bar_chart is passed uncalled; Gradio invokes it itself to
    # obtain the figure.
    plot_output = gr.Plot(value=create_bar_chart)

# share=True asks Gradio to also expose the app through a public share link.
app.launch(share=True)