Spaces:
Running
Running
Update src/streamlit_app.py
Browse files- src/streamlit_app.py +20 -2
src/streamlit_app.py
CHANGED
@@ -66,7 +66,7 @@ score_cols = [f"T{i}" for i in range(1, 12)] + ["Avg"]
|
|
66 |
max_ranks = {col: df[f"{col}_rank"].max() for col in score_cols}
|
67 |
|
68 |
# βββ Tabs ββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββ
|
69 |
-
tab1, tab2, tab3 = st.tabs(["πLeaderboard", "πBenchmark Details", "π€Submit Your Model"])
|
70 |
|
71 |
with tab1:
|
72 |
# st.markdown("**Leaderboard:** higher scores shaded green; best models bolded.")
|
@@ -129,7 +129,7 @@ with tab2:
|
|
129 |
)
|
130 |
|
131 |
with tab3:
|
132 |
-
st.markdown('## π€ Submit
|
133 |
st.write(
|
134 |
"""
|
135 |
We provide both public and private subsets of the dataset.
|
@@ -141,3 +141,21 @@ with tab3:
|
|
141 |
π You can submit your model through the following link: [https://forms.gle/mWa6joCfgQnwXsxeA](https://forms.gle/mWa6joCfgQnwXsxeA)
|
142 |
"""
|
143 |
)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
66 |
max_ranks = {col: df[f"{col}_rank"].max() for col in score_cols}
|
67 |
|
68 |
# βββ Tabs ββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββ
|
69 |
+
tab1, tab2, tab3, tab4 = st.tabs(["π Leaderboard", "π Benchmark Details", "π€ Submit Your Model", "π§© Community Contributions Welcome"])
|
70 |
|
71 |
with tab1:
|
72 |
# st.markdown("**Leaderboard:** higher scores shaded green; best models bolded.")
|
|
|
129 |
)
|
130 |
|
131 |
with tab3:
|
132 |
+
st.markdown('## π€ Submit Your Model')
|
133 |
st.write(
|
134 |
"""
|
135 |
We provide both public and private subsets of the dataset.
|
|
|
141 |
π You can submit your model through the following link: [https://forms.gle/mWa6joCfgQnwXsxeA](https://forms.gle/mWa6joCfgQnwXsxeA)
|
142 |
"""
|
143 |
)
|
144 |
+
|
145 |
+
with tab4:
|
146 |
+
st.markdown('## 📢 We Welcome Contributions from the Community')
|
147 |
+
st.write(
|
148 |
+
"""
|
149 |
+
We actively encourage contributions from the research community — including:
|
150 |
+
|
151 |
+
- ✅ Proposing new tasks and contributing data
|
152 |
+
- π Suggesting improvements to existing ones
|
153 |
+
- π§ Sharing domain-specific insights βοΈπ§ͺπ₯π
|
154 |
+
|
155 |
+
Your input is invaluable in making ExpertLongBench more representative and impactful across expert domains.
|
156 |
+
|
157 |
+
If you're interested in contributing or collaborating, feel free to reach out to us: Jie Ruan (jieruan@umich.edu), Inderjeet Nair (inair@umich.edu), Shuyang Cao (caoshuy@umich.edu), Lu Wang (wangluxy@umich.edu).
|
158 |
+
|
159 |
+
Let’s build better evaluations for expert-level AI — together ππ€
|
160 |
+
"""
|
161 |
+
)
|