Spaces:
Runtime error
Runtime error
Update app.py
Browse files
app.py
CHANGED
@@ -28,7 +28,12 @@ TABLE_INTRODUCTION = """The table below shows the performance of various models
|
|
28 |
"""
|
29 |
|
30 |
CITATION_BUTTON_LABEL = "If you find AutoEval-Video useful for your research and applications, please copy the following snippet to cite these results: "
|
31 |
-
CITATION_BUTTON_TEXT = """
|
|
|
|
|
|
|
|
|
|
|
32 |
style = """<style>
|
33 |
.dataframe-container {
|
34 |
overflow-x: auto;
|
@@ -37,6 +42,7 @@ style = """<style>
|
|
37 |
import gradio as gr
|
38 |
import pandas as pd
|
39 |
import json
|
|
|
40 |
import time
|
41 |
import random
|
42 |
from huggingface_hub import CommitScheduler, login
|
@@ -65,7 +71,7 @@ def prediction_analyse(prediction_content,questiontype_list):
|
|
65 |
|
66 |
results = {i: {"correct": 0, "total": 0} for i in questiontype_list}
|
67 |
|
68 |
-
for prediction in predictions:
|
69 |
# pdb.set_trace()
|
70 |
prediction = prediction.strip()
|
71 |
if not prediction:
|
|
|
28 |
"""
|
29 |
|
30 |
CITATION_BUTTON_LABEL = "If you find AutoEval-Video useful for your research and applications, please copy the following snippet to cite these results: "
|
31 |
+
CITATION_BUTTON_TEXT = """@article{chen2023autoevalvideo,
|
32 |
+
title={AutoEval-Video: An Automatic Benchmark for Assessing Large Vision Language Models in Open-Ended Video Question Answering},
|
33 |
+
author={Xiuyuan Chen and Yuan Lin and Yuchen Zhang and Weiran Huang},
|
34 |
+
year={2023},
|
35 |
+
journal={arXiv preprint arXiv:2311.14906}
|
36 |
+
}"""
|
37 |
style = """<style>
|
38 |
.dataframe-container {
|
39 |
overflow-x: auto;
|
|
|
42 |
import gradio as gr
|
43 |
import pandas as pd
|
44 |
import json
|
45 |
+
from tqdm import tqdm
|
46 |
import time
|
47 |
import random
|
48 |
from huggingface_hub import CommitScheduler, login
|
|
|
71 |
|
72 |
results = {i: {"correct": 0, "total": 0} for i in questiontype_list}
|
73 |
|
74 |
+
for prediction in tqdm(predictions):
|
75 |
# pdb.set_trace()
|
76 |
prediction = prediction.strip()
|
77 |
if not prediction:
|