HoneyTian committed on
Commit
97eebc6
·
1 Parent(s): 33d6ee9
.gitignore CHANGED
@@ -3,6 +3,7 @@
3
  .idea/
4
 
5
  #/data/
 
6
  #/data/eval_data
7
  /data/raw_dataset
8
  /dotenv/
 
3
  .idea/
4
 
5
  #/data/
6
+ /data/comment
7
  #/data/eval_data
8
  /data/raw_dataset
9
  /dotenv/
data/eval_data/azure_openai/azure/gpt-4o/shenzhen_sase/west_us_chatgpt_openai_azure_com/20250723_170505/agent-lingoace-zh-80-chat.jsonl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a7ad13e353f4db5a95c5fa2c293324c7e526a5a09230c60ef48437056f9613b4
3
- size 228210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a1a8ef591a4d981abb0f04cabc68b7917dc6cb3ccc1e57befbfa9fc4b2c8a22
3
+ size 875834
data/eval_data/azure_openai/azure/gpt-4o/shenzhen_sase/west_us_chatgpt_openai_azure_com/20250723_170505/agent-lingoace-zh-80-chat.jsonl.raw CHANGED
The diff for this file is too large to render. See raw diff
 
examples/test_metrics/lingoace_chat_metric.py CHANGED
@@ -43,12 +43,12 @@ python3 azure_openai.py --model_name gpt-4o-mini \
43
  )
44
  parser.add_argument(
45
  "--eval_data_file",
46
- default=(project_path / "data/eval_data/siliconflow/siliconflow/deepseek-ai#DeepSeek-R1-Distill-Qwen-7B/shenzhen_sase/siliconflow_api_key/20250724_135543/agent-lingoace-zh-80-chat.jsonl.raw").as_posix(),
47
  type=str
48
  )
49
  parser.add_argument(
50
  "--output_file",
51
- default=(project_path / "data/eval_data/siliconflow/siliconflow/deepseek-ai#DeepSeek-R1-Distill-Qwen-7B/shenzhen_sase/siliconflow_api_key/20250724_135543/agent-lingoace-zh-80-chat.jsonl").as_posix(),
52
  type=str
53
  )
54
  parser.add_argument(
 
43
  )
44
  parser.add_argument(
45
  "--eval_data_file",
46
+ default=(project_path / "data/eval_data/azure_openai/azure/gpt-4o/shenzhen_sase/west_us_chatgpt_openai_azure_com/20250723_170505/agent-lingoace-zh-80-chat.jsonl.raw").as_posix(),
47
  type=str
48
  )
49
  parser.add_argument(
50
  "--output_file",
51
+ default=(project_path / "data/eval_data/azure_openai/azure/gpt-4o/shenzhen_sase/west_us_chatgpt_openai_azure_com/20250723_170505/agent-lingoace-zh-80-chat.jsonl").as_posix(),
52
  type=str
53
  )
54
  parser.add_argument(
llm_eval_script/azure_openai_chat.py CHANGED
@@ -72,7 +72,7 @@ python3 azure_openai.py --model_name gpt-4o-mini \
72
  )
73
  parser.add_argument(
74
  "--interval",
75
- default=0,
76
  type=int
77
  )
78
  args = parser.parse_args()
@@ -91,7 +91,7 @@ def main():
91
  tz = ZoneInfo("Asia/Shanghai")
92
  now = datetime.now(tz)
93
  create_time_str = now.strftime("%Y%m%d_%H%M%S")
94
- # create_time_str = "20250722_173400"
95
  else:
96
  create_time_str = args.create_time_str
97
 
 
72
  )
73
  parser.add_argument(
74
  "--interval",
75
+ default=5,
76
  type=int
77
  )
78
  args = parser.parse_args()
 
91
  tz = ZoneInfo("Asia/Shanghai")
92
  now = datetime.now(tz)
93
  create_time_str = now.strftime("%Y%m%d_%H%M%S")
94
+ create_time_str = "20250723_170505"
95
  else:
96
  create_time_str = args.create_time_str
97
 
main.py CHANGED
@@ -293,34 +293,11 @@ def main():
293
  board_button = gr.Button(value="View", variant="primary", visible=True)
294
  board_board = gr.DataFrame(value=llm_ranking_board, max_height=800, min_width=160, label="board", show_search="search")
295
 
296
- board_button.click(
297
- fn=when_click_board_button,
298
- inputs=[board_columns],
299
- outputs=[board_board],
300
- )
301
- with gr.TabItem("dataset"):
302
- dataset_name = gr.Textbox(label="name")
303
- dataset_desc = gr.Textbox(label="desc")
304
- dataset_filename = gr.Textbox(label="filename")
305
-
306
- gr.Examples(
307
- examples=dataset_examples_list,
308
- inputs=[dataset_name, dataset_desc, dataset_filename],
309
- outputs=None,
310
  )
311
- dataset_button = gr.Button(value="View", variant="primary", visible=True)
312
- dataset_df = gr.DataFrame(
313
- value=None, label="dataset", interactive=True,
314
- show_search="search",
315
- elem_id="dataset_df"
316
- )
317
- dataset_button.click(
318
- fn=when_click_view_dataset_button,
319
- inputs=[dataset_filename],
320
- outputs=[dataset_df],
321
- )
322
- _ = get_fs_tab()
323
- _ = get_shell_tab()
324
  with gr.TabItem("view_chat"):
325
  view_chat_company = gr.Textbox(label="company", visible=False)
326
  view_chat_model_name = gr.Textbox(label="model_name", visible=False)
@@ -334,7 +311,9 @@ def main():
334
  with gr.Row():
335
  view_chat_button = gr.Button(value="View", variant="primary", visible=True)
336
  view_chat_df = gr.DataFrame(
337
- value=None, label="dataset", interactive=True,
 
 
338
  show_search="search",
339
  elem_id="view_chat_df"
340
  )
@@ -343,6 +322,29 @@ def main():
343
  inputs=[view_chat_filename],
344
  outputs=[view_chat_df],
345
  )
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
346
 
347
  # http://127.0.0.1:7861/
348
  # http://10.75.27.247:7861/
 
293
  board_button = gr.Button(value="View", variant="primary", visible=True)
294
  board_board = gr.DataFrame(value=llm_ranking_board, max_height=800, min_width=160, label="board", show_search="search")
295
 
296
+ board_button.click(
297
+ fn=when_click_board_button,
298
+ inputs=[board_columns],
299
+ outputs=[board_board],
 
 
 
 
 
 
 
 
 
 
300
  )
 
 
 
 
 
 
 
 
 
 
 
 
 
301
  with gr.TabItem("view_chat"):
302
  view_chat_company = gr.Textbox(label="company", visible=False)
303
  view_chat_model_name = gr.Textbox(label="model_name", visible=False)
 
311
  with gr.Row():
312
  view_chat_button = gr.Button(value="View", variant="primary", visible=True)
313
  view_chat_df = gr.DataFrame(
314
+ value=None,
315
+ max_height = 1000, min_width = 160,
316
+ label="dataset", interactive=True,
317
  show_search="search",
318
  elem_id="view_chat_df"
319
  )
 
322
  inputs=[view_chat_filename],
323
  outputs=[view_chat_df],
324
  )
325
+ with gr.TabItem("dataset"):
326
+ dataset_name = gr.Textbox(label="name")
327
+ dataset_desc = gr.Textbox(label="desc")
328
+ dataset_filename = gr.Textbox(label="filename")
329
+
330
+ gr.Examples(
331
+ examples=dataset_examples_list,
332
+ inputs=[dataset_name, dataset_desc, dataset_filename],
333
+ outputs=None,
334
+ )
335
+ dataset_button = gr.Button(value="View", variant="primary", visible=True)
336
+ dataset_df = gr.DataFrame(
337
+ value=None, label="dataset", interactive=True,
338
+ show_search="search",
339
+ elem_id="dataset_df"
340
+ )
341
+ dataset_button.click(
342
+ fn=when_click_view_dataset_button,
343
+ inputs=[dataset_filename],
344
+ outputs=[dataset_df],
345
+ )
346
+ _ = get_fs_tab()
347
+ _ = get_shell_tab()
348
 
349
  # http://127.0.0.1:7861/
350
  # http://10.75.27.247:7861/