from dataclasses import dataclass from enum import Enum @dataclass class EvalDimension: metric: str col_name: str # Select your tasks here # --------------------------------------------------- class EvalDimensions(Enum): d0 = EvalDimension("speed", "Speed (words/sec)") d1 = EvalDimension("contamination_score", "Contamination Score") d2 = EvalDimension("paraphrasing", "Paraphrasing") d3 = EvalDimension("sentiment analysis", "Sentiment Analysis") d4 = EvalDimension("coding", "Coding") d5 = EvalDimension("function calling", "Function Calling") d6 = EvalDimension("rag qa", "RAG QA") d7 = EvalDimension("reading comprehension", "Reading Comprehension") d8 = EvalDimension("entity extraction", "Entity Extraction") d9 = EvalDimension("summarization", "Summarization") d10 = EvalDimension("long context", "Long Context") d11 = EvalDimension("mmlu", "MMLU") d12 = EvalDimension("arabic language & grammar", "Arabic Language & Grammar") d13 = EvalDimension("general knowledge", "General Knowledge") d14 = EvalDimension("translation (incl dialects)", "Translation (incl Dialects)") d15 = EvalDimension("trust & safety","Trust & Safety") d16 = EvalDimension("writing (incl dialects)", "Writing (incl Dialects)") d17 = EvalDimension("dialect detection", "Dialect Detection") d18 = EvalDimension("reasoning & math", "Reasoning & Math") d19 = EvalDimension("diacritization", "Diacritization") d20 = EvalDimension("instruction following", "Instruction Following") d21 = EvalDimension("transliteration", "Transliteration") d22 = EvalDimension("structuring", "Structuring") d23 = EvalDimension("hallucination", "Hallucination") NUM_FEWSHOT = 0 # Change with your few shot # --------------------------------------------------- # Your leaderboard name TITLE = """