Spaces:
Running on CPU Upgrade
Running on CPU Upgrade
adding new benchmarks
Browse files- backend/config.py +6 -0
backend/config.py
CHANGED
|
@@ -30,6 +30,12 @@ TASKS: List[Tuple[str, str, str]] = [
|
|
| 30 |
"MedArabiQ",
|
| 31 |
),
|
| 32 |
("qimma-ArablegalEval-QA|0", "BERTScore-F", "ArabLegalQA"),
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 33 |
]
|
| 34 |
|
| 35 |
# --- 3. Model Metadata ---
|
|
|
|
| 30 |
"MedArabiQ",
|
| 31 |
),
|
| 32 |
("qimma-ArablegalEval-QA|0", "BERTScore-F", "ArabLegalQA"),
|
| 33 |
+
("acc:logprob_normalization=LogProbCharNorm(name='norm', ignore_first_space=False)", "qimma-GAT:_average|0", "GAT"),
|
| 34 |
+
("acc:logprob_normalization=LogProbCharNorm(name='norm', ignore_first_space=False)", "qimma-MedAraBench:_average|0", "MedAraBench"),
|
| 35 |
+
("humaneval_scores", "humaneval_plus", "HumanEval+"),
|
| 36 |
+
("mbpp_scores", "mbpp_plus", "MBPP+"),
|
| 37 |
+
("fann", "fann", "FANN"),
|
| 38 |
+
("flop", "flop", "FLOP"),
|
| 39 |
]
|
| 40 |
|
| 41 |
# --- 3. Model Metadata ---
|