Alyafeai committed on
Commit
b828f6c
·
1 Parent(s): 0da0ffb

adding new benchmarks

Browse files
Files changed (1) hide show
  1. backend/config.py +6 -0
backend/config.py CHANGED
@@ -30,6 +30,12 @@ TASKS: List[Tuple[str, str, str]] = [
30
  "MedArabiQ",
31
  ),
32
  ("qimma-ArablegalEval-QA|0", "BERTScore-F", "ArabLegalQA"),
 
 
 
 
 
 
33
  ]
34
 
35
  # --- 3. Model Metadata ---
 
30
  "MedArabiQ",
31
  ),
32
  ("qimma-ArablegalEval-QA|0", "BERTScore-F", "ArabLegalQA"),
33
+ ("acc:logprob_normalization=LogProbCharNorm(name='norm', ignore_first_space=False)", "qimma-GAT:_average|0", "GAT"),
34
+ ("acc:logprob_normalization=LogProbCharNorm(name='norm', ignore_first_space=False)", "qimma-MedAraBench:_average|0", "MedAraBench"),
35
+ ("humaneval_scores", "humaneval_plus", "HumanEval+"),
36
+ ("mbpp_scores", "mbpp_plus", "MBPP+"),
37
+ ("fann", "fann", "FANN"),
38
+ ("flop", "flop", "FLOP"),
39
  ]
40
 
41
  # --- 3. Model Metadata ---