Alyafeai committed on
Commit
fbb9d41
·
1 Parent(s): a587249

mcq tasks

Browse files
__pycache__/app.cpython-313.pyc ADDED
Binary file (8.07 kB). View file
 
backend/__pycache__/__init__.cpython-313.pyc ADDED
Binary file (172 Bytes). View file
 
backend/__pycache__/config.cpython-313.pyc ADDED
Binary file (1.79 kB). View file
 
backend/__pycache__/data_loader.cpython-313.pyc ADDED
Binary file (6.86 kB). View file
 
backend/__pycache__/helpers.cpython-313.pyc ADDED
Binary file (4.07 kB). View file
 
backend/__pycache__/submission_handler.cpython-313.pyc ADDED
Binary file (20.6 kB). View file
 
backend/config.py CHANGED
@@ -1,29 +1,40 @@
1
- # backend/config.py
2
  import os
 
3
  from huggingface_hub import HfApi
4
 
5
- # Hugging Face dataset repos (PUBLIC)
6
- REQUESTS_REPO_ID = "qimma/leaderboard-requests"
7
- RESULTS_REPO_ID = "qimma/leaderboard-results"
 
 
8
 
9
- # Tasks definition (task_key, metric_key, display_name)
10
- TASKS = [
11
- ("arc", "acc_norm", "ARC"),
12
- ("mmlu", "acc", "MMLU"),
13
- ("hellaswag", "acc_norm", "HellaSwag"),
14
- ]
15
 
16
- MODEL_TYPE_TO_EMOJI = {
17
- "base": "🧱",
18
- "chat": "💬",
19
- "instruct": "🧠",
20
- }
21
 
22
- # Optional token (read-only)
23
- hf_api_token = os.getenv("HF_TOKEN")
 
 
 
 
 
 
 
 
 
 
 
 
24
 
25
- # SAFE: API always exists
26
- API = HfApi(token=hf_api_token) if hf_api_token else HfApi()
27
 
28
- # SAFE: always defined
29
- SLACK_WEBHOOK_URL = None
 
 
 
 
 
 
 
 
1
  import os
2
+ from typing import Dict, List, Tuple, Optional
3
  from huggingface_hub import HfApi
4
 
5
+ # --- 1. Repository & API Configuration ---
6
+ OWNER: str = "qimma"
7
+ REPO_ID: str = f"{OWNER}/Qimma-Leaderboard"
8
+ RESULTS_REPO_ID: str = f"{OWNER}/results_v3"
9
+ REQUESTS_REPO_ID: str = f"{OWNER}/requests_v3"
10
 
11
+ SLACK_WEBHOOK_URL = os.getenv("SLACK_WEBHOOK_URL", "")
 
 
 
 
 
12
 
13
+ hf_api_token: Optional[str] = os.getenv("HF_API_TOKEN")
14
+ API = HfApi(token=hf_api_token)
 
 
 
15
 
16
+ # --- 2. Task Definitions ---
17
+ # Format: (dataset_key, metric_field, display_name)
18
+ TASKS: List[Tuple[str, str, str]] = [
19
+ ("qimma-AraDiCE-Culture:_average|0", "acc:logprob_normalization=LogProbCharNorm(name='norm', ignore_first_space=False)", "AraDiCE-Culture"),
20
+ ("qimma-ArabicMMLU:_average|0", "acc:logprob_normalization=LogProbCharNorm(name='norm', ignore_first_space=False)", "ArabicMMLU"),
21
+ ("qimma-MedArabiQ:_average|0", "acc:logprob_normalization=LogProbCharNorm(name='norm', ignore_first_space=False)", "MedArabiQ"),
22
+ ("qimma-ArabCulture:_average|0", "acc:logprob_normalization=LogProbCharNorm(name='norm', ignore_first_space=False)", "ArabCulture"),
23
+ ("qimma-SyntheticQA:_average|0", "acc:logprob_normalization=LogProbCharNorm(name='norm', ignore_first_space=False)", "SyntheticQA"),
24
+ ("qimma-PALMX-2025|0", "acc:logprob_normalization=LogProbCharNorm(name='norm', ignore_first_space=False)", "PALMX"),
25
+ ("qimma-NativeQA|0", "acc:logprob_normalization=LogProbCharNorm(name='norm', ignore_first_space=False)", "NativeQA"),
26
+ ("qimma-NativeQA-RDP|0", "acc:logprob_normalization=LogProbCharNorm(name='norm', ignore_first_space=False)", "NativeQA-RDP"),
27
+ ("qimma-AraTrust|0", "acc:logprob_normalization=LogProbCharNorm(name='norm', ignore_first_space=False)", "AraTrust"),
28
+ ("qimma-MizanQA|0", "acc:logprob_normalization=LogProbCharNorm(name='norm', ignore_first_space=False)", "MizanQA"),
29
+ ]
30
 
31
+ # --- 3. Model Metadata ---
 
32
 
33
+ MODEL_TYPE_TO_EMOJI: Dict[str, str] = {
34
+ "🟢 : pretrained": "🟢",
35
+ "🟩 : continuously pretrained": "🟩",
36
+ "💬 : chat models (RLHF, DPO, IFT, ...)": "💬",
37
+ "🔶 : fine-tuned on domain-specific datasets": "🔶",
38
+ "🤝 : base merges and merges": "🤝",
39
+ "Missing": "?",
40
+ }
frontend/leaderboard.html CHANGED
@@ -746,7 +746,7 @@
746
  $('#modalLinkHF').href = `https://huggingface.co/${model["Model Name"]}`;
747
 
748
  const cleanName = model["Model Name"].replace(/\//g, '__');
749
- const datasetId = `OALL/details_${cleanName}_v2`;
750
  $('#modalLinkDetails').href = `https://huggingface.co/datasets/${datasetId}`;
751
 
752
  const chartContainer = $('#modalChart');
 
746
  $('#modalLinkHF').href = `https://huggingface.co/${model["Model Name"]}`;
747
 
748
  const cleanName = model["Model Name"].replace(/\//g, '__');
749
+ const datasetId = `OALL/details_${cleanName}`;
750
  $('#modalLinkDetails').href = `https://huggingface.co/datasets/${datasetId}`;
751
 
752
  const chartContainer = $('#modalChart');