File size: 454 Bytes
64eea7d
 
 
 
 
 
 
 
0ab7173
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
# Result entry for dataset SWE-bench/SWE-bench_Verified, task
# swe_bench_%_resolved, attributed to the swebench.com site.
- dataset:
    id: SWE-bench/SWE-bench_Verified
    # '%' is mid-scalar here, so the plain (unquoted) form is valid YAML.
    task_id: swe_bench_%_resolved
  # Parsed as a float; the trailing zero is not preserved by YAML loaders.
  # NOTE(review): presumably a percentage of resolved tasks - confirm.
  value: 72.80
  source:
    url: https://www.swebench.com/
    name: SWE-Bench official evaluation
    # NOTE(review): presumably the account that added this entry - confirm.
    user: nielsr
  notes: high reasoning, official

# Result entry for dataset SWE-bench/SWE-bench_Verified, task
# swe_bench_%_resolved, attributed to a model card URL rather than the
# benchmark site; per `notes` this is the number reported by Z.ai.
- dataset:
    id: SWE-bench/SWE-bench_Verified
    # '%' is mid-scalar here, so the plain (unquoted) form is valid YAML.
    task_id: swe_bench_%_resolved
  # NOTE(review): presumably a percentage of resolved tasks - confirm.
  value: 77.8
  source:
    url: https://huggingface.co/zai-org/GLM-5/
    name: Model card
    # NOTE(review): presumably the account that added this entry - confirm.
    user: nielsr
  notes: Z.ai reported number