SaylorTwift HF Staff committed on
Commit
bd4420e
·
verified ·
1 Parent(s): 298e15b

Upload folder using huggingface_hub

Browse files
logs/2026-03-27T13-43-21-00-00_gpqa-diamond_8nPDKERxKwnvmMmwAQYqcE.eval ADDED
Binary file (89.1 kB). View file
 
logs/listing.json CHANGED
@@ -1,19 +1,19 @@
1
  {
2
- "2026-03-26T16-01-28-00-00_gpqa-diamond_DpKPo39Uh2hEuHAmtatWQB.eval": {
3
- "eval_id": "ioNuAtSUnf7QajutLVEGRH",
4
- "run_id": "5mmFN44EXWTxxAqXr9DQY6",
5
  "task": "inspect_evals/gpqa_diamond",
6
- "task_id": "DpKPo39Uh2hEuHAmtatWQB",
7
  "task_version": 2,
8
  "version": 2,
9
  "status": "success",
10
  "invalidated": false,
11
- "model": "openai-api/transformers-serve/Qwen/Qwen3.5-0.8B",
12
- "started_at": "2026-03-26T16:01:28+00:00",
13
- "completed_at": "2026-03-26T16:21:43+00:00",
14
  "primary_metric": {
15
  "name": "accuracy",
16
- "value": 0.2,
17
  "params": {}
18
  }
19
  }
 
1
  {
2
+ "2026-03-27T13-43-21-00-00_gpqa-diamond_8nPDKERxKwnvmMmwAQYqcE.eval": {
3
+ "eval_id": "EcgN3XD8WfHkQaGqu279Hv",
4
+ "run_id": "muqihDJ8QzMbrCDHx2Uyiq",
5
  "task": "inspect_evals/gpqa_diamond",
6
+ "task_id": "8nPDKERxKwnvmMmwAQYqcE",
7
  "task_version": 2,
8
  "version": 2,
9
  "status": "success",
10
  "invalidated": false,
11
+ "model": "openai-api/transformers-serve/meta-llama/Llama-3.1-8B-Instruct",
12
+ "started_at": "2026-03-27T13:43:21+00:00",
13
+ "completed_at": "2026-03-27T14:03:37+00:00",
14
  "primary_metric": {
15
  "name": "accuracy",
16
+ "value": 0.15,
17
  "params": {}
18
  }
19
  }