File size: 1,150 Bytes
cc1cd06
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
{
  "format_version": 1,
  "name": "Gemma4 MTPLX Optimized Speed",
  "variant": "speed",
  "layout": {
    "target": "target",
    "assistant": "assistant"
  },
  "source": {
    "target_repo": "google/gemma-4-31B-it",
    "target_revision": "145dc2508c480a64b47242f160d286cff94a2343",
    "assistant_repo": "google/gemma-4-31B-it-assistant",
    "assistant_revision": "cffbbd2cea41ea56a0fa5b0487e0d445121fd204"
  },
  "target": {
    "role": "verifier",
    "model_type": "gemma4",
    "quantization": {
      "bits": 4,
      "group_size": 64,
      "mode": "affine"
    }
  },
  "assistant": {
    "role": "drafter",
    "model_type": "gemma4_assistant",
    "quantization": {
      "bits": 6,
      "group_size": 64,
      "mode": "affine"
    }
  },
  "benchmark": {
    "prompt_suite": "flappy",
    "max_tokens": 1000,
    "temperature": 1.0,
    "top_p": 0.95,
    "top_k": 64,
    "seed": 0,
    "best_block_size": 6,
    "acceptance": {
      "accepted": 830,
      "drafted": 846,
      "ratio": 0.9810874704491725
    },
    "observed_mtp_tok_s": [
      43.558797060869416,
      44.457398919489286,
      44.071735166669846
    ]
  }
}