File size: 2,538 Bytes
f284194
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
{
  "source": "cache/huggingface/hub/models--Qwen--Qwen3.6-27B/snapshots/6a9e13bd6fc8f0983b9b99948120bc37f49c13e9",
  "candidate": "outputs/qwen3.6-27b-alpha080-secondpass-n2-reg05-layercap15",
  "default_alpha": 0.895,
  "layer_alpha_rules": [],
  "key_alpha_rules": [
    {
      "pattern": "model\\.layers\\.(12|13|14|16)\\.linear_attn\\.(in_proj_a|in_proj_b|norm|conv1d|dt_bias|A_log).*",
      "alpha": 0.0
    },
    {
      "pattern": "model\\.layers\\.15\\.self_attn\\.(q_norm|k_norm)\\.weight",
      "alpha": 0.0
    },
    {
      "pattern": "model\\.layers\\.(12|13|14|15)\\.(input_layernorm|post_attention_layernorm)\\.weight",
      "alpha": 0.0
    },
    {
      "pattern": "model\\.layers\\.1\\.mlp\\.gate_proj\\.weight",
      "alpha": 0.0
    },
    {
      "pattern": "model\\.layers\\.(12|19)\\.mlp\\.up_proj\\.weight",
      "alpha": 0.0
    },
    {
      "pattern": "model\\.layers\\.(15|22)\\.mlp\\.gate_proj\\.weight",
      "alpha": 0.0
    },
    {
      "pattern": "model\\.layers\\.26\\.mlp\\.up_proj\\.weight",
      "alpha": 0.0
    },
    {
      "pattern": "model\\.layers\\.(9|16|27)\\.mlp\\.down_proj\\.weight",
      "alpha": 0.0
    }
  ],
  "formula": "source + alpha(key) * (candidate - source)",
  "source_key_prefix_translation": "model.* -> model.language_model.* when needed",
  "shards": [
    "model-00001-of-00028.safetensors",
    "model-00002-of-00028.safetensors",
    "model-00003-of-00028.safetensors",
    "model-00004-of-00028.safetensors",
    "model-00005-of-00028.safetensors",
    "model-00006-of-00028.safetensors",
    "model-00007-of-00028.safetensors",
    "model-00008-of-00028.safetensors",
    "model-00009-of-00028.safetensors",
    "model-00010-of-00028.safetensors",
    "model-00011-of-00028.safetensors",
    "model-00012-of-00028.safetensors",
    "model-00013-of-00028.safetensors",
    "model-00014-of-00028.safetensors",
    "model-00015-of-00028.safetensors",
    "model-00016-of-00028.safetensors",
    "model-00017-of-00028.safetensors",
    "model-00018-of-00028.safetensors",
    "model-00019-of-00028.safetensors",
    "model-00020-of-00028.safetensors",
    "model-00021-of-00028.safetensors",
    "model-00022-of-00028.safetensors",
    "model-00023-of-00028.safetensors",
    "model-00024-of-00028.safetensors",
    "model-00025-of-00028.safetensors",
    "model-00026-of-00028.safetensors",
    "model-00027-of-00028.safetensors",
    "model-00028-of-00028.safetensors"
  ],
  "unmatched_keys": [],
  "alpha_counts": {
    "0.895": 808,
    "0": 43
  }
}