Add files using upload-large-folder tool
Browse filesThis view is limited to 50 files because it contains too many changes. See raw diff
- 2b_l10/outputs_add_free/all/lang/1/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/100/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/105/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/111/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/115/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/118/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/12/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/124/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/126/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/129/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/133/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/134/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/136/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/14/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/143/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/145/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/149/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/15/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/150/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/152/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/153/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/154/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/157/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/161/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/163/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/164/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/168/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/17/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/175/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/178/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/179/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/18/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/181/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/189/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/191/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/192/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/198/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/203/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/209/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/21/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/210/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/220/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/222/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/223/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/226/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/233/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/234/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/235/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/236/config.json +12 -0
- 2b_l10/outputs_add_free/all/lang/237/config.json +12 -0
2b_l10/outputs_add_free/all/lang/1/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/100/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/105/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/111/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/115/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/118/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/12/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/124/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/126/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/129/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/133/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/134/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/136/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/14/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/143/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/145/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/149/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/15/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/150/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/152/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/153/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/154/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/157/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/161/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/163/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/164/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/168/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/17/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/175/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/178/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/179/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/18/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/181/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/189/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/191/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/192/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/198/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/203/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/209/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/21/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/210/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/220/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/222/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/223/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/226/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/233/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/234/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/235/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/236/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|
2b_l10/outputs_add_free/all/lang/237/config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"layer": 10,
|
| 4 |
+
"embed_dim": 2304,
|
| 5 |
+
"low_rank_dim": 1,
|
| 6 |
+
"target_module": "model.layers.10",
|
| 7 |
+
"intervention_type": "AdditionFreeIntervention",
|
| 8 |
+
"factor_init_scale": 2.0,
|
| 9 |
+
"vector_init_scale": 1.0,
|
| 10 |
+
"alpha": 0.0
|
| 11 |
+
}
|
| 12 |
+
]
|