Initial commit
Browse filesThis view is limited to 50 files because it contains too many changes. See raw diff
- dandy-serenity-43/hyperparameters.yaml +78 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_10235904.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_102395904.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_102395904_log_feature_sparsity.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_107515904.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_112635904.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_117755904.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_122875904.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_122875904_log_feature_sparsity.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_127995904.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_133115904.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_138235904.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_143355904.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_143355904_log_feature_sparsity.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_148475904.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_15355904.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_153595904.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_158715904.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_163835904.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_163835904_log_feature_sparsity.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_168955904.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_174075904.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_179195904.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_184315904.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_184315904_log_feature_sparsity.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_189435904.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_194555904.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_199675904.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_20475904.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_20475904_log_feature_sparsity.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_204795904.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_204795904_log_feature_sparsity.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_209915904.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_215035904.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_220155904.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_225275904.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_225275904_log_feature_sparsity.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_230395904.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_235515904.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_240635904.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_245755904.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_245755904_log_feature_sparsity.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_250875904.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_25595904.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_255995904.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_261115904.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_266235904.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_266235904_log_feature_sparsity.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_271355904.pt +3 -0
- dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_276475904.pt +3 -0
dandy-serenity-43/hyperparameters.yaml
ADDED
|
@@ -0,0 +1,78 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
activation_function: relu
|
| 2 |
+
adam_beta1: 0.9
|
| 3 |
+
adam_beta2: 0.999
|
| 4 |
+
b_dec_init_method: zeros
|
| 5 |
+
cached_activations_path: null
|
| 6 |
+
checkpoint_path: ../outputs/checkpoints
|
| 7 |
+
clip_grad_norm: false
|
| 8 |
+
context_size: 1024
|
| 9 |
+
custom_loss: null
|
| 10 |
+
d_in: 2048
|
| 11 |
+
d_out: null
|
| 12 |
+
dataset: Skylion007/openwebtext
|
| 13 |
+
dense_loss_coefficient: 0
|
| 14 |
+
device: cuda
|
| 15 |
+
different_output: false
|
| 16 |
+
dtype: float32
|
| 17 |
+
epsilon_l0_approx: 0.2
|
| 18 |
+
eval_frequency: 500
|
| 19 |
+
expansion_factor: 8
|
| 20 |
+
feature_reinit_scale: 0.2
|
| 21 |
+
feature_resampling_method: null
|
| 22 |
+
fine_tune_dataset: false
|
| 23 |
+
finetuning_steps: !!python/tuple
|
| 24 |
+
- 1000
|
| 25 |
+
flatten_activations_over_layer: false
|
| 26 |
+
flatten_activations_over_layer_output: false
|
| 27 |
+
from_pretrained_path: null
|
| 28 |
+
hook_point: blocks.7.hook_resid_pre
|
| 29 |
+
hook_point_head_index: null
|
| 30 |
+
hook_point_head_index_output: null
|
| 31 |
+
hook_point_layer: 7
|
| 32 |
+
hook_point_layer_output: null
|
| 33 |
+
hook_point_output: null
|
| 34 |
+
initial_decoder_norm: 0.1
|
| 35 |
+
initialise_encoder_to_decoder_transpose: false
|
| 36 |
+
is_dataset_tokenized: false
|
| 37 |
+
l0_coefficient: 7.0e-05
|
| 38 |
+
l0_warmup: false
|
| 39 |
+
l0_warmup_steps: 1000
|
| 40 |
+
l1_coefficient: 0
|
| 41 |
+
l1_warmup: false
|
| 42 |
+
l1_warmup_steps: 1000
|
| 43 |
+
log_to_wandb: true
|
| 44 |
+
loop_dataset: false
|
| 45 |
+
lr: 0.0004
|
| 46 |
+
lr_scheduler_name: constant
|
| 47 |
+
lr_warm_up_steps: 500
|
| 48 |
+
max_resample_step: 100000
|
| 49 |
+
max_sparsity_target: 1
|
| 50 |
+
min_sparsity_for_resample: 0
|
| 51 |
+
min_sparsity_target: 1.0e-05
|
| 52 |
+
model_name: gemma-2b-it
|
| 53 |
+
mse_loss_coefficient: 1
|
| 54 |
+
mse_loss_type: centered
|
| 55 |
+
multiple_runs: false
|
| 56 |
+
n_batches_in_store_buffer: 128
|
| 57 |
+
n_checkpoints: 160
|
| 58 |
+
n_running_sparsity: 300
|
| 59 |
+
n_starting_steps: null
|
| 60 |
+
normalise_initial_decoder_weights: false
|
| 61 |
+
normalise_w_dec: true
|
| 62 |
+
remove_bos_tokens: false
|
| 63 |
+
resample_batches: 128
|
| 64 |
+
resample_frequency: 25000
|
| 65 |
+
scale_input_norm: false
|
| 66 |
+
seed: 42
|
| 67 |
+
sparse_loss_coefficient: 1.0e-06
|
| 68 |
+
sparsity_log_frequency: 5000
|
| 69 |
+
store_batch_size: 2
|
| 70 |
+
subtract_b_dec_from_inputs: false
|
| 71 |
+
topk_amount: 10
|
| 72 |
+
total_training_steps: 200000
|
| 73 |
+
train_batch_size: 4096
|
| 74 |
+
use_cached_activations: false
|
| 75 |
+
use_gated_sparse_autoencoder: false
|
| 76 |
+
wandb_log_frequency: 10
|
| 77 |
+
wandb_project: test_gemma_2b
|
| 78 |
+
weight_l1_by_decoder_norms: false
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_10235904.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:be2fb7ba8817cb64c0c01a1e6371fa27d0cc12257e10c2fce9bab60cf3bdfe51
|
| 3 |
+
size 268514568
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_102395904.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:adeaf4107dc0564a61b3ff851365a3aa51304a9db6e2e6f137dc4eb71ca4c269
|
| 3 |
+
size 268514640
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_102395904_log_feature_sparsity.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:258c476be55eaa5e10d57f7c33774ed8d50926b20678c7c20a19ae4501dca264
|
| 3 |
+
size 67525
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_107515904.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:af2b1c2b6fcaa36b7e5587f461faa86e78821eadd3af2e130986c09330a4e2c1
|
| 3 |
+
size 268514640
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_112635904.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e9276926c0bcfc25b071570501136a7cae406630c29effe2f3480be34cd7effc
|
| 3 |
+
size 268514640
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_117755904.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fe983e5aa1864268329945c285eaacb3776775d623fbf2c635293f6de0fc4092
|
| 3 |
+
size 268514640
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_122875904.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3e60fe4aa43536ce512c57d26ef00ddc2790fdf3a98fc570ea8572e912c9dabb
|
| 3 |
+
size 268514640
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_122875904_log_feature_sparsity.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b7bd69dfa7646a119d250de2b7a335fb071f7fe179e846a39c5ee43a340bf470
|
| 3 |
+
size 67525
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_127995904.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5c96ba8ccded95d7e82709aba01c348c4addbada123952721f2866fb1e5fdac1
|
| 3 |
+
size 268514640
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_133115904.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7539b21e69dde3a6d9334a7dcffa5f4a78a9ce4527435dc24983a71f99305181
|
| 3 |
+
size 268514640
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_138235904.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b13f3eed0006a31f69aac2bed739b9ada4541a8b544df35ed56e23749e7e2f81
|
| 3 |
+
size 268514640
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_143355904.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b54afa5e5784198c7aaa59cca1007edb4aa88126a2e4b43d481812c527dee204
|
| 3 |
+
size 268514640
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_143355904_log_feature_sparsity.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:19e725d2efec88457b35b77173062d0863f95c8c77df385db988040e30055e1f
|
| 3 |
+
size 67525
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_148475904.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d256f1e54f2d851d6337b89f17b2fb14b007e0c247b1e5c2cf150b6a358dcc01
|
| 3 |
+
size 268514640
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_15355904.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f04dc86a9f54d86c5222270c77d6d65668e95b02c90774dc9beb62260d8d2bf1
|
| 3 |
+
size 268514568
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_153595904.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4d284f91e8c57c3fc1215948497e79598595eb450fd91c8a5c7b6f91a8d6cf88
|
| 3 |
+
size 268514640
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_158715904.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:16e4796cc164c218702b8e1d78b3f3f165d2cd102d1731d543b17c8847354428
|
| 3 |
+
size 268514640
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_163835904.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3276ec29f0ae72f05c00d416f4c343a422d399bd3400b6612f602cc348ec2aaa
|
| 3 |
+
size 268514640
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_163835904_log_feature_sparsity.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a6faa133ace9e98acfbc9a93c09d929a461bd22d97af82f1adbc79b25ac4041a
|
| 3 |
+
size 67525
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_168955904.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ae33f0b2ac056c6abe86495534e4109d8d06442642f8e93077f2aa845e11034b
|
| 3 |
+
size 268514640
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_174075904.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:85a7fde827b3585552ad053001cbe12b654e541a198ee1af231d4ac92767bcdb
|
| 3 |
+
size 268514640
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_179195904.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cfa12928d9fc34713c45594d0d9a1da71e1a8a6463163830880b6e29ebb811f2
|
| 3 |
+
size 268514640
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_184315904.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:81afed7c2796ec97523d6deb6a7ab5070e042c1ade5fb921f6648272960351d9
|
| 3 |
+
size 268514640
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_184315904_log_feature_sparsity.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fd70e938010bb37ed427a4f0d91190916dfc0328a46f58b26f24f29ed816b461
|
| 3 |
+
size 67525
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_189435904.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3dd1426a8091e6af0a06f9b921d97856bb559a83c43131810c459bea531f2252
|
| 3 |
+
size 268514640
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_194555904.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f9d72282202cc221804e5092aad89a2fa6137dd960d973c599990a5379741358
|
| 3 |
+
size 268514640
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_199675904.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:70f39f862126dba6826fc471b7dc4c3a022c62725d1151fe4f1ee0d7b9ab8e4b
|
| 3 |
+
size 268514640
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_20475904.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:59d0509c304de59128591118f0e45c06278ae930add5ded8379cf84551d4f741
|
| 3 |
+
size 268514568
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_20475904_log_feature_sparsity.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:efae3135fab2de47c65f545fead25c2edd250cbcaa5782669a212447c3fa0d63
|
| 3 |
+
size 67520
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_204795904.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ed3f880395d316bd1a57e6c4444768ca603b43299530047ceda6e5deea138cd6
|
| 3 |
+
size 268514640
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_204795904_log_feature_sparsity.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:087713398995dc3f236296a063413380858ff8d0977a3622eafe2e6fdbd20c9f
|
| 3 |
+
size 67525
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_209915904.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a65299f03fd6c22ab2b789cb71734540e62deab451b3866aa611f49cd9378b9b
|
| 3 |
+
size 268514640
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_215035904.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5329389a88bebc4c3c9ecd73c30733473b6b88add6da0c76a77c9eeb5ab8955a
|
| 3 |
+
size 268514640
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_220155904.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2fd295e0d0173f9b6dd00c303ae3aed645e8a5f0d2d5a588fa0466a8bc779e09
|
| 3 |
+
size 268514640
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_225275904.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8f6734c9ee10febbc59885b7004f5f990efd103a06017880cd86ee2168cb264e
|
| 3 |
+
size 268514640
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_225275904_log_feature_sparsity.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1c07af06d1a4161977da3287825db68c938780f35d295b5361b8b9ca1a96a5ed
|
| 3 |
+
size 67525
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_230395904.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5e634027ded361f1549ffa549e10048e0ca17235c1c24d2cb94059e4d7d578e1
|
| 3 |
+
size 268514640
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_235515904.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:43d4015443fed417215ad37f51f2cc454f885c39091b6d2519985754397d044c
|
| 3 |
+
size 268514640
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_240635904.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8a0e134d64ab4cde259faf3156f0bd452d3710174ae62758de5a1bfc9403fe62
|
| 3 |
+
size 268514640
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_245755904.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:df61c4c1f50e99025e97adaf0c95e7e4039cecb8333e93015dbf4595c7882777
|
| 3 |
+
size 268514640
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_245755904_log_feature_sparsity.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4c11200e05163efedb81895e80abd1a8de1cdde5e7f89b4fc0cec96d0b1e1118
|
| 3 |
+
size 67525
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_250875904.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:86bdf158c5edc33f907e470e8fb20e79c78d2256f878097f62a6ffb9228648e6
|
| 3 |
+
size 268514640
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_25595904.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:68d9d6ff34220d5fdbe61fc4d5c530855856d00a60d57f4d7a816a52e000fcf4
|
| 3 |
+
size 268514568
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_255995904.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0fa7330a164115b4e4c41c643cd82ed14984ab44c995f0c3063942ebed873752
|
| 3 |
+
size 268514640
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_261115904.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b869ba58d7b8d3b2d26d11c2489f7459d2067a913860d733f675932075498580
|
| 3 |
+
size 268514640
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_266235904.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:de2b42bc187cbfb210efa690422194ba06bc049f205bac3894200434fc262073
|
| 3 |
+
size 268514640
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_266235904_log_feature_sparsity.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:19f31329bd3f49c84d70ac10170a75d5b89e37bcf6c6d4aedeb0423b1929d3f0
|
| 3 |
+
size 67525
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_271355904.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5b1c73b4cb5eacdaf43050fd2055c8263047b966df31f23c65072290a03f645c
|
| 3 |
+
size 268514640
|
dandy-serenity-43/sparse_autoencoder_gemma-2b-it_blocks.7.hook_resid_pre_s16384_276475904.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:379cb4868692fbf8db6ef813d346affa7c46ff09717d4bf221c34e81a7879c4e
|
| 3 |
+
size 268514640
|