yahavb committed on Oct 17, 2024

Commit

959aa71

verified ·

1 Parent(s): 5f162b1

Upload folder using huggingface_hub

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

.gitattributes +10 -0
checkpoint/config.json +29 -0
checkpoint/generation_config.json +7 -0
checkpoint/pytorch_model.bin/key_to_filename.json +3 -0
checkpoint/pytorch_model.bin/p0.model.embed_tokens.weight +3 -0
checkpoint/pytorch_model.bin/p1.model.layers.0.self_attn.q_proj.weight +3 -0
checkpoint/pytorch_model.bin/p10.model.layers.1.self_attn.q_proj.weight +3 -0
checkpoint/pytorch_model.bin/p100.model.layers.11.self_attn.q_proj.weight +3 -0
checkpoint/pytorch_model.bin/p101.model.layers.11.self_attn.k_proj.weight +3 -0
checkpoint/pytorch_model.bin/p102.model.layers.11.self_attn.v_proj.weight +3 -0
checkpoint/pytorch_model.bin/p103.model.layers.11.self_attn.o_proj.weight +3 -0
checkpoint/pytorch_model.bin/p104.model.layers.11.mlp.gate_proj.weight +3 -0
checkpoint/pytorch_model.bin/p105.model.layers.11.mlp.up_proj.weight +3 -0
checkpoint/pytorch_model.bin/p106.model.layers.11.mlp.down_proj.weight +3 -0
checkpoint/pytorch_model.bin/p107.model.layers.11.input_layernorm.weight +3 -0
checkpoint/pytorch_model.bin/p108.model.layers.11.post_attention_layernorm.weight +3 -0
checkpoint/pytorch_model.bin/p109.model.layers.12.self_attn.q_proj.weight +3 -0
checkpoint/pytorch_model.bin/p11.model.layers.1.self_attn.k_proj.weight +3 -0
checkpoint/pytorch_model.bin/p110.model.layers.12.self_attn.k_proj.weight +3 -0
checkpoint/pytorch_model.bin/p111.model.layers.12.self_attn.v_proj.weight +3 -0
checkpoint/pytorch_model.bin/p112.model.layers.12.self_attn.o_proj.weight +3 -0
checkpoint/pytorch_model.bin/p113.model.layers.12.mlp.gate_proj.weight +3 -0
checkpoint/pytorch_model.bin/p114.model.layers.12.mlp.up_proj.weight +3 -0
checkpoint/pytorch_model.bin/p115.model.layers.12.mlp.down_proj.weight +3 -0
checkpoint/pytorch_model.bin/p116.model.layers.12.input_layernorm.weight +3 -0
checkpoint/pytorch_model.bin/p117.model.layers.12.post_attention_layernorm.weight +3 -0
checkpoint/pytorch_model.bin/p118.model.layers.13.self_attn.q_proj.weight +3 -0
checkpoint/pytorch_model.bin/p119.model.layers.13.self_attn.k_proj.weight +3 -0
checkpoint/pytorch_model.bin/p12.model.layers.1.self_attn.v_proj.weight +3 -0
checkpoint/pytorch_model.bin/p120.model.layers.13.self_attn.v_proj.weight +3 -0
checkpoint/pytorch_model.bin/p121.model.layers.13.self_attn.o_proj.weight +3 -0
checkpoint/pytorch_model.bin/p122.model.layers.13.mlp.gate_proj.weight +3 -0
checkpoint/pytorch_model.bin/p123.model.layers.13.mlp.up_proj.weight +3 -0
checkpoint/pytorch_model.bin/p124.model.layers.13.mlp.down_proj.weight +3 -0
checkpoint/pytorch_model.bin/p125.model.layers.13.input_layernorm.weight +3 -0
checkpoint/pytorch_model.bin/p126.model.layers.13.post_attention_layernorm.weight +3 -0
checkpoint/pytorch_model.bin/p127.model.layers.14.self_attn.q_proj.weight +3 -0
checkpoint/pytorch_model.bin/p128.model.layers.14.self_attn.k_proj.weight +3 -0
checkpoint/pytorch_model.bin/p129.model.layers.14.self_attn.v_proj.weight +3 -0
checkpoint/pytorch_model.bin/p13.model.layers.1.self_attn.o_proj.weight +3 -0
checkpoint/pytorch_model.bin/p130.model.layers.14.self_attn.o_proj.weight +3 -0
checkpoint/pytorch_model.bin/p131.model.layers.14.mlp.gate_proj.weight +3 -0
checkpoint/pytorch_model.bin/p132.model.layers.14.mlp.up_proj.weight +3 -0
checkpoint/pytorch_model.bin/p133.model.layers.14.mlp.down_proj.weight +3 -0
checkpoint/pytorch_model.bin/p134.model.layers.14.input_layernorm.weight +3 -0
checkpoint/pytorch_model.bin/p135.model.layers.14.post_attention_layernorm.weight +3 -0
checkpoint/pytorch_model.bin/p136.model.layers.15.self_attn.q_proj.weight +3 -0
checkpoint/pytorch_model.bin/p137.model.layers.15.self_attn.k_proj.weight +3 -0
checkpoint/pytorch_model.bin/p138.model.layers.15.self_attn.v_proj.weight +3 -0
checkpoint/pytorch_model.bin/p139.model.layers.15.self_attn.o_proj.weight +3 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,13 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+compiled/11574574e1a1f192d4a1.neff filter=lfs diff=lfs merge=lfs -text
+compiled/122746679d48e45b1766.neff filter=lfs diff=lfs merge=lfs -text
+compiled/2a7a2dab10b46a8e80e7.neff filter=lfs diff=lfs merge=lfs -text
+compiled/3281d3b8a26a3df86d05.neff filter=lfs diff=lfs merge=lfs -text
+compiled/37baec6c3020c2d4b379.neff filter=lfs diff=lfs merge=lfs -text
+compiled/49f48b453e5b11a0783f.neff filter=lfs diff=lfs merge=lfs -text
+compiled/9aae27aa51a7b54737a7.neff filter=lfs diff=lfs merge=lfs -text
+compiled/b69c1a2eba7a14d3045b.neff filter=lfs diff=lfs merge=lfs -text
+compiled/c5cb555d5a821ae6d5e2.neff filter=lfs diff=lfs merge=lfs -text
+compiled/c6c6edfd104bd0cba793.neff filter=lfs diff=lfs merge=lfs -text

checkpoint/config.json ADDED Viewed

	@@ -0,0 +1,29 @@

+{
+  "_name_or_path": "/home/ubuntu/optimum-neuron/docs/source/training_tutorials/dolly_llama",
+  "architectures": [
+    "LlamaForCausalLM"
+  ],
+  "attention_bias": false,
+  "attention_dropout": 0.0,
+  "bos_token_id": 128000,
+  "eos_token_id": 128001,
+  "hidden_act": "silu",
+  "hidden_size": 4096,
+  "initializer_range": 0.02,
+  "intermediate_size": 14336,
+  "layerdrop": 0,
+  "max_position_embeddings": 8192,
+  "model_type": "llama",
+  "num_attention_heads": 32,
+  "num_hidden_layers": 32,
+  "num_key_value_heads": 8,
+  "pretraining_tp": 1,
+  "rms_norm_eps": 1e-05,
+  "rope_scaling": null,
+  "rope_theta": 500000.0,
+  "tie_word_embeddings": false,
+  "torch_dtype": "bfloat16",
+  "transformers_version": "4.36.2",
+  "use_cache": false,
+  "vocab_size": 128256
+}

checkpoint/generation_config.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "_from_model_config": true,
+  "bos_token_id": 128000,
+  "eos_token_id": 128001,
+  "transformers_version": "4.36.2",
+  "use_cache": false
+}

checkpoint/pytorch_model.bin/key_to_filename.json ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:825d20f4a18183eff3963e805edd13ef7eb35b0aff7a850e8153ca1eeeb37970
+size 26397

checkpoint/pytorch_model.bin/p0.model.embed_tokens.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:14eb6e8aed29226e92ccb4b76feb4208053e9cd6bf6fffc92ff28684a2b02c26
+size 1050673941

checkpoint/pytorch_model.bin/p1.model.layers.0.self_attn.q_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4a9c323179784bd0be4dcfae827bcde624a84b0df80cc6687ee81b5934590f5e
+size 33555324

checkpoint/pytorch_model.bin/p10.model.layers.1.self_attn.q_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:149a16be6906da65838685beed20bfb59a8e098938c59007d78a7a4b62f7aca8
+size 33555327

checkpoint/pytorch_model.bin/p100.model.layers.11.self_attn.q_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e2cd3cccba855c0d498f8a9d0e4061b400b22493890e30c318552a9d4be81e7c
+size 33555397

checkpoint/pytorch_model.bin/p101.model.layers.11.self_attn.k_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5d5d18171e38abf4bb84c673baf1d40374f5432022372b16fa3335ea4e93341d
+size 8389573

checkpoint/pytorch_model.bin/p102.model.layers.11.self_attn.v_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fe99c31adcd6e0915ac94f5149e57d888a2631341e5e9d230ed8cff771f5645d
+size 8389573

checkpoint/pytorch_model.bin/p103.model.layers.11.self_attn.o_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e6d5f4c7a23091deb7ba7605201c2f6e4b7af6a8c0d3d674ca27d7da64295d85
+size 33555397

checkpoint/pytorch_model.bin/p104.model.layers.11.mlp.gate_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1e34c19d2262228b9fa507eacea013eba25ba28ac79888cbdf42980e132544a8
+size 117441404

checkpoint/pytorch_model.bin/p105.model.layers.11.mlp.up_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8f938840f20133faacf57aaf19cd34b80e763fb9e6df98147b945be2a890fe7e
+size 117441398

checkpoint/pytorch_model.bin/p106.model.layers.11.mlp.down_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d354ae6188721075022e072aec5eb5ca8dc0cfef6dc09bac64c507f2b21bbef7
+size 117441404

checkpoint/pytorch_model.bin/p107.model.layers.11.input_layernorm.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:eb60c54f1105cb992d494d8a2008fef2d4dd3106298941a5807340536e8267ed
+size 9090

checkpoint/pytorch_model.bin/p108.model.layers.11.post_attention_layernorm.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b726af842bb95a95de57e5d833e42b16bd4000c326dfb3c376c2a3bbeeea4f9b
+size 9181

checkpoint/pytorch_model.bin/p109.model.layers.12.self_attn.q_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d7c69e969caa1786c0bf9e06b22bf2b12c50581d7f6f45e0750fe7adedf338d2
+size 33555397

checkpoint/pytorch_model.bin/p11.model.layers.1.self_attn.k_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:baa12e3f6f26a4f835ff86822e4d71ba789feb365cdaf9d628e1464ae30b2caf
+size 8389503

checkpoint/pytorch_model.bin/p110.model.layers.12.self_attn.k_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:29888a871fba92966b857698c2ac1e2cd3c109a8cb08b02ceff9d2ec09c3c46b
+size 8389573

checkpoint/pytorch_model.bin/p111.model.layers.12.self_attn.v_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9642389b894d6e31a40ba139fdf23294d4df71f669c243a91f80afbf00f6f353
+size 8389573

checkpoint/pytorch_model.bin/p112.model.layers.12.self_attn.o_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9bcfd65e9a1f171c63a6cf231dfdfb37cea8b4a7cac736925ba36477cd491972
+size 33555397

checkpoint/pytorch_model.bin/p113.model.layers.12.mlp.gate_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9257ac41d1bddb65f36d180edf843fde710840aae203ce8e0a24771418419733
+size 117441404

checkpoint/pytorch_model.bin/p114.model.layers.12.mlp.up_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ce9fd90e4dac0457f7fc2e05966c34f4c092c7f9cc923bb4a530d1d46ef791d9
+size 117441398

checkpoint/pytorch_model.bin/p115.model.layers.12.mlp.down_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fdb9217c68c5e69d152707f70e031e9491a50ff89b85d71fd98b1cf64b186920
+size 117441404

checkpoint/pytorch_model.bin/p116.model.layers.12.input_layernorm.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:77f67562c3419ed84d26b916345674b6aacb7a527bcdd3b839d0c2881bf4dfb1
+size 9090

checkpoint/pytorch_model.bin/p117.model.layers.12.post_attention_layernorm.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:60e47e514376deee0af7a57f0657fcd83fda9bb2ac8c931fd47b641fd893f998
+size 9181

checkpoint/pytorch_model.bin/p118.model.layers.13.self_attn.q_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:49ec92d99563e5ed63e8a01048a9efaca19b3171300a0df56396edce3f2310c3
+size 33555397

checkpoint/pytorch_model.bin/p119.model.layers.13.self_attn.k_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7bbc7fb4feb3625d4825775c3e945bf2755b57d725b7a700f1fcd70da0e001c2
+size 8389573

checkpoint/pytorch_model.bin/p12.model.layers.1.self_attn.v_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3935dd2eba933c2284a674b331812b9fbbd52a95f6f99f0b9f501640b0b52452
+size 8389503

checkpoint/pytorch_model.bin/p120.model.layers.13.self_attn.v_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7fc887de70d50ed610c9e7c8e63b4303327f9d46478d32dd28b948b793d92acd
+size 8389573

checkpoint/pytorch_model.bin/p121.model.layers.13.self_attn.o_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:93cc174827edbb49d8c54452634ae70a973548283d248f454c5dec9c62e30ab8
+size 33555397

checkpoint/pytorch_model.bin/p122.model.layers.13.mlp.gate_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d6f3e9b664572902c7993427adc7df18e6c254d18d2f756dd4938c982b378867
+size 117441404

checkpoint/pytorch_model.bin/p123.model.layers.13.mlp.up_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1599ff1fa5ba84760976df4a91f69076d30626407a46f83b641f891363072208
+size 117441398

checkpoint/pytorch_model.bin/p124.model.layers.13.mlp.down_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5fc71fe64af1fd1732dbcc55ecc7ad06c0e85a2821960dad61307f5d2fa249e7
+size 117441404

checkpoint/pytorch_model.bin/p125.model.layers.13.input_layernorm.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7d483caf70adcd9c403585990cd2bb05170addde38bbea334b356cd5fd5d5fcf
+size 9090

checkpoint/pytorch_model.bin/p126.model.layers.13.post_attention_layernorm.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7b0756466c655e299da2f33612ba13b0acf714f4ad1569e2822829bf5812d9e2
+size 9181

checkpoint/pytorch_model.bin/p127.model.layers.14.self_attn.q_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8d4367b1259e0067574b42ed53cd8fe919bb3c623c7e13e3ed834e01df90209c
+size 33555397

checkpoint/pytorch_model.bin/p128.model.layers.14.self_attn.k_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:58d86a7be7846a3b6b9d9e8054f04001fd30d047213f5d040e44f51474694cae
+size 8389573

checkpoint/pytorch_model.bin/p129.model.layers.14.self_attn.v_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:765c8982cd3752e2a8b1a4195a30d886513e79ba4d16c4edf0a59f2a1334c4ed
+size 8389573

checkpoint/pytorch_model.bin/p13.model.layers.1.self_attn.o_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7ab80039bad67ce6478471bb9ee3cce1306ccec613baec2cc7f6feb9fa3ea5fc
+size 33555327

checkpoint/pytorch_model.bin/p130.model.layers.14.self_attn.o_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2ab6ba8b511b3749ffd8d05dc1902e53564e7340e94803e97ac666fa1c18c0d2
+size 33555397

checkpoint/pytorch_model.bin/p131.model.layers.14.mlp.gate_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cf44fef885c940175d5c89af77a33024a7dc11e1c0b4c718dfbfc623aa5d6cdc
+size 117441404

checkpoint/pytorch_model.bin/p132.model.layers.14.mlp.up_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:81384a1105e9eb43efc285591a36bf074eb7512a5b94fe1ef4293f7c0203676a
+size 117441398

checkpoint/pytorch_model.bin/p133.model.layers.14.mlp.down_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:35015a0b14c55b47c9bfc8e4c2189ca8ec650e077d1f9fa3f128c06614d61c64
+size 117441404

checkpoint/pytorch_model.bin/p134.model.layers.14.input_layernorm.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a875a19e23a9339b41e9b2104fb2be56c00fd8158a994743dad0d6c3e1bde988
+size 9090

checkpoint/pytorch_model.bin/p135.model.layers.14.post_attention_layernorm.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:da471e20e6a10a7138126c436e52c7f42c78b1c1b15003e1c972d37c082630ce
+size 9181

checkpoint/pytorch_model.bin/p136.model.layers.15.self_attn.q_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f24fff5469db1b80e994cbdf300ac26723846d8a026bfc6affededb35af7390d
+size 33555397

checkpoint/pytorch_model.bin/p137.model.layers.15.self_attn.k_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5ec3840b966b4432b8385432e24f2348e36b00cd70088bcdc69d450712af43dc
+size 8389573

checkpoint/pytorch_model.bin/p138.model.layers.15.self_attn.v_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e429ec30ea013c37054c415a50b1dddaa033d43bcacc715ed71b121e10c5da7b
+size 8389573

checkpoint/pytorch_model.bin/p139.model.layers.15.self_attn.o_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:07bed933b246f616153dee54219c0677706a770105dd610df48629605c6eb5d5
+size 33555397