Add files using upload-large-folder tool
Browse files- Llama-3.2-3B-Instruct/.ipynb_checkpoints/config-checkpoint.json +39 -0
- output/state_0/model.safetensors +1 -1
- output/state_0/optimizer.bin +1 -1
- output/state_0/scheduler.bin +1 -1
- output/state_1/model.safetensors +1 -1
- output/state_1/optimizer.bin +1 -1
- output/state_1/scheduler.bin +1 -1
- output/state_10/model.safetensors +1 -1
- output/state_10/optimizer.bin +1 -1
- output/state_10/scheduler.bin +1 -1
- output/state_2/model.safetensors +1 -1
- output/state_2/optimizer.bin +1 -1
- output/state_2/scheduler.bin +1 -1
- output/state_3/model.safetensors +1 -1
- output/state_3/optimizer.bin +1 -1
- output/state_3/scheduler.bin +1 -1
- output/state_5/model.safetensors +1 -1
- output/state_5/optimizer.bin +1 -1
- output/state_5/scheduler.bin +1 -1
- output/state_6/model.safetensors +1 -1
- output/state_6/optimizer.bin +1 -1
- output/state_6/scheduler.bin +1 -1
- output/state_7/model.safetensors +1 -1
- output/state_7/optimizer.bin +1 -1
- output/state_7/scheduler.bin +1 -1
- output/state_8/model.safetensors +1 -1
- output/state_8/optimizer.bin +1 -1
- output/state_8/scheduler.bin +1 -1
Llama-3.2-3B-Instruct/.ipynb_checkpoints/config-checkpoint.json
ADDED
|
@@ -0,0 +1,39 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"architectures": [
|
| 3 |
+
"LlamaForCausalLM"
|
| 4 |
+
],
|
| 5 |
+
"attention_bias": false,
|
| 6 |
+
"attention_dropout": 0.0,
|
| 7 |
+
"bos_token_id": 128000,
|
| 8 |
+
"eos_token_id": [
|
| 9 |
+
128001,
|
| 10 |
+
128008,
|
| 11 |
+
128009
|
| 12 |
+
],
|
| 13 |
+
"head_dim": 128,
|
| 14 |
+
"hidden_act": "silu",
|
| 15 |
+
"hidden_size": 3072,
|
| 16 |
+
"initializer_range": 0.02,
|
| 17 |
+
"intermediate_size": 8192,
|
| 18 |
+
"max_position_embeddings": 131072,
|
| 19 |
+
"mlp_bias": false,
|
| 20 |
+
"model_type": "llama",
|
| 21 |
+
"num_attention_heads": 24,
|
| 22 |
+
"num_hidden_layers": 28,
|
| 23 |
+
"num_key_value_heads": 8,
|
| 24 |
+
"pretraining_tp": 1,
|
| 25 |
+
"rms_norm_eps": 1e-05,
|
| 26 |
+
"rope_scaling": {
|
| 27 |
+
"factor": 32.0,
|
| 28 |
+
"high_freq_factor": 4.0,
|
| 29 |
+
"low_freq_factor": 1.0,
|
| 30 |
+
"original_max_position_embeddings": 8192,
|
| 31 |
+
"rope_type": "llama3"
|
| 32 |
+
},
|
| 33 |
+
"rope_theta": 500000.0,
|
| 34 |
+
"tie_word_embeddings": true,
|
| 35 |
+
"torch_dtype": "bfloat16",
|
| 36 |
+
"transformers_version": "4.45.0.dev0",
|
| 37 |
+
"use_cache": true,
|
| 38 |
+
"vocab_size": 128256
|
| 39 |
+
}
|
output/state_0/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2054186136
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c201d140806abd6234e5b42ae4ba44d2ea1fb016ca71c8f8b252f99a9454a481
|
| 3 |
size 2054186136
|
output/state_0/optimizer.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 956359825
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0ba6dc42b81e22903fa0487a82aa78c4918ac54019deeedb8306a9c06ca0d629
|
| 3 |
size 956359825
|
output/state_0/scheduler.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1401
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1f27e259c38912c76b5f52f93444c1e26a550d5be21d3b2a2d50dc7abcd44864
|
| 3 |
size 1401
|
output/state_1/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2054186136
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6bf66bb5bcdab9cc877e1059af4bfb6cda4e23cc9612a98cb7352972eb10cefb
|
| 3 |
size 2054186136
|
output/state_1/optimizer.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 956359825
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:76bd0d4b83e1fb7d825750c9304176020ee29116e5564db8e57914a247992533
|
| 3 |
size 956359825
|
output/state_1/scheduler.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1401
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:66ad4ea5da2bfb70f060b16b681b79bc6ac4f6a8e560a112dd28ee1f67c8fdf4
|
| 3 |
size 1401
|
output/state_10/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2054186136
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e61c4c8d8fb54b0e3145417941186aab8dea93941d530b56978f66d787a5ef4b
|
| 3 |
size 2054186136
|
output/state_10/optimizer.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 956359825
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8f41b7a496665ffc049db3cb28a65e8e2ee64d6165d79ae47518987416689fc2
|
| 3 |
size 956359825
|
output/state_10/scheduler.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1401
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5ed71f4e134f40f16228fdbd072bebd40061dd69f90052088cc1dcd9f11561b2
|
| 3 |
size 1401
|
output/state_2/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2054186136
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:09b7d0b74625bb27057e564e6dc3fde6413c4d5d81fadca8ef69676186c35c90
|
| 3 |
size 2054186136
|
output/state_2/optimizer.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 956359825
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:87d7ff6e2dbceef2378419c97b103b4815b8ccb8fd562c44e66ab860fe43d04b
|
| 3 |
size 956359825
|
output/state_2/scheduler.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1401
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:78e0d3f1231e3e44aee6e95f99ecba9de266678ad018e6d0e6feb29089b4f6d9
|
| 3 |
size 1401
|
output/state_3/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2054186136
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:58592517f5166be8200128966436a3c928ab76ce78307e6b125610649ccc6138
|
| 3 |
size 2054186136
|
output/state_3/optimizer.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 956359825
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e0e777320353270186872747ce3bba396c6a924778e53b9faaa327632b44a710
|
| 3 |
size 956359825
|
output/state_3/scheduler.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1401
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cee1cea88cc157ab22c432313eb868c69fe0787f9bd62eb0c2c077300b853e80
|
| 3 |
size 1401
|
output/state_5/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2054186136
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3e674f7c203cb676613d85bfefd5755cc6177918dae8cd2c70c9046d3a871b7e
|
| 3 |
size 2054186136
|
output/state_5/optimizer.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 956359825
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:013b7eee12b42e48e5798731b17b270bc41f0487338d5f58a49e10224e958207
|
| 3 |
size 956359825
|
output/state_5/scheduler.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1401
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0f5bdeb75c594be6b54ef4b44ca9a1e873bab81f6e5ee392bf4665d046347ca8
|
| 3 |
size 1401
|
output/state_6/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2054186136
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b020e0ade6892957716bb48a7ac026f8e28de4f33a4b6cf86b4ead354b3e905f
|
| 3 |
size 2054186136
|
output/state_6/optimizer.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 956359825
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6120cec174f5e40aeef4b976d0e38187e84c591c7d8b9c050ad3de7f20c1d9c6
|
| 3 |
size 956359825
|
output/state_6/scheduler.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1401
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d10e8d03a05068c620de50e3e085bbde9fcaace576dd2c1fa2bacb98e43dbf3c
|
| 3 |
size 1401
|
output/state_7/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2054186136
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f59e427e589ea3f3edf4fb1d67d9bff6750d3c74f6a40ba630f28d1ecbd9a0ea
|
| 3 |
size 2054186136
|
output/state_7/optimizer.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 956359825
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ed61de61e09a323bdf1bcb8f04ea94d6cff9c3fb5363b1a38c5813dfd5fc7196
|
| 3 |
size 956359825
|
output/state_7/scheduler.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1401
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:363b5fe9cf24ae86f33e9240afc77379de53cdf590142246591a5e04e77c3425
|
| 3 |
size 1401
|
output/state_8/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2054186136
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:68c109f8be326e87bb78184087a4d8d2f4d0df5cd20d6abf16eef7db60f8101e
|
| 3 |
size 2054186136
|
output/state_8/optimizer.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 956359825
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:381564bed5b8b5458dc63ddd06d3f09ed2ae3307fbfb1f375bc787f05261c443
|
| 3 |
size 956359825
|
output/state_8/scheduler.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1401
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fa8349faf395cb3d5dd5b3d0537340384f6d4a9ae414163d23fa7be6bf32ef6a
|
| 3 |
size 1401
|