Add files using upload-large-folder tool
Browse files- checkpoint-500/global_step500/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- checkpoint-500/global_step500/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- checkpoint-500/global_step500/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- checkpoint-500/global_step500/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- checkpoint-500/global_step500/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt +3 -0
- checkpoint-500/global_step500/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt +3 -0
- checkpoint-500/global_step500/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt +3 -0
- checkpoint-500/global_step500/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt +3 -0
- checkpoint-500/model-00001-of-00004.safetensors +3 -0
- checkpoint-500/model-00002-of-00004.safetensors +3 -0
- checkpoint-500/model-00003-of-00004.safetensors +3 -0
- checkpoint-500/model-00004-of-00004.safetensors +3 -0
- checkpoint-735/global_step735/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- checkpoint-735/global_step735/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- checkpoint-735/global_step735/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- checkpoint-735/global_step735/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- checkpoint-735/global_step735/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt +3 -0
- checkpoint-735/global_step735/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt +3 -0
- checkpoint-735/global_step735/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt +3 -0
- checkpoint-735/global_step735/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt +3 -0
- checkpoint-735/global_step735/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
- checkpoint-735/global_step735/zero_pp_rank_1_mp_rank_00_model_states.pt +3 -0
- checkpoint-735/global_step735/zero_pp_rank_2_mp_rank_00_model_states.pt +3 -0
- checkpoint-735/global_step735/zero_pp_rank_3_mp_rank_00_model_states.pt +3 -0
- checkpoint-735/global_step735/zero_pp_rank_4_mp_rank_00_model_states.pt +3 -0
- checkpoint-735/global_step735/zero_pp_rank_5_mp_rank_00_model_states.pt +3 -0
- checkpoint-735/global_step735/zero_pp_rank_6_mp_rank_00_model_states.pt +3 -0
- checkpoint-735/global_step735/zero_pp_rank_7_mp_rank_00_model_states.pt +3 -0
- checkpoint-735/model-00001-of-00004.safetensors +3 -0
- checkpoint-735/model-00002-of-00004.safetensors +3 -0
- checkpoint-735/model-00003-of-00004.safetensors +3 -0
- checkpoint-735/model-00004-of-00004.safetensors +3 -0
- checkpoint-735/rng_state_0.pth +3 -0
- checkpoint-735/rng_state_2.pth +3 -0
- checkpoint-735/rng_state_3.pth +3 -0
- checkpoint-735/rng_state_4.pth +3 -0
- checkpoint-735/rng_state_5.pth +3 -0
- checkpoint-735/rng_state_7.pth +3 -0
- checkpoint-735/scheduler.pt +3 -0
- checkpoint-735/special_tokens_map.json +26 -0
- checkpoint-735/training_args.bin +3 -0
- model-00001-of-00004.safetensors +3 -0
- model-00002-of-00004.safetensors +3 -0
- model-00003-of-00004.safetensors +3 -0
- model-00004-of-00004.safetensors +3 -0
checkpoint-500/global_step500/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2c622ef6da1a1ef0dd33bb414988a3d408fbf94acc74dd018ea33922216d77af
|
3 |
+
size 12045397132
|
checkpoint-500/global_step500/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:31a1d213b4e9252018cbcd61e153a88b00cfa8f3a4093c6b54a6b0bdbbd36604
|
3 |
+
size 12045397132
|
checkpoint-500/global_step500/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:051b37633d4bc13e5a81d7f3125ded771a1209903ef68ad407656a3d76974eb3
|
3 |
+
size 12045397132
|
checkpoint-500/global_step500/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:20d65135bd943e0573cb038815e1d055597455eec4d33e06851959d1e54adde3
|
3 |
+
size 12045397132
|
checkpoint-500/global_step500/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3a46299c4d19b92b08b701b41f0645754210d0514f00e602c8dcb4a19455c0f9
|
3 |
+
size 12045397132
|
checkpoint-500/global_step500/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a47ebe5dd4a62c2f86f17187988f4e1e9bf8ef9dd631f1bf99992c982e5b97de
|
3 |
+
size 12045397132
|
checkpoint-500/global_step500/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bd3fd884e26f873bb707a807a40e3f6cfe2b0315e108eb7ef1b9701025127673
|
3 |
+
size 12045397132
|
checkpoint-500/global_step500/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d42e307113ce3baed312b61b101444253f6095d17c75129a1be4894c19d3afec
|
3 |
+
size 12045397132
|
checkpoint-500/model-00001-of-00004.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:72552f30555a294a8a2cf2fd3fb30b7781bbe4d7c18f50e17e92d9db094c4ec8
|
3 |
+
size 4976698672
|
checkpoint-500/model-00002-of-00004.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eed17f9035a7aa2928bf7f7f3c8806c742196864946c58f0ec2bfeaf2ccf5c09
|
3 |
+
size 4999802720
|
checkpoint-500/model-00003-of-00004.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:87cdf9fafde97f9771b0bd450c614605a082d728326f1be2f501e0b526478f99
|
3 |
+
size 4915916176
|
checkpoint-500/model-00004-of-00004.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:95a11834e1319f82641176d8e7f9eb1644bdfc75d53224f77f1dcd59373281ed
|
3 |
+
size 1168138808
|
checkpoint-735/global_step735/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:43f0faad49636b58f2fcd0837f9431f156dfb8f9de2bd5c3852753fb203727aa
|
3 |
+
size 12045397132
|
checkpoint-735/global_step735/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c8eb94e292e302e3be1b012f1232a2fba4141135e033a71b14d939a80ae0479a
|
3 |
+
size 12045397132
|
checkpoint-735/global_step735/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c7afde9a1469cd82d58e0ee70d3d969046bc2c3c6f1b4c5fcbc55bcc97d5c4c1
|
3 |
+
size 12045397132
|
checkpoint-735/global_step735/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a5b49f28c1b0361950626913d38297c3fba05421cc74a25db27508bdc0e236df
|
3 |
+
size 12045397132
|
checkpoint-735/global_step735/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:093ea6ec3d812dfa8b2fc71fec48bd632c475c3a5ef66bb91a9534e35fb9aa15
|
3 |
+
size 12045397132
|
checkpoint-735/global_step735/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d7d1059ab87d303231b326ca8762cff546748a7f73a06f1847ad9600098e36d4
|
3 |
+
size 12045397132
|
checkpoint-735/global_step735/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:98f0aed4bc302dcd4a59563f3aad86cca0fc1f678850bcdba1a948279c3bf30d
|
3 |
+
size 12045397132
|
checkpoint-735/global_step735/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9482d5c62b7469d067561e85e0fc81e681840d2ce9e4c4a5ce7580cf074219e8
|
3 |
+
size 12045397132
|
checkpoint-735/global_step735/zero_pp_rank_0_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:85707e3c66ed553ecf00b132e407513f86ba967e7d20b1cda5fd53cdf44a9ef9
|
3 |
+
size 151013
|
checkpoint-735/global_step735/zero_pp_rank_1_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6087aac0f790586df00593737b44ea6477b4915e23f5f474c8b085aae1da34b0
|
3 |
+
size 151013
|
checkpoint-735/global_step735/zero_pp_rank_2_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:659e3b12c81ca929d8b2fa6aeb811837bef3cad619a293fb44a27c0192d7f482
|
3 |
+
size 151013
|
checkpoint-735/global_step735/zero_pp_rank_3_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b013c92e9f9959a17e9c938346144629085babeea2c312d4ca867a261279bdd0
|
3 |
+
size 151013
|
checkpoint-735/global_step735/zero_pp_rank_4_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:67679473ce6e97d93aa569cd8339a3bb58e0da550e6c597f619348e5bea8c05d
|
3 |
+
size 151013
|
checkpoint-735/global_step735/zero_pp_rank_5_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0f37971d99b34353d7f0bae48d641e061039ad55b55325cbbfdbfb6d746b5786
|
3 |
+
size 151013
|
checkpoint-735/global_step735/zero_pp_rank_6_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1c4ad2825041bef84ac26a2618a2d7450a594a2116fbab35a07b4e05e659f00b
|
3 |
+
size 151013
|
checkpoint-735/global_step735/zero_pp_rank_7_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1f8f4a23a416253dae08a11f8a65d7a5ebe068b02c27161026ece0f7d1a7d1a3
|
3 |
+
size 151013
|
checkpoint-735/model-00001-of-00004.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a10d2fecc66ef82987c5db38d13ea091c692d8283ca7ca700322209e36b78a76
|
3 |
+
size 4976698672
|
checkpoint-735/model-00002-of-00004.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:71d03e372a4df9d65bc98054e19f3cc6f67af880f07cf7a361bfbb3fad58e4ee
|
3 |
+
size 4999802720
|
checkpoint-735/model-00003-of-00004.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4ea0f9313405628d968bb8a094f622561f974c46c64098d4ba1b11ac8e2ebb69
|
3 |
+
size 4915916176
|
checkpoint-735/model-00004-of-00004.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:37dbd0c3180f533fbf39ee68d23b86ece913ce41a803b5204cf4269529df8b78
|
3 |
+
size 1168138808
|
checkpoint-735/rng_state_0.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:08282b46825aa78d10fe10e3fea89555c5b5a691b261a3ddfd58fcb58370edff
|
3 |
+
size 15984
|
checkpoint-735/rng_state_2.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:caac82d57d878d30219a4f9ec289a97ff90c53afc160b968f251b3fd3454b8d8
|
3 |
+
size 15984
|
checkpoint-735/rng_state_3.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:19762d2d370222b01817da11bbaa6665d542293373186d66f754e7246bb861ed
|
3 |
+
size 15984
|
checkpoint-735/rng_state_4.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:00c7508b346a7d3c5c23392845f1d013331114ade778794b76e919cb3ed5d33e
|
3 |
+
size 15984
|
checkpoint-735/rng_state_5.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b89de7d14dd20a191f56b74c816ef8b7fe5c171e31efbeadbf321c4539ed68c3
|
3 |
+
size 15984
|
checkpoint-735/rng_state_7.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b67db12a26a26ffe03d9afc84a43857eb2e5b2fec2dd189653b415f74208190
|
3 |
+
size 15984
|
checkpoint-735/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:807cb46baeb5b5d4d1cc00555f221aed93f81f1db4830ee42a2e37e8b4e43f95
|
3 |
+
size 1064
|
checkpoint-735/special_tokens_map.json
ADDED
@@ -0,0 +1,26 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"additional_special_tokens": [
|
3 |
+
{
|
4 |
+
"content": "<|eom_id|>",
|
5 |
+
"lstrip": false,
|
6 |
+
"normalized": false,
|
7 |
+
"rstrip": false,
|
8 |
+
"single_word": false
|
9 |
+
}
|
10 |
+
],
|
11 |
+
"bos_token": {
|
12 |
+
"content": "<|begin_of_text|>",
|
13 |
+
"lstrip": false,
|
14 |
+
"normalized": false,
|
15 |
+
"rstrip": false,
|
16 |
+
"single_word": false
|
17 |
+
},
|
18 |
+
"eos_token": {
|
19 |
+
"content": "<|eot_id|>",
|
20 |
+
"lstrip": false,
|
21 |
+
"normalized": false,
|
22 |
+
"rstrip": false,
|
23 |
+
"single_word": false
|
24 |
+
},
|
25 |
+
"pad_token": "<|eot_id|>"
|
26 |
+
}
|
checkpoint-735/training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca8468f3236591b8bc9414bf8c5e45bbc9d0c3b125c984f856d216b07a582114
|
3 |
+
size 7416
|
model-00001-of-00004.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a10d2fecc66ef82987c5db38d13ea091c692d8283ca7ca700322209e36b78a76
|
3 |
+
size 4976698672
|
model-00002-of-00004.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:71d03e372a4df9d65bc98054e19f3cc6f67af880f07cf7a361bfbb3fad58e4ee
|
3 |
+
size 4999802720
|
model-00003-of-00004.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4ea0f9313405628d968bb8a094f622561f974c46c64098d4ba1b11ac8e2ebb69
|
3 |
+
size 4915916176
|
model-00004-of-00004.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:37dbd0c3180f533fbf39ee68d23b86ece913ce41a803b5204cf4269529df8b78
|
3 |
+
size 1168138808
|