ShawLiu
commited on
Commit
·
321cfb6
1
Parent(s):
2277342
Init
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- config.json +30 -0
- generation_config.json +6 -0
- model-00001-of-00082.safetensors +3 -0
- model-00002-of-00082.safetensors +3 -0
- model-00003-of-00082.safetensors +3 -0
- model-00004-of-00082.safetensors +3 -0
- model-00005-of-00082.safetensors +3 -0
- model-00006-of-00082.safetensors +3 -0
- model-00007-of-00082.safetensors +3 -0
- model-00008-of-00082.safetensors +3 -0
- model-00009-of-00082.safetensors +3 -0
- model-00010-of-00082.safetensors +3 -0
- model-00011-of-00082.safetensors +3 -0
- model-00012-of-00082.safetensors +3 -0
- model-00013-of-00082.safetensors +3 -0
- model-00014-of-00082.safetensors +3 -0
- model-00015-of-00082.safetensors +3 -0
- model-00016-of-00082.safetensors +3 -0
- model-00017-of-00082.safetensors +3 -0
- model-00018-of-00082.safetensors +3 -0
- model-00019-of-00082.safetensors +3 -0
- model-00020-of-00082.safetensors +3 -0
- model-00021-of-00082.safetensors +3 -0
- model-00022-of-00082.safetensors +3 -0
- model-00023-of-00082.safetensors +3 -0
- model-00024-of-00082.safetensors +3 -0
- model-00025-of-00082.safetensors +3 -0
- model-00026-of-00082.safetensors +3 -0
- model-00027-of-00082.safetensors +3 -0
- model-00028-of-00082.safetensors +3 -0
- model-00029-of-00082.safetensors +3 -0
- model-00030-of-00082.safetensors +3 -0
- model-00031-of-00082.safetensors +3 -0
- model-00032-of-00082.safetensors +3 -0
- model-00033-of-00082.safetensors +3 -0
- model-00034-of-00082.safetensors +3 -0
- model-00035-of-00082.safetensors +3 -0
- model-00036-of-00082.safetensors +3 -0
- model-00037-of-00082.safetensors +3 -0
- model-00038-of-00082.safetensors +3 -0
- model-00039-of-00082.safetensors +3 -0
- model-00040-of-00082.safetensors +3 -0
- model-00041-of-00082.safetensors +3 -0
- model-00042-of-00082.safetensors +3 -0
- model-00043-of-00082.safetensors +3 -0
- model-00044-of-00082.safetensors +3 -0
- model-00045-of-00082.safetensors +3 -0
- model-00046-of-00082.safetensors +3 -0
- model-00047-of-00082.safetensors +3 -0
- model-00048-of-00082.safetensors +3 -0
config.json
ADDED
@@ -0,0 +1,30 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "/workspace/hanyu/hanyu/ckpt/meta-llama-3-70b-instruct",
|
3 |
+
"architectures": [
|
4 |
+
"LlamaForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": false,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 128000,
|
9 |
+
"eos_token_id": 128001,
|
10 |
+
"head_dim": 128,
|
11 |
+
"hidden_act": "silu",
|
12 |
+
"hidden_size": 8192,
|
13 |
+
"initializer_range": 0.02,
|
14 |
+
"intermediate_size": 28672,
|
15 |
+
"max_position_embeddings": 16384,
|
16 |
+
"mlp_bias": false,
|
17 |
+
"model_type": "llama",
|
18 |
+
"num_attention_heads": 64,
|
19 |
+
"num_hidden_layers": 80,
|
20 |
+
"num_key_value_heads": 8,
|
21 |
+
"pretraining_tp": 1,
|
22 |
+
"rms_norm_eps": 1e-05,
|
23 |
+
"rope_scaling": null,
|
24 |
+
"rope_theta": 500000.0,
|
25 |
+
"tie_word_embeddings": false,
|
26 |
+
"torch_dtype": "bfloat16",
|
27 |
+
"transformers_version": "4.45.2",
|
28 |
+
"use_cache": true,
|
29 |
+
"vocab_size": 128256
|
30 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"bos_token_id": 128000,
|
4 |
+
"eos_token_id": 128001,
|
5 |
+
"transformers_version": "4.45.2"
|
6 |
+
}
|
model-00001-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e982ea8f60fc718c9d2cba8c5d3b70366c60195c686a4a3a38b3778ea75f5f4d
|
3 |
+
size 2101346448
|
model-00002-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:34129c719e9f407e74168546970669d81015eb9cb41ace5fc6c564da83313cea
|
3 |
+
size 1879082376
|
model-00003-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:091bf08cea3d3010e753184c29acd3291dcbc6ca2fc863320522560ffcc69ef1
|
3 |
+
size 1845527704
|
model-00004-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4159b0e443108f61677452ba96e503101a8c4ac7a93c41acda19a6675e5bccaa
|
3 |
+
size 1711309864
|
model-00005-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2b5b68fc93edfc13d799cea64039b880c10bc2e0c9ba4bc528da9593032a7885
|
3 |
+
size 1711309864
|
model-00006-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:02e92efb380e37bd30a93db25ec6d35e1f2b97fe3b48c08464c587395b5cc4ad
|
3 |
+
size 1711309864
|
model-00007-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f1caa7f5ad3d98b5a99a3d6126e1fbb983c2d6b5df643a2495534ba2daf9832c
|
3 |
+
size 1711309864
|
model-00008-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1d90ded0fb5dd393b4b69fa9c7c3d28259b6e6c3349da9b8553ef1a57c8384d9
|
3 |
+
size 1711309864
|
model-00009-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c5f7cef642169a5e6df6e12232d332a0f8212cb08442ec7ebeb78845ec4c5778
|
3 |
+
size 1711309864
|
model-00010-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e0210c88aa21553f586301bf90173d7dfdc88d2e8d08cca8a60f979ffeaf1fea
|
3 |
+
size 1711309864
|
model-00011-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:920b48358e7c265e4bd4ee92fb9ce86f68ae696b2b25336aa29f93c114eecba3
|
3 |
+
size 1711309864
|
model-00012-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:38d2575629f839686056ac07a929575de03b207e4ac12045f2a6b8efb4aed896
|
3 |
+
size 1711309872
|
model-00013-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c1c1d06800381779b918509ab2285896aec0434d5831f321b0dfb7d6053cf65a
|
3 |
+
size 1711309872
|
model-00014-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:691af48a4c4ba8ce80725fc08086a31d104516df7a0131f0e189a7375ddafa46
|
3 |
+
size 1711309872
|
model-00015-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:43fd353f72876835f70b6e0256fec9f4175c832e6ffb1457769785f03d16b3e5
|
3 |
+
size 1711309872
|
model-00016-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9928dd3a43aea81299ae8a82636dceb326202b8178950dc55e45d241d8263f7b
|
3 |
+
size 1711309872
|
model-00017-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7855503ed4fa69e9622fb6ba16be9fa21f3abf706f331f37cbd6b340870b48a5
|
3 |
+
size 1711309872
|
model-00018-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:05588d52fbe944780ec66640aa1d817c16246c21b9a09efb4cfe55c0d92ca0d1
|
3 |
+
size 1711309872
|
model-00019-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8037a125415837f3bc2c8c2f834bf3ae22ae79c2c92b6854041c64c40a83a251
|
3 |
+
size 1711309872
|
model-00020-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c75854e06cdf70aff48887700fca1b15abf7c7d1624922b801f82e12defdbdfc
|
3 |
+
size 1711309872
|
model-00021-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5d7d8b26abaacac3c8a786afd4a1f9e5db5c7f7aead12a3d0690dcd73f752d6f
|
3 |
+
size 1711309872
|
model-00022-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f59b8b8cafe47899423d65f134917381185ce3c3690323b7b4e967f6e70ce22
|
3 |
+
size 1711309872
|
model-00023-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3a9e1ba98999bc52694e413fefedc8a40a8f9e876f600c5285469a028055135e
|
3 |
+
size 1711309872
|
model-00024-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d16252fdd4e22779ddb8e158af404d7ca5a76873fe12c967f355fb9fb737d1b5
|
3 |
+
size 1711309872
|
model-00025-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fdb04014628e0ad92038bd32830dcc5470a8c6895286245d6baa129eddef8623
|
3 |
+
size 1711309872
|
model-00026-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:413e6646f15f31ee93daadab91063dc4926e117249fc1e08709ffd494bad8a83
|
3 |
+
size 1711309872
|
model-00027-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b4619dfa4b7ab35d6c09a56a71e5afa0967e859de4f1a0f4d62645a32f10cc0d
|
3 |
+
size 1711309872
|
model-00028-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f96abaaf554dab5d5dc6a9cb52583088f3eca41043515ded2df0a958c933c9b
|
3 |
+
size 1711309872
|
model-00029-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6f2bde6a1dac986d2e1d2a5e79ced7febf92dfde98e7dae5ea0a24c171af5fa2
|
3 |
+
size 1711309872
|
model-00030-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c7a379e07a2de1a1ca85c394e9425de9bfce4b8c1515a95e652b707f6e1786b
|
3 |
+
size 1711309872
|
model-00031-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bbadd8a390f05e3519b69941fb4c188597190cd9331d5d11e1dafd09adcb6885
|
3 |
+
size 1711309872
|
model-00032-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:88544230b3a2182ee08480b4087ae90b640aae4cf5db9cffa068843b6305730c
|
3 |
+
size 1711309872
|
model-00033-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:89cabf8df7703a4c2860bef33463549e616c6593d2f4b5a082f8b833e141e39c
|
3 |
+
size 1711309872
|
model-00034-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8808964780eec93c6ad988dc2ddf31b01a250f21a718815d6c9e6f647e1293db
|
3 |
+
size 1711309872
|
model-00035-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d88a2d0ddc04da6d4f627409793133a6b95d43177df90811d4099118f02bca4d
|
3 |
+
size 1711309872
|
model-00036-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca5fa4c960199e07e703522ba92015fcc913afa263e3120962cda7fbe5e4d69b
|
3 |
+
size 1711309872
|
model-00037-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:336859db8158260491ada8d2dfeb4d93ad6fc6116942bd56688a43083c612131
|
3 |
+
size 1711309872
|
model-00038-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e15e5086029e1f7484861b0a93221247279b03187478b2a951ee0abdfa42921a
|
3 |
+
size 1711309872
|
model-00039-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dd1153f7c8476c7179b41a92657f85c4664b9f9f1c648d57932b603bfb0ffd0b
|
3 |
+
size 1711309872
|
model-00040-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e75cac1e0747ec244e53100dff3d577337fd768eac54fdd0cbc348bb2189f364
|
3 |
+
size 1711309872
|
model-00041-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a7aadbe2832f61885792439b2cf780df59373fcd4a4f09600a89fd25c4b67c7f
|
3 |
+
size 1711309872
|
model-00042-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5dfdcbb144c27dfad06d581985780cfc0aeb1d20d0c3adf3400addefd53c438a
|
3 |
+
size 1711309872
|
model-00043-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5479903e04b4f63e5eb64e5e5086f5b414b3310984ae868c0e96e55df7d44f6c
|
3 |
+
size 1711309872
|
model-00044-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:41bc062b37f4a1c5dac7ce1c7239c964126a4fc010abd932530e2f1ff6ebac6e
|
3 |
+
size 1711309872
|
model-00045-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:02cc9ba12035ff6b793d407df3ab4fd324b786d9cb22a5ca671b24bed6849695
|
3 |
+
size 1711309872
|
model-00046-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e410c7c5dc5e006e906d724dc5682fe581d6396b4ed51158e68507f2f5c56931
|
3 |
+
size 1711309872
|
model-00047-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3f21c5c607e01c76182a19f64f09a227b640ab80179c3e738d68ecdf21411ef7
|
3 |
+
size 1711309872
|
model-00048-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a7b7fda12f7a96c70ba6f3344de2eca138cf8a18a9f4552081eed89af2689ae2
|
3 |
+
size 1711309872
|