Upload 28 files
Browse files- mlc-chat-config.json +42 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
- params_shard_24.bin +3 -0
- params_shard_25.bin +3 -0
- params_shard_3.bin +3 -0
- params_shard_4.bin +3 -0
- params_shard_5.bin +3 -0
- params_shard_6.bin +3 -0
- params_shard_7.bin +3 -0
- params_shard_8.bin +3 -0
- params_shard_9.bin +3 -0
mlc-chat-config.json
ADDED
|
@@ -0,0 +1,42 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"model_type": "llama",
|
| 3 |
+
"quantization": "q4f16_1",
|
| 4 |
+
"model_config": {
|
| 5 |
+
"hidden_size": 2048,
|
| 6 |
+
"intermediate_size": 5504,
|
| 7 |
+
"num_attention_heads": 16,
|
| 8 |
+
"num_hidden_layers": 24,
|
| 9 |
+
"rms_norm_eps": 1e-05,
|
| 10 |
+
"vocab_size": 32002,
|
| 11 |
+
"position_embedding_base": 10000.0,
|
| 12 |
+
"context_window_size": 768,
|
| 13 |
+
"prefill_chunk_size": 768,
|
| 14 |
+
"num_key_value_heads": 16,
|
| 15 |
+
"head_dim": 128,
|
| 16 |
+
"tensor_parallel_shards": 1,
|
| 17 |
+
"max_batch_size": 1
|
| 18 |
+
},
|
| 19 |
+
"vocab_size": 32002,
|
| 20 |
+
"context_window_size": 768,
|
| 21 |
+
"sliding_window_size": -1,
|
| 22 |
+
"prefill_chunk_size": 768,
|
| 23 |
+
"attention_sink_size": -1,
|
| 24 |
+
"tensor_parallel_shards": 1,
|
| 25 |
+
"max_batch_size": 80,
|
| 26 |
+
"mean_gen_len": 128,
|
| 27 |
+
"max_gen_len": 512,
|
| 28 |
+
"shift_fill_factor": 0.3,
|
| 29 |
+
"temperature": 0.7,
|
| 30 |
+
"repetition_penalty": 1.0,
|
| 31 |
+
"top_p": 0.95,
|
| 32 |
+
"conv_template": "open_hermes_mistral",
|
| 33 |
+
"system": "",
|
| 34 |
+
"pad_token_id": 0,
|
| 35 |
+
"bos_token_id": 1,
|
| 36 |
+
"eos_token_id": 2,
|
| 37 |
+
"tokenizer_files": [
|
| 38 |
+
"tokenizer.json",
|
| 39 |
+
"tokenizer_config.json"
|
| 40 |
+
],
|
| 41 |
+
"version": "0.1.0"
|
| 42 |
+
}
|
ndarray-cache.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
params_shard_0.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:db0fe99f3ff8a2199019b332182bb11d63f812a7620731def3c0b3b6ddb53bb3
|
| 3 |
+
size 32770048
|
params_shard_1.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a495a79632243e914c2ed18f1fce0546dfb1ec817b60bca6b5b0a2b8ea2c2be5
|
| 3 |
+
size 32770048
|
params_shard_10.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5ab740649dd514477001eddfe3cb147d0784d5712eabb8d35f06211784c21a79
|
| 3 |
+
size 28467200
|
params_shard_11.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e852830473b6bde93b52dea54a6eaf0f61a88c002924e4daa0530db0c7aba7f0
|
| 3 |
+
size 28467200
|
params_shard_12.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:99f8c5c3e54a73cde9ce6dea091521b7bb6bdc3e165ba94046d4f97c0e7bfce4
|
| 3 |
+
size 28467200
|
params_shard_13.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0b656a33fbf64e3f08df30df89d54c8bcfa06822895d7adcc949d5a00c717ee8
|
| 3 |
+
size 28467200
|
params_shard_14.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8b8de58b4a6bf47f33526bfa8b9c1fc58f2036bcba4833e4eba9c3a0a43250c6
|
| 3 |
+
size 28467200
|
params_shard_15.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:83f75d5dcfcb1e9365ab00eb991b72466470e957dacd34795cd0a94efcc1f69e
|
| 3 |
+
size 28467200
|
params_shard_16.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1993c6f7c8fe2575ab4f40733da2be74db189acc603cef9d6b72b0314ae37562
|
| 3 |
+
size 28467200
|
params_shard_17.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fe6204381b17df490bafff30951a5f827da24679b68e3d624e82fa701a63fff6
|
| 3 |
+
size 28467200
|
params_shard_18.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dc2294d68b57bf18abb5aa661e11b1c801eb601f7f2892344f70c7d18b944b98
|
| 3 |
+
size 31563776
|
params_shard_19.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:651af8148c604b19636d488ef16ba5fae5b447ce38577089392b1972c6fefe84
|
| 3 |
+
size 28467200
|
params_shard_2.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a58c35569f8a842125e5520c408e0d2d539a6f24b222f937573a4fd1fc8da950
|
| 3 |
+
size 32866816
|
params_shard_20.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:de1727d451e48cd6913a1fd137dfcfc37e07ba19d211ae1426bc0a320744a2b2
|
| 3 |
+
size 28467200
|
params_shard_21.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:21471892f3507a40dc8d68516f8024e6ec3cdfd992f635d85b7b43dba0da8828
|
| 3 |
+
size 28467200
|
params_shard_22.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1d656044f0b4b069e255424963d8ccebf66de7df049a57f2bffa31073f891df8
|
| 3 |
+
size 28467200
|
params_shard_23.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:604aabc4d7b57936a60e57a44fefd8d4c168cb95b64fcb08f0851b8fdc905e9e
|
| 3 |
+
size 28467200
|
params_shard_24.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1e21821fb1537f088b072a0b58acaa166419c8f54a682cbaa1a22694615cd831
|
| 3 |
+
size 28467200
|
params_shard_25.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:81ffe6f6d4ae91ba8063a6ee4ba555a2d0aeee0702f6927c541b4ccf582402cb
|
| 3 |
+
size 28463104
|
params_shard_3.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e9aa928f3863e3d8114c5139be2e1fbb868a7d172c4e2d5a94be47ee78ee0c95
|
| 3 |
+
size 29171712
|
params_shard_4.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:381ad04e5142b34a2d636e3d6588e8ff10ade41d2b1e746b57a77137d60f3694
|
| 3 |
+
size 28467200
|
params_shard_5.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:46fa10dcc14bda34a5954c6f596a67a98f8e4a5f6c996fdeafae9c872d14824c
|
| 3 |
+
size 28467200
|
params_shard_6.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f9995b1a0888366b7f59d10bac156df034ac655e322c559b04b8568df50778e6
|
| 3 |
+
size 28467200
|
params_shard_7.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cbb48477acb41b494f1e4b9a5c7b0e273361fa2e722911b5bb0364d55c33461e
|
| 3 |
+
size 28467200
|
params_shard_8.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:df44fd51777abab4f34554a27e868669bb3c32813b82a5db8a011a326c991ecf
|
| 3 |
+
size 28467200
|
params_shard_9.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:74de7131d3f6e25fe6871259a95fe1dfc993121100afc40a7504e0e1bf55dbd3
|
| 3 |
+
size 28467200
|