Upload folder using huggingface_hub
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +1 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/aarch64-cu126-sm87.so +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/mlc-chat-config.json +76 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/ndarray-cache.json +0 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_0.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_1.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_10.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_100.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_101.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_102.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_103.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_104.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_105.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_106.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_107.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_108.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_109.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_11.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_110.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_111.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_112.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_113.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_114.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_115.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_116.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_117.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_118.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_119.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_12.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_120.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_121.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_122.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_123.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_124.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_125.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_126.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_127.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_128.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_129.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_13.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_130.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_131.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_132.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_133.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_134.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_135.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_136.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_137.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_138.bin +3 -0
- DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_139.bin +3 -0
.gitattributes
CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/aarch64-cu126-sm87.so filter=lfs diff=lfs merge=lfs -text
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/aarch64-cu126-sm87.so
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6277acfac1b0e45b02942bf1c4370fe4925c2c8d2c48a12c1877c08eedd3a03e
|
3 |
+
size 24358808
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/mlc-chat-config.json
ADDED
@@ -0,0 +1,76 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "qwen2",
|
4 |
+
"quantization": "q4f16_ft",
|
5 |
+
"model_config": {
|
6 |
+
"hidden_act": "silu",
|
7 |
+
"hidden_size": 5120,
|
8 |
+
"intermediate_size": 13824,
|
9 |
+
"num_attention_heads": 40,
|
10 |
+
"num_hidden_layers": 48,
|
11 |
+
"num_key_value_heads": 8,
|
12 |
+
"rms_norm_eps": 1e-05,
|
13 |
+
"rope_theta": 1000000.0,
|
14 |
+
"vocab_size": 152064,
|
15 |
+
"tie_word_embeddings": false,
|
16 |
+
"context_window_size": 131072,
|
17 |
+
"prefill_chunk_size": 8192,
|
18 |
+
"tensor_parallel_shards": 1,
|
19 |
+
"head_dim": 128,
|
20 |
+
"dtype": "float32",
|
21 |
+
"max_batch_size": 1
|
22 |
+
},
|
23 |
+
"vocab_size": 152064,
|
24 |
+
"context_window_size": 131072,
|
25 |
+
"sliding_window_size": -1,
|
26 |
+
"prefill_chunk_size": 8192,
|
27 |
+
"attention_sink_size": -1,
|
28 |
+
"tensor_parallel_shards": 1,
|
29 |
+
"pipeline_parallel_stages": 1,
|
30 |
+
"temperature": 0.6,
|
31 |
+
"presence_penalty": 0.0,
|
32 |
+
"frequency_penalty": 0.0,
|
33 |
+
"repetition_penalty": 1.0,
|
34 |
+
"top_p": 0.95,
|
35 |
+
"tokenizer_files": [
|
36 |
+
"tokenizer.json",
|
37 |
+
"tokenizer_config.json"
|
38 |
+
],
|
39 |
+
"tokenizer_info": {
|
40 |
+
"token_postproc_method": "byte_level",
|
41 |
+
"prepend_space_in_encode": false,
|
42 |
+
"strip_space_in_decode": false
|
43 |
+
},
|
44 |
+
"conv_template": {
|
45 |
+
"name": "deepseek_r1_qwen",
|
46 |
+
"system_template": "<\uff5cbegin\u2581of\u2581sentence\uff5c>{system_message}",
|
47 |
+
"system_message": "You are a helpful assistant.",
|
48 |
+
"system_prefix_token_ids": null,
|
49 |
+
"add_role_after_system_message": true,
|
50 |
+
"roles": {
|
51 |
+
"user": "<\uff5cUser\uff5c>",
|
52 |
+
"assistant": "<\uff5cAssistant\uff5c>"
|
53 |
+
},
|
54 |
+
"role_templates": {
|
55 |
+
"user": "{user_message}",
|
56 |
+
"assistant": "{assistant_message}",
|
57 |
+
"tool": "{tool_message}"
|
58 |
+
},
|
59 |
+
"messages": [],
|
60 |
+
"seps": [
|
61 |
+
"",
|
62 |
+
"<\uff5cend\u2581of\u2581sentence\uff5c>"
|
63 |
+
],
|
64 |
+
"role_content_sep": "",
|
65 |
+
"role_empty_sep": "",
|
66 |
+
"stop_str": [],
|
67 |
+
"stop_token_ids": [
|
68 |
+
151643
|
69 |
+
],
|
70 |
+
"function_string": "",
|
71 |
+
"use_function_calling": false
|
72 |
+
},
|
73 |
+
"pad_token_id": 0,
|
74 |
+
"bos_token_id": 151646,
|
75 |
+
"eos_token_id": 151643
|
76 |
+
}
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e420aaab6f44df1e1b1b8a82fd411547d633850350c623e8aa7f8ee8082ecf9
|
3 |
+
size 389283840
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2543f0b530d797bed53e2eba964564165253ed78d0e614477234956c898927ac
|
3 |
+
size 48660480
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3aaee67da8860e9cb52c73704c1ec3f056ee80a817d6708fd64540bcb3eeea21
|
3 |
+
size 35389440
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:43e33636eb95d1d0dddbfdad1b2f5b718b7c60536d2bdb9c3c662dbbbef77d87
|
3 |
+
size 35389440
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2d71a397f1a39ff5f49c981f8b078a602276c2eb02e47af6995184a54cb2141e
|
3 |
+
size 31582208
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3a2f535b9b6af0086620c925bf22405807aae6073f042a2bfdf9649fa45e3378
|
3 |
+
size 70778880
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d906500233dead750182ed7b9579ec27a8ce40ca1ef9bf3b293eafe2a49fdaae
|
3 |
+
size 35389440
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df8e27d55209a5b6836fb37b17776bf6e46150d8a691bf57ab86c30b26dd914a
|
3 |
+
size 31582208
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:de4c22c8b4f57ea5bac81a3e4e4bebdac914d42eea8bc7f81ad8033255b6cd0a
|
3 |
+
size 70778880
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b39dffc6592c615000ad7a1c20608bd285d9779662691f87158f221854142f69
|
3 |
+
size 35389440
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1c28ceb64ccfd0b1a37fc667a3c02ba1a308bd3d03cef93fa3a2edd1350af941
|
3 |
+
size 31582208
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_108.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7afdf7ec6bbf7310b679aab5ecb942144bad5ee60ff9c8887b84001185debb23
|
3 |
+
size 70778880
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_109.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:30b8fc6be9372f1deb3fbfdaffadb4c91be9291263c57b957a9e6c9ed4a36d1f
|
3 |
+
size 35389440
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fbb8e8ec4a110064c58571b531e38321ae11aa97f167045881a0cc35091caa1b
|
3 |
+
size 31582208
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_110.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5323425299dba42a93a99273b28135de52d03a897b82e85f5d40d6dbaf33e949
|
3 |
+
size 31582208
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_111.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e84dddce2a9df36678341b533a55cd9c6f23b7a2c2e3a0979cedf916fc8d228b
|
3 |
+
size 70778880
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_112.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3bfdf3277daf9bc7d8c9c2cfeea85948a7d5b2e099bffc3c6d9c862cdc22ef07
|
3 |
+
size 35389440
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_113.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f838908bb15381693091b2eb8452e22e7f351294967d0cf18adb43c6fa3ec52e
|
3 |
+
size 31582208
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_114.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:116a9717ca1a525aa5940e6ca4de6080de0b0133562e1393c3bf1c00a7c11ac8
|
3 |
+
size 70778880
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_115.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bbeb0615ee5657a4a7d3048ce701a8c1c00fb3ca4e60deae75a4b7d63d132f0e
|
3 |
+
size 35389440
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_116.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6154ef0363a4793b5e6007b4a579da47e5c4309097a70f59f71d7b2bf32bba21
|
3 |
+
size 31582208
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_117.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:170fec721e732ede328c5377779c8fe70c97137ae5505ba722ee02392499ebbe
|
3 |
+
size 70778880
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_118.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e42fe669cbb8c3e9c3013a769892e3912c15beb732559cf2ef5331f8dfb21dc
|
3 |
+
size 35389440
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_119.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c68c5a095c0cee90fbf2955e34c3d9ac743b180dac3c8e1c98d7e11be2a1f42a
|
3 |
+
size 31582208
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4f207329ab1c89d2944e06914d331539e2543edb759a7778f68a72a79c8e3b89
|
3 |
+
size 70778880
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_120.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fbcee5362934dce69a40fab5ff00fab8ef937451f479a2a340276d87c05fb194
|
3 |
+
size 70778880
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_121.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:187017b7577b4d628eb85d114eb887670d17470e43f602f08edacb7ae824728e
|
3 |
+
size 35389440
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_122.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cd3b5f602f0c7a252df505178d76c42fa7bd893197a2463d6b771547b96f44ac
|
3 |
+
size 31582208
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_123.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:36d255198f1da2d54ec03fc87be8a49429eccecbc639097bac1ce16d9280bd03
|
3 |
+
size 70778880
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_124.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:208d9dabdda69b99290221a55ac7b585ad10c3d93881ab17db39b035d14834d4
|
3 |
+
size 35389440
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_125.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f52be3b5989609e9a34891d40aaada0b0f007638753b3cbfb0a2e7851ed36d26
|
3 |
+
size 31582208
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_126.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e63678bc68a311d09ff597185ed21fbe1bd873caf793b44e5d2f3270a2668eda
|
3 |
+
size 70778880
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_127.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:13b023734a59ebd589d70fc305feebc2ed1d9b9ef6f75f91208f6a172af55c69
|
3 |
+
size 35389440
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_128.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:11ac4c13df2db43bc9daa88ad18e1494adfa68d13d00a261672c12d5745521ce
|
3 |
+
size 31582208
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1c6e88904554564e12dfdc532a3350dca5e123a65a3cbe807954d5b73c556fe2
|
3 |
+
size 70778880
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df7800eaa1734b1ffc0909e988d4921e0fff0fd177128109a2cde39f10122579
|
3 |
+
size 35389440
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_130.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:37b6e19a434d4aedcae5a69a60c2e7c6fdd8c90328cf9bb41c627cbe91e9649e
|
3 |
+
size 35389440
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_131.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e508a8fe331f60fd0879ab28740ef2a1b7bc56de49a24e73d9a9bdd82df01b0e
|
3 |
+
size 31582208
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_132.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:47cb316cc428fdd444048b26919cd85d203498bfec39de5456d675fab820dcd1
|
3 |
+
size 70778880
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_133.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:abb6db9b570b99cc650518ba56d40d2de10b0e61dad5a4fee67c180b07b16ee9
|
3 |
+
size 35389440
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_134.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:50cb20ba949b6855bfd2e7714a1fa832f124f7fa6c1d9afe1faa6a9805b21609
|
3 |
+
size 31582208
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_135.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a81df72878d41057e9005eadbb4a538ba4aa725c2d5f4716b8f113c45618c500
|
3 |
+
size 70778880
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_136.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d8a22693fc7c7c1eefe9db8c146e0b9649dc8b54e06c040462bede0a088f4a8d
|
3 |
+
size 35389440
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_137.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab343588736c97eb67af903f896a99dde70d670acb085b6569a945896c19c054
|
3 |
+
size 31582208
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_138.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b83a4d8cfc4bcab0863c38735023ccf8aa154a056037cfbe301b924c76eef3f
|
3 |
+
size 70778880
|
DeepSeek-R1-Distill-Qwen-14B-q4f16_ft-MLC/params_shard_139.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1c2be28b87ad9216672e0cfa130aa1c931f31f44f555c4019e1c6b6e04a084b6
|
3 |
+
size 35389440
|