zackli4ai committed on
Commit
6bfaf0f
·
verified ·
1 Parent(s): d8e1af6

Upload 544 files

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. .gitattributes +6 -0
  2. config.json +51 -0
  3. decoder_layer_0.blob +3 -0
  4. decoder_layer_1.blob +3 -0
  5. decoder_layer_prefill.blob +3 -0
  6. embedding_post.blob +3 -0
  7. embedding_post_prefill.blob +3 -0
  8. generation_config.json +9 -0
  9. lm_head.blob +3 -0
  10. model_weights/model_0_input_10.bin +3 -0
  11. model_weights/model_0_input_11.bin +3 -0
  12. model_weights/model_0_input_12.bin +3 -0
  13. model_weights/model_0_input_13.bin +3 -0
  14. model_weights/model_0_input_14.bin +3 -0
  15. model_weights/model_0_input_15.bin +3 -0
  16. model_weights/model_0_input_16.bin +3 -0
  17. model_weights/model_0_input_17.bin +3 -0
  18. model_weights/model_0_input_18.bin +3 -0
  19. model_weights/model_0_input_19.bin +3 -0
  20. model_weights/model_0_input_20.bin +3 -0
  21. model_weights/model_0_input_21.bin +3 -0
  22. model_weights/model_0_input_3.bin +3 -0
  23. model_weights/model_0_input_4.bin +3 -0
  24. model_weights/model_0_input_5.bin +3 -0
  25. model_weights/model_0_input_6.bin +3 -0
  26. model_weights/model_0_input_7.bin +3 -0
  27. model_weights/model_0_input_8.bin +3 -0
  28. model_weights/model_0_input_9.bin +3 -0
  29. model_weights/model_10_input_10.bin +3 -0
  30. model_weights/model_10_input_11.bin +3 -0
  31. model_weights/model_10_input_12.bin +3 -0
  32. model_weights/model_10_input_13.bin +3 -0
  33. model_weights/model_10_input_14.bin +3 -0
  34. model_weights/model_10_input_15.bin +3 -0
  35. model_weights/model_10_input_16.bin +3 -0
  36. model_weights/model_10_input_17.bin +3 -0
  37. model_weights/model_10_input_18.bin +3 -0
  38. model_weights/model_10_input_19.bin +3 -0
  39. model_weights/model_10_input_20.bin +3 -0
  40. model_weights/model_10_input_21.bin +3 -0
  41. model_weights/model_10_input_3.bin +3 -0
  42. model_weights/model_10_input_4.bin +3 -0
  43. model_weights/model_10_input_5.bin +3 -0
  44. model_weights/model_10_input_6.bin +3 -0
  45. model_weights/model_10_input_7.bin +3 -0
  46. model_weights/model_10_input_8.bin +3 -0
  47. model_weights/model_10_input_9.bin +3 -0
  48. model_weights/model_11_input_10.bin +3 -0
  49. model_weights/model_11_input_11.bin +3 -0
  50. model_weights/model_11_input_12.bin +3 -0
.gitattributes CHANGED
@@ -33,3 +33,9 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ decoder_layer_0.blob filter=lfs diff=lfs merge=lfs -text
37
+ decoder_layer_1.blob filter=lfs diff=lfs merge=lfs -text
38
+ decoder_layer_prefill.blob filter=lfs diff=lfs merge=lfs -text
39
+ embedding_post_prefill.blob filter=lfs diff=lfs merge=lfs -text
40
+ embedding_post.blob filter=lfs diff=lfs merge=lfs -text
41
+ lm_head.blob filter=lfs diff=lfs merge=lfs -text
config.json ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "DeepSeek-R1-Distill-Qwen-7B",
3
+ "architectures": [
4
+ "Qwen2ForCausalLM"
5
+ ],
6
+ "asym": false,
7
+ "attention_dropout": 0.0,
8
+ "bigdl_transformers_low_bit": "sym_int4_rtn",
9
+ "bos_token_id": 151643,
10
+ "const_parameter": true,
11
+ "cos_sin_input": true,
12
+ "embedding_post": true,
13
+ "eos_token_id": 151643,
14
+ "fused_layers": 2,
15
+ "group_size": 0,
16
+ "head_dim": 128,
17
+ "hidden_act": "silu",
18
+ "hidden_size": 3584,
19
+ "initializer_range": 0.02,
20
+ "intermediate_size": 18944,
21
+ "kv_len": 1023,
22
+ "lm_head_low_bit": "sym_int4_rtn",
23
+ "max_position_embeddings": 131072,
24
+ "max_prompt_len": 512,
25
+ "max_window_layers": 28,
26
+ "mixed_precision": false,
27
+ "model_type": "qwen2",
28
+ "n_splits_down_proj": 2,
29
+ "n_splits_linear": 1,
30
+ "num_attention_heads": 28,
31
+ "num_head": 28,
32
+ "num_hidden_layers": 28,
33
+ "num_key_value_heads": 4,
34
+ "optimize_model": true,
35
+ "qkv_bias": true,
36
+ "rms_norm_eps": 1e-06,
37
+ "rope_scaling": null,
38
+ "rope_theta": 10000,
39
+ "sliding_window": null,
40
+ "tie_word_embeddings": false,
41
+ "torch_dtype": "float16",
42
+ "transformers_version": "4.45.0",
43
+ "transpose_value_cache": true,
44
+ "use_cache": true,
45
+ "use_mrope": false,
46
+ "use_prefill_sdp": false,
47
+ "use_sliding_window": false,
48
+ "vocab_size": 152064,
49
+ "weight_idx": 8,
50
+ "weight_num": 7
51
+ }
decoder_layer_0.blob ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a805efd6dee09d5fe88b71744ba6e42158e926c7e76d1b4a8557c7a1533e730a
3
+ size 19344440
decoder_layer_1.blob ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0989654f0d95ad741c6e3df40c5187a33308a504b53e5e8720d681e448841af8
3
+ size 19344440
decoder_layer_prefill.blob ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81b460571b964d30618bc0737b40872cfabad4e2e497379a8398316c4125d1f1
3
+ size 13843512
embedding_post.blob ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b757369422e940f131a9b38e9fbd1bff053f1ceb18422dd474905d953ccd678
3
+ size 167456
embedding_post_prefill.blob ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dac4e21394beb5f9c1859d79a7ab17a72b60623c12e8558acd2ee26ce59964ca
3
+ size 196552
generation_config.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 151646,
4
+ "do_sample": true,
5
+ "eos_token_id": 151643,
6
+ "temperature": 0.6,
7
+ "top_p": 0.95,
8
+ "transformers_version": "4.45.0"
9
+ }
lm_head.blob ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93e65e84e1f960189f8afadc094a07a2c79adfab6b6f8adb52866c3c0cce7615
3
+ size 22843552
model_weights/model_0_input_10.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe0705765e3f3d616ab9b035a3795a53c5b9a50dd2978a24e8699d03d6bc8ddf
3
+ size 917504
model_weights/model_0_input_11.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3cf9cebecc73530f9ce251cedde0e7afc7652a0368ba232ebb73aaabc526c59d
3
+ size 1024
model_weights/model_0_input_12.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ce7a9c0e34a80dc5f7b4644dc758ffd0f86cd1087acc53315de44b62cc97033
3
+ size 917504
model_weights/model_0_input_13.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fd96d30bbd633811673bd68d7def881842264d97b5ee7ebdb7e45ac85dabca59
3
+ size 1024
model_weights/model_0_input_14.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3966367f65dda7cbb6d366b1af760f88b1a4875233e18d17b5b652a43baf72b6
3
+ size 6422528
model_weights/model_0_input_15.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ebaf02ae3ce7128b818da938de6d826ef0a01f8ad494253a06521a00536ab427
3
+ size 7168
model_weights/model_0_input_16.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba44462e3b5ca003e2e90add31aef37db5540a00c7ef25c8dc028c90571c1331
3
+ size 33947648
model_weights/model_0_input_17.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47df6118708c8ca234268344df565e46ab9483d03f12d6193d414212b51d6b21
3
+ size 37888
model_weights/model_0_input_18.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a92fdce1c88a11677c20333a4c83e9a35c135026b6ff03f95093ea1941d7fc53
3
+ size 33947648
model_weights/model_0_input_19.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf78e5ffbf28532b34a78ff0187d53217675c84fbeb706df55c505e7c935ed75
3
+ size 37888
model_weights/model_0_input_20.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f93512a014c556ebeb2476830fc31855d4257db100011adb4097928bde624f89
3
+ size 33947648
model_weights/model_0_input_21.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:68001a81330eab620b8c583a9045d918c2278e427d0b026c021da78153cff445
3
+ size 14336
model_weights/model_0_input_3.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1dcd76bc2917f9ffde8a81d59efc2e26a388c9cdbbe482942699e8ba19c9788c
3
+ size 7168
model_weights/model_0_input_4.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:90b67d92e60416a625c36afe2b4a5d0cc08316ae799f5982e6237b4b3c4a47b4
3
+ size 7168
model_weights/model_0_input_5.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35ff901910758b998a703afae819d51ca6768638bd0504871179cc9e410ad394
3
+ size 7168
model_weights/model_0_input_6.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7cde24cc4a0e74ebec5d4823c21712e5679659c00448b46d5b209ef4e2c0c011
3
+ size 1024
model_weights/model_0_input_7.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de68c262f4fb1897b8a781b90684c9b0b3d29d0f2306fd51b243438541138b06
3
+ size 1024
model_weights/model_0_input_8.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b578073288598f5a7b0bf2a02ebcef6bae62ac5fbb9f5f30b7685a80192f96ec
3
+ size 6422528
model_weights/model_0_input_9.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:448a37c9944d9d6248cfcddf4ce8181f317a55b0203aa381ebf056c770198724
3
+ size 7168
model_weights/model_10_input_10.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:83506a174fee16cd2d91d3bb7d7556c93f03d77eff4c7d61dca39a150de66ef3
3
+ size 917504
model_weights/model_10_input_11.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b35105cf9dd4cfd12eaa7e6458ed2b6c006e55f9ac2301ed19781366e31e5524
3
+ size 1024
model_weights/model_10_input_12.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ecb3c6340bbf9044c771a6c026b4a3717d671a844d3b5e9305d9b1e9aa6377f9
3
+ size 917504
model_weights/model_10_input_13.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a5f65c4b881908ae01596b4d161dda5b38f665a955036ec5a451dd7ec31a302
3
+ size 1024
model_weights/model_10_input_14.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb79aa20796060bc7dbed8e57f5f5d60f75f711d302673d0be8c3687884ea43c
3
+ size 6422528
model_weights/model_10_input_15.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f4b6c26dd66f39f818ffa312de4803760b12907b42be6ec2c42174b60cff9209
3
+ size 7168
model_weights/model_10_input_16.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29b260650196fb9c62cfa17feb4908ac8a80c239682671d9de5bb82205d86d1f
3
+ size 33947648
model_weights/model_10_input_17.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:783198914eeb1364b1d51c13cc210fdebc044018ab609e55bfbf77265ce6dc79
3
+ size 37888
model_weights/model_10_input_18.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:323225207b87cdd6a8aa1f2623828cab6a40f8a1785bf40bc41555badc680fdf
3
+ size 33947648
model_weights/model_10_input_19.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f110a38811b0a7e1b32aca8a987e4cd33a668b50adf64a8d938d947620429dd4
3
+ size 37888
model_weights/model_10_input_20.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4fab998a0bd1d2407468e57d18618df690a8125104ab53a6c754891a3ad1f3a
3
+ size 33947648
model_weights/model_10_input_21.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9de03b9b7d8961dc8e08970817ec8fc9637e9928db89edc7910456034549a258
3
+ size 14336
model_weights/model_10_input_3.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:11ce29112f292653b0819095b30cabd1683004343b7a2c3b7ca83b04f63a1afd
3
+ size 7168
model_weights/model_10_input_4.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b8cd9efbd7a736eaa1f9fa1b3e9985ab5f82b2e5ac62246a7fec5a94666f092
3
+ size 7168
model_weights/model_10_input_5.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a2738756c9a3b6a4fbfab49f5af007e638ddf292c33fbe71b4dc14755cc5574
3
+ size 7168
model_weights/model_10_input_6.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:610737cfcfdd871e051924d9bdb0251501abef91a36efcf2e5f92e5b41cd43a5
3
+ size 1024
model_weights/model_10_input_7.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93a604e1a19946e519ddb25517baeaefc910ef8c6166b5874db85556fff8dcbf
3
+ size 1024
model_weights/model_10_input_8.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d902c2a5671bf58940293d1b94645d79cd7f1f1681cc18607375a44653e0dce1
3
+ size 6422528
model_weights/model_10_input_9.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d11dd4648136040bcd09b7fa0d9da499fe47bb4c2de692c8a20f51e1c36060e
3
+ size 7168
model_weights/model_11_input_10.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c492841fda47b293a2c9699b6be00648e0005b5810e1a372cd04943c2469853e
3
+ size 917504
model_weights/model_11_input_11.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:397b0960773173ae55211bbdc1efd81bd4b6df5b6c6703768dd6662073571218
3
+ size 1024
model_weights/model_11_input_12.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69fb43c76497c4a4f64578b033a68e69340780e7223b4291862a98881dd04c12
3
+ size 917504