Upload folder using huggingface_hub
Browse files- README.md +8 -2
- mergekit_config.yml +5 -0
- model-00001-of-00004.safetensors +1 -1
- model-00002-of-00004.safetensors +1 -1
- model-00003-of-00004.safetensors +1 -1
- model-00004-of-00004.safetensors +1 -1
README.md
CHANGED
|
@@ -19,9 +19,10 @@ This model was merged using the [TIES](https://arxiv.org/abs/2306.01708) merge m
|
|
| 19 |
### Models Merged
|
| 20 |
|
| 21 |
The following models were included in the merge:
|
| 22 |
-
* ./full_model_2
|
| 23 |
-
* ./full_model_0
|
| 24 |
* ./full_model_1
|
|
|
|
|
|
|
|
|
|
| 25 |
|
| 26 |
### Configuration
|
| 27 |
|
|
@@ -45,6 +46,11 @@ models:
|
|
| 45 |
density: 0.5 # Keeps the top 50% of most changed weights
|
| 46 |
weight: 0.33 # Give each model roughly equal weight
|
| 47 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 48 |
merge_method: ties
|
| 49 |
base_model: GoToCompany/llama3-8b-cpt-sahabatai-v1-instruct # TIES needs the original base model
|
| 50 |
parameters:
|
|
|
|
| 19 |
### Models Merged
|
| 20 |
|
| 21 |
The following models were included in the merge:
|
|
|
|
|
|
|
| 22 |
* ./full_model_1
|
| 23 |
+
* ./full_model_0
|
| 24 |
+
* ./full_model_3
|
| 25 |
+
* ./full_model_2
|
| 26 |
|
| 27 |
### Configuration
|
| 28 |
|
|
|
|
| 46 |
density: 0.5 # Keeps the top 50% of most changed weights
|
| 47 |
weight: 0.33 # Give each model roughly equal weight
|
| 48 |
|
| 49 |
+
- model: ./full_model_3
|
| 50 |
+
parameters:
|
| 51 |
+
density: 0.5 # Keeps the top 50% of most changed weights
|
| 52 |
+
weight: 0.33 # Give each model roughly equal weight
|
| 53 |
+
|
| 54 |
merge_method: ties
|
| 55 |
base_model: GoToCompany/llama3-8b-cpt-sahabatai-v1-instruct # TIES needs the original base model
|
| 56 |
parameters:
|
mergekit_config.yml
CHANGED
|
@@ -15,6 +15,11 @@ models:
|
|
| 15 |
density: 0.5 # Keeps the top 50% of most changed weights
|
| 16 |
weight: 0.33 # Give each model roughly equal weight
|
| 17 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 18 |
merge_method: ties
|
| 19 |
base_model: GoToCompany/llama3-8b-cpt-sahabatai-v1-instruct # TIES needs the original base model
|
| 20 |
parameters:
|
|
|
|
| 15 |
density: 0.5 # Keeps the top 50% of most changed weights
|
| 16 |
weight: 0.33 # Give each model roughly equal weight
|
| 17 |
|
| 18 |
+
- model: ./full_model_3
|
| 19 |
+
parameters:
|
| 20 |
+
density: 0.5 # Keeps the top 50% of most changed weights
|
| 21 |
+
weight: 0.33 # Give each model roughly equal weight
|
| 22 |
+
|
| 23 |
merge_method: ties
|
| 24 |
base_model: GoToCompany/llama3-8b-cpt-sahabatai-v1-instruct # TIES needs the original base model
|
| 25 |
parameters:
|
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4953586328
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:32eaadc49913f7d8506f21c9d5cb70f503bd34e3782b8bfb366ccb7967862e8f
|
| 3 |
size 4953586328
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4999819232
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c45cf2cc7570f535be81bee0c61c50f2af8d34479920f6522aba72e30fb0ca6c
|
| 3 |
size 4999819232
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4915916048
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:610dbc3e6060835566c613adf58d5f58ce1162581661858e8a345a6b8729a005
|
| 3 |
size 4915916048
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1191234448
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5d7fd47c67b37742e89f0d16c224986a9af3001a6feec0e3348c648da2e48ae0
|
| 3 |
size 1191234448
|