Update README.md
Browse files
README.md
CHANGED
|
@@ -1,3 +1,95 @@
|
|
| 1 |
-
---
|
| 2 |
-
license: llama3
|
| 3 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
---
|
| 2 |
+
license: llama3
|
| 3 |
+
language:
|
| 4 |
+
- en
|
| 5 |
+
library_name: transformers
|
| 6 |
+
pipeline_tag: text-generation
|
| 7 |
+
datasets:
|
| 8 |
+
- cognitivecomputations/WizardLM_alpaca_evol_instruct_70k_unfiltered
|
| 9 |
+
tags:
|
| 10 |
+
- finetune
|
| 11 |
+
- llama
|
| 12 |
+
---
|
| 13 |
+
# WizardHermes-2-Pro-Llama-3-8b
|
| 14 |
+
Fine-tuned from Meta-Llama-3-8B, 0.55 epochs
|
| 15 |
+
|
| 16 |
+
Merged with Hermes-2-Pro-Llama-3-8b
|
| 17 |
+
|
| 18 |
+
Eval (0.0 temp), based on the [MMLU example questions](https://inflection.ai/assets/MMLU-Examples.pdf):
|
| 19 |
+
```
|
| 20 |
+
Hermes 2 Pro LoRA (merged) (checkpoint 1): 7/12
|
| 21 |
+
Hermes 2 Pro LoRA (merged) (checkpoint 2): 9/12
|
| 22 |
+
Hermes 2 Pro Llama 3 8b: 8/12
|
| 23 |
+
```
|
| 24 |
+
|
| 25 |
+
Trained using MonsterAPI
|
| 26 |
+
|
| 27 |
+
LoRA training parameters:
|
| 28 |
+
```
|
| 29 |
+
{
|
| 30 |
+
"deployment_name": "wizardlm-llama-3-8b",
|
| 31 |
+
"pretrainedmodel_config": {
|
| 32 |
+
"model_path": "meta-llama/Meta-Llama-3-8B",
|
| 33 |
+
"other_model_info": null,
|
| 34 |
+
"resume_checkpoint_path": "",
|
| 35 |
+
"use_lora": true,
|
| 36 |
+
"lora_r": 8,
|
| 37 |
+
"lora_alpha": 16,
|
| 38 |
+
"lora_dropout": 0,
|
| 39 |
+
"lora_bias": "none",
|
| 40 |
+
"use_quantization": false,
|
| 41 |
+
"use_gradient_checkpointing": false,
|
| 42 |
+
"parallelization": "nmp"
|
| 43 |
+
},
|
| 44 |
+
"data_config": {
|
| 45 |
+
"data_path": "cognitivecomputations/WizardLM_alpaca_evol_instruct_70k_unfiltered",
|
| 46 |
+
"data_subset": "default",
|
| 47 |
+
"data_source_type": "hub_link",
|
| 48 |
+
"cutoff_len": 4096,
|
| 49 |
+
"data_split_config": {
|
| 50 |
+
"train": 0.9,
|
| 51 |
+
"validation": 0.1
|
| 52 |
+
},
|
| 53 |
+
"prevalidated": true,
|
| 54 |
+
"concat_config": {
|
| 55 |
+
"0": {
|
| 56 |
+
"text": "Below is an instruction that describes a task. Write a response that appropriately completes the request. \n\n\n###Instruction:",
|
| 57 |
+
"column": false
|
| 58 |
+
},
|
| 59 |
+
"1": {
|
| 60 |
+
"text": "instruction",
|
| 61 |
+
"column": true
|
| 62 |
+
},
|
| 63 |
+
"2": {
|
| 64 |
+
"text": "\n\n\n###Response:",
|
| 65 |
+
"column": false
|
| 66 |
+
},
|
| 67 |
+
"3": {
|
| 68 |
+
"text": "output",
|
| 69 |
+
"column": true
|
| 70 |
+
}
|
| 71 |
+
}
|
| 72 |
+
},
|
| 73 |
+
"training_config": {
|
| 74 |
+
"early_stopping_patience": 5,
|
| 75 |
+
"num_train_epochs": 5,
|
| 76 |
+
"gradient_accumulation_steps": 1,
|
| 77 |
+
"warmup_steps": 300,
|
| 78 |
+
"learning_rate": 0.0005,
|
| 79 |
+
"lr_scheduler_type": "reduce_lr_on_plateau",
|
| 80 |
+
"group_by_length": false,
|
| 81 |
+
"use_hugging_face": false
|
| 82 |
+
},
|
| 83 |
+
"logging_config": {
|
| 84 |
+
"use_wandb": false,
|
| 85 |
+
"wandb_username": "",
|
| 86 |
+
"wandb_login_key": "",
|
| 87 |
+
"wandb_project": "",
|
| 88 |
+
"wandb_run_name": ""
|
| 89 |
+
},
|
| 90 |
+
"accessorytasks_config": {
|
| 91 |
+
"run_eval_report": false,
|
| 92 |
+
"run_quantize_merge": false
|
| 93 |
+
}
|
| 94 |
+
}
|
| 95 |
+
```
|