Training in progress, epoch 1

Files changed (7) hide show

adapter_config.json CHANGED Viewed

@@ -1,7 +1,10 @@
 {
   "alpha_pattern": {},
-  "auto_mapping": null,
-  "base_model_name_or_path": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B",
   "bias": "none",
   "corda_config": null,
   "eva_config": null,
@@ -13,7 +16,7 @@
   "layers_pattern": null,
   "layers_to_transform": null,
   "loftq_config": {},
-  "lora_alpha": 8,
   "lora_bias": false,
   "lora_dropout": 0.05,
   "megatron_config": null,
@@ -23,19 +26,22 @@
     "embed_tokens"
   ],
   "peft_type": "LORA",
-  "r": 8,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "q_proj",
-    "up_proj",
     "gate_proj",
-    "v_proj",
     "o_proj",
     "k_proj",
-    "down_proj"
   ],
-  "task_type": "CAUSAL_LM",
   "trainable_token_indices": null,
   "use_dora": false,
   "use_rslora": false

 {
   "alpha_pattern": {},
+  "auto_mapping": {
+    "base_model_class": "Gemma3ForConditionalGeneration",
+    "parent_library": "transformers.models.gemma3.modeling_gemma3"
+  },
+  "base_model_name_or_path": "google/gemma-3-27b-it",
   "bias": "none",
   "corda_config": null,
   "eva_config": null,
   "layers_pattern": null,
   "layers_to_transform": null,
   "loftq_config": {},
+  "lora_alpha": 16,
   "lora_bias": false,
   "lora_dropout": 0.05,
   "megatron_config": null,
     "embed_tokens"
   ],
   "peft_type": "LORA",
+  "r": 16,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
+    "out_proj",
+    "fc2",
+    "down_proj",
     "gate_proj",
+    "up_proj",
+    "fc1",
     "o_proj",
     "k_proj",
+    "v_proj",
+    "q_proj"
   ],
+  "task_type": null,
   "trainable_token_indices": null,
   "use_dora": false,
   "use_rslora": false

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3103739f20055b097aa7e8eb1f5835b25753fb77386dc4c348b868c0bf7a5224
-size 3382826216

 version https://git-lfs.github.com/spec/v1
+oid sha256:740908d9140c8ef11d44c015ad7e4fc8c06f674d02e721c5f96dc9aab4109742
+size 6127551176

runs/May05_07-34-31_code-smells-gpu/events.out.tfevents.1746430489.code-smells-gpu.5094.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:131cda81cb0d1aa7a3952614df76588a9f4c723bb1f195fc5835e160e5128f7f
+size 18286

special_tokens_map.json CHANGED Viewed

@@ -1,20 +1,30 @@
 {
   "bos_token": {
-    "content": "<｜begin▁of▁sentence｜>",
     "lstrip": false,
     "normalized": false,
     "rstrip": false,
     "single_word": false
   },
   "eos_token": {
-    "content": "<｜end▁of▁sentence｜>",
     "lstrip": false,
     "normalized": false,
     "rstrip": false,
     "single_word": false
   },
   "pad_token": {
-    "content": "<｜end▁of▁sentence｜>",
     "lstrip": false,
     "normalized": false,
     "rstrip": false,

 {
+  "boi_token": "<start_of_image>",
   "bos_token": {
+    "content": "<bos>",
     "lstrip": false,
     "normalized": false,
     "rstrip": false,
     "single_word": false
   },
+  "eoi_token": "<end_of_image>",
   "eos_token": {
+    "content": "<eos>",
     "lstrip": false,
     "normalized": false,
     "rstrip": false,
     "single_word": false
   },
+  "image_token": "<image_soft_token>",
   "pad_token": {
+    "content": "<pad>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "unk_token": {
+    "content": "<unk>",
     "lstrip": false,
     "normalized": false,
     "rstrip": false,

tokenizer.json CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893
-size 11422778

 version https://git-lfs.github.com/spec/v1
+oid sha256:4667f2089529e8e7657cfb6d1c19910ae71ff5f28aa7ab2ff2763330affad795
+size 33384568

tokenizer_config.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e755e1fb8c5b095b9aa2eb663b64de0c6ac5602912cbaba6997903f592fc8e6b
 size 5816

 version https://git-lfs.github.com/spec/v1
+oid sha256:bb68ee0a206c5ab6f71dbae93b6c2ba860e5f97388483e3c285141814c228dca
 size 5816