Training in progress, step 3, checkpoint
Browse files
- last-checkpoint/adapter_config.json +5 -5
- last-checkpoint/adapter_model.safetensors +1 -1
- last-checkpoint/optimizer.pt +1 -1
- last-checkpoint/rng_state.pth +1 -1
- last-checkpoint/scaler.pt +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +8 -8
- last-checkpoint/training_args.bin +2 -2
last-checkpoint/adapter_config.json
CHANGED
@@ -24,13 +24,13 @@
|
|
24 |
"rank_pattern": {},
|
25 |
"revision": null,
|
26 |
"target_modules": [
|
27 |
-
"o_proj",
|
28 |
-
"down_proj",
|
29 |
-
"up_proj",
|
30 |
"q_proj",
|
31 |
-
"
|
|
|
|
|
32 |
"v_proj",
|
33 |
-
"
|
|
|
34 |
],
|
35 |
"task_type": "CAUSAL_LM",
|
36 |
"trainable_token_indices": null,
|
|
|
24 |
"rank_pattern": {},
|
25 |
"revision": null,
|
26 |
"target_modules": [
|
|
|
|
|
|
|
27 |
"q_proj",
|
28 |
+
"down_proj",
|
29 |
+
"o_proj",
|
30 |
+
"gate_proj",
|
31 |
"v_proj",
|
32 |
+
"up_proj",
|
33 |
+
"k_proj"
|
34 |
],
|
35 |
"task_type": "CAUSAL_LM",
|
36 |
"trainable_token_indices": null,
|
last-checkpoint/adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 36981072
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:96dc805f8ec4bd0e855d7adf77c4e5aeb8fccae1eb9b6a75e0b8cf80a66ca6b9
|
3 |
size 36981072
|
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 74188650
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:111022490b414d8de24040a2def6d07ef67150fecce1d375dd858f5ead2d602f
|
3 |
size 74188650
|
last-checkpoint/rng_state.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14244
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d2030b6fa4cba3b806c7bd50086686655d43925111f7c1f49e9476afbacf3c36
|
3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 988
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3866b207848bde64e003e2009c19ad36b11cfa7e85afea28bcb9e78b9bbbc07c
|
3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:30c91fcbbb30d4ea264cde8e92f569f82e13868db72bdecd83da3096aa62b6fc
|
3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
@@ -2,18 +2,18 @@
|
|
2 |
"best_global_step": null,
|
3 |
"best_metric": null,
|
4 |
"best_model_checkpoint": null,
|
5 |
-
"epoch":
|
6 |
-
"eval_steps":
|
7 |
-
"global_step":
|
8 |
"is_hyper_param_search": false,
|
9 |
"is_local_process_zero": true,
|
10 |
"is_world_process_zero": true,
|
11 |
"log_history": [],
|
12 |
-
"logging_steps":
|
13 |
-
"max_steps":
|
14 |
"num_input_tokens_seen": 0,
|
15 |
-
"num_train_epochs":
|
16 |
-
"save_steps":
|
17 |
"stateful_callbacks": {
|
18 |
"TrainerControl": {
|
19 |
"args": {
|
@@ -26,7 +26,7 @@
|
|
26 |
"attributes": {}
|
27 |
}
|
28 |
},
|
29 |
-
"total_flos":
|
30 |
"train_batch_size": 16,
|
31 |
"trial_name": null,
|
32 |
"trial_params": null
|
|
|
2 |
"best_global_step": null,
|
3 |
"best_metric": null,
|
4 |
"best_model_checkpoint": null,
|
5 |
+
"epoch": 3.0,
|
6 |
+
"eval_steps": 100,
|
7 |
+
"global_step": 3,
|
8 |
"is_hyper_param_search": false,
|
9 |
"is_local_process_zero": true,
|
10 |
"is_world_process_zero": true,
|
11 |
"log_history": [],
|
12 |
+
"logging_steps": 100,
|
13 |
+
"max_steps": 3,
|
14 |
"num_input_tokens_seen": 0,
|
15 |
+
"num_train_epochs": 3,
|
16 |
+
"save_steps": 500,
|
17 |
"stateful_callbacks": {
|
18 |
"TrainerControl": {
|
19 |
"args": {
|
|
|
26 |
"attributes": {}
|
27 |
}
|
28 |
},
|
29 |
+
"total_flos": 1362052685758464.0,
|
30 |
"train_batch_size": 16,
|
31 |
"trial_name": null,
|
32 |
"trial_params": null
|
last-checkpoint/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:246f4beac515de39119f51ef65f2d1a9e068fb98a957786c00d690b3fe1de63e
|
3 |
+
size 5560
|