tuandunghcmut committed on
Commit
da32300
·
verified ·
1 Parent(s): 926e3bc

Training in progress, step 3, checkpoint

Browse files
last-checkpoint/adapter_config.json CHANGED
@@ -24,13 +24,13 @@
24
  "rank_pattern": {},
25
  "revision": null,
26
  "target_modules": [
27
- "o_proj",
28
- "down_proj",
29
- "up_proj",
30
  "q_proj",
31
- "k_proj",
 
 
32
  "v_proj",
33
- "gate_proj"
 
34
  ],
35
  "task_type": "CAUSAL_LM",
36
  "trainable_token_indices": null,
 
24
  "rank_pattern": {},
25
  "revision": null,
26
  "target_modules": [
 
 
 
27
  "q_proj",
28
+ "down_proj",
29
+ "o_proj",
30
+ "gate_proj",
31
  "v_proj",
32
+ "up_proj",
33
+ "k_proj"
34
  ],
35
  "task_type": "CAUSAL_LM",
36
  "trainable_token_indices": null,
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:565b467fbbdbf25cc2bfa3c71f0bd336e8de28ad86df3918e596ca504bd31ced
3
  size 36981072
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96dc805f8ec4bd0e855d7adf77c4e5aeb8fccae1eb9b6a75e0b8cf80a66ca6b9
3
  size 36981072
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cf47764c7f0af2d260e514ff53be11a069fc1773d2d9785ce9f40fca8159f6f7
3
  size 74188650
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:111022490b414d8de24040a2def6d07ef67150fecce1d375dd858f5ead2d602f
3
  size 74188650
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:97fb176f598ac490ccae77ec442df96e8ad14280345b9f1e433afd80f74a6b78
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d2030b6fa4cba3b806c7bd50086686655d43925111f7c1f49e9476afbacf3c36
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b524f48acea96061f9e17824552379d210ce1c60f82e25c1280fb8b2df4b21f0
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3866b207848bde64e003e2009c19ad36b11cfa7e85afea28bcb9e78b9bbbc07c
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dcd240061f71d888d805feed14123a68774f5e130888a3057bdaa388caa9028c
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30c91fcbbb30d4ea264cde8e92f569f82e13868db72bdecd83da3096aa62b6fc
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,18 +2,18 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 1.0,
6
- "eval_steps": 10,
7
- "global_step": 1,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
11
  "log_history": [],
12
- "logging_steps": 10,
13
- "max_steps": 1,
14
  "num_input_tokens_seen": 0,
15
- "num_train_epochs": 1,
16
- "save_steps": 20,
17
  "stateful_callbacks": {
18
  "TrainerControl": {
19
  "args": {
@@ -26,7 +26,7 @@
26
  "attributes": {}
27
  }
28
  },
29
- "total_flos": 16214912925696.0,
30
  "train_batch_size": 16,
31
  "trial_name": null,
32
  "trial_params": null
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 3.0,
6
+ "eval_steps": 100,
7
+ "global_step": 3,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
11
  "log_history": [],
12
+ "logging_steps": 100,
13
+ "max_steps": 3,
14
  "num_input_tokens_seen": 0,
15
+ "num_train_epochs": 3,
16
+ "save_steps": 500,
17
  "stateful_callbacks": {
18
  "TrainerControl": {
19
  "args": {
 
26
  "attributes": {}
27
  }
28
  },
29
+ "total_flos": 1362052685758464.0,
30
  "train_batch_size": 16,
31
  "trial_name": null,
32
  "trial_params": null
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2a226bdb6c8f1d8a261b365e32993c518d7b102eea55ff51a4f3775eac230c30
3
- size 5496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:246f4beac515de39119f51ef65f2d1a9e068fb98a957786c00d690b3fe1de63e
3
+ size 5560