TirathP committed on
Commit
0f6a982
·
verified ·
1 Parent(s): dd1e850

Model save

Browse files
README.md CHANGED
@@ -40,7 +40,7 @@ The following hyperparameters were used during training:
40
  - seed: 42
41
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
42
  - lr_scheduler_type: linear
43
- - num_epochs: 30
44
 
45
  ### Training results
46
 
 
40
  - seed: 42
41
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
42
  - lr_scheduler_type: linear
43
+ - num_epochs: 50
44
 
45
  ### Training results
46
 
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
  "epoch": 30.0,
3
- "eval_accuracy": 0.42857142857142855,
4
- "eval_f1": 0.2852813852813853,
5
- "eval_loss": 0.9329891800880432,
6
- "eval_runtime": 9.6641,
7
- "eval_samples_per_second": 1.449,
8
- "eval_steps_per_second": 0.207,
9
- "train_loss": 1.0424017588297525,
10
- "train_runtime": 383.8523,
11
- "train_samples_per_second": 1.094,
12
  "train_steps_per_second": 0.078
13
  }
 
1
  {
2
  "epoch": 30.0,
3
+ "eval_accuracy": 0.7142857142857143,
4
+ "eval_f1": 0.4205128205128205,
5
+ "eval_loss": 0.4884902834892273,
6
+ "eval_runtime": 14.7003,
7
+ "eval_samples_per_second": 1.905,
8
+ "eval_steps_per_second": 0.272,
9
+ "train_loss": 0.6426682790120443,
10
+ "train_runtime": 770.3252,
11
+ "train_samples_per_second": 1.09,
12
  "train_steps_per_second": 0.078
13
  }
eval_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "epoch": 30.0,
3
- "eval_accuracy": 0.42857142857142855,
4
- "eval_f1": 0.2852813852813853,
5
- "eval_loss": 0.9329891800880432,
6
- "eval_runtime": 9.6641,
7
- "eval_samples_per_second": 1.449,
8
- "eval_steps_per_second": 0.207
9
  }
 
1
  {
2
  "epoch": 30.0,
3
+ "eval_accuracy": 0.7142857142857143,
4
+ "eval_f1": 0.4205128205128205,
5
+ "eval_loss": 0.4884902834892273,
6
+ "eval_runtime": 14.7003,
7
+ "eval_samples_per_second": 1.905,
8
+ "eval_steps_per_second": 0.272
9
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fe96c949e5ad21cb5a030a5afd86937f73a33e1b3fcf8a0bfe6731d9b92b2674
3
  size 343299757
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0960f1e93365b2283831adf2fe4bf2a1ea54d24d8123be323c62af70718434b
3
  size 343299757
train_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "epoch": 30.0,
3
- "train_loss": 1.0424017588297525,
4
- "train_runtime": 383.8523,
5
- "train_samples_per_second": 1.094,
6
  "train_steps_per_second": 0.078
7
  }
 
1
  {
2
  "epoch": 30.0,
3
+ "train_loss": 0.6426682790120443,
4
+ "train_runtime": 770.3252,
5
+ "train_samples_per_second": 1.09,
6
  "train_steps_per_second": 0.078
7
  }
trainer_state.json CHANGED
@@ -3,26 +3,26 @@
3
  "best_model_checkpoint": null,
4
  "epoch": 30.0,
5
  "eval_steps": 1000,
6
- "global_step": 30,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 30.0,
13
- "step": 30,
14
- "total_flos": 3.25492609849344e+16,
15
- "train_loss": 1.0424017588297525,
16
- "train_runtime": 383.8523,
17
- "train_samples_per_second": 1.094,
18
  "train_steps_per_second": 0.078
19
  }
20
  ],
21
  "logging_steps": 1000,
22
- "max_steps": 30,
23
  "num_train_epochs": 30,
24
  "save_steps": 1000,
25
- "total_flos": 3.25492609849344e+16,
26
  "trial_name": null,
27
  "trial_params": null
28
  }
 
3
  "best_model_checkpoint": null,
4
  "epoch": 30.0,
5
  "eval_steps": 1000,
6
+ "global_step": 60,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 30.0,
13
+ "step": 60,
14
+ "total_flos": 6.509968879067136e+16,
15
+ "train_loss": 0.6426682790120443,
16
+ "train_runtime": 770.3252,
17
+ "train_samples_per_second": 1.09,
18
  "train_steps_per_second": 0.078
19
  }
20
  ],
21
  "logging_steps": 1000,
22
+ "max_steps": 60,
23
  "num_train_epochs": 30,
24
  "save_steps": 1000,
25
+ "total_flos": 6.509968879067136e+16,
26
  "trial_name": null,
27
  "trial_params": null
28
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0cf2287a18cc72d9e06aacf3d85a4179b9a3cfbee45d74f8950c4b77d87c89af
3
  size 4027
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:11a92367af4ba92931d71cab3db55389b600af617d9d464e035d79e4ff4446ee
3
  size 4027