mkopecki committed on
Commit
1fb1140
1 Parent(s): 0187f02

End of training

Browse files
Files changed (1) hide show
  1. trainer_state.json +16 -9
trainer_state.json CHANGED
@@ -3,23 +3,30 @@
3
  "best_model_checkpoint": null,
4
  "epoch": 3.0,
5
  "eval_steps": 500,
6
- "global_step": 192,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
 
 
 
 
 
 
 
11
  {
12
  "epoch": 3.0,
13
- "step": 192,
14
- "total_flos": 2.031101718065971e+16,
15
- "train_loss": 0.5815114180246989,
16
- "train_runtime": 555.1073,
17
- "train_samples_per_second": 5.502,
18
- "train_steps_per_second": 0.346
19
  }
20
  ],
21
  "logging_steps": 500,
22
- "max_steps": 192,
23
  "num_input_tokens_seen": 0,
24
  "num_train_epochs": 3,
25
  "save_steps": 500,
@@ -35,7 +42,7 @@
35
  "attributes": {}
36
  }
37
  },
38
- "total_flos": 2.031101718065971e+16,
39
  "train_batch_size": 16,
40
  "trial_name": null,
41
  "trial_params": null
 
3
  "best_model_checkpoint": null,
4
  "epoch": 3.0,
5
  "eval_steps": 500,
6
+ "global_step": 654,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
+ {
12
+ "epoch": 2.293577981651376,
13
+ "grad_norm": 0.8083828687667847,
14
+ "learning_rate": 1.1773700305810397e-05,
15
+ "loss": 0.5038,
16
+ "step": 500
17
+ },
18
  {
19
  "epoch": 3.0,
20
+ "step": 654,
21
+ "total_flos": 6.243879793095475e+16,
22
+ "train_loss": 0.462136259866417,
23
+ "train_runtime": 1671.2602,
24
+ "train_samples_per_second": 6.24,
25
+ "train_steps_per_second": 0.391
26
  }
27
  ],
28
  "logging_steps": 500,
29
+ "max_steps": 654,
30
  "num_input_tokens_seen": 0,
31
  "num_train_epochs": 3,
32
  "save_steps": 500,
 
42
  "attributes": {}
43
  }
44
  },
45
+ "total_flos": 6.243879793095475e+16,
46
  "train_batch_size": 16,
47
  "trial_name": null,
48
  "trial_params": null