checkpoint-500/trainer_state.json
486 B · 23 lines · json Raw
1 {
2 "best_metric": null,
3 "best_model_checkpoint": null,
4 "epoch": 2.1645021645021645,
5 "global_step": 500,
6 "is_hyper_param_search": false,
7 "is_local_process_zero": true,
8 "is_world_process_zero": true,
9 "log_history": [
10 {
11 "epoch": 2.16,
12 "learning_rate": 1.3924963924963927e-05,
13 "loss": 1.2342,
14 "step": 500
15 }
16 ],
17 "max_steps": 693,
18 "num_train_epochs": 3,
19 "total_flos": 2.565976886136013e+16,
20 "trial_name": null,
21 "trial_params": null
22 }
23