| { | |
| "best_metric": null, | |
| "best_model_checkpoint": null, | |
| "epoch": 2.998504843008516, | |
| "global_step": 1440, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 1.0, | |
| "eval_accuracy": 0.42351716961498437, | |
| "eval_accuracy_0": 0.7588532883642496, | |
| "eval_accuracy_1": 0.046094750320102434, | |
| "eval_accuracy_2": 0.5985401459854015, | |
| "eval_loss": 0.80291348695755, | |
| "eval_runtime": 24.8435, | |
| "eval_samples_per_second": 77.364, | |
| "eval_steps_per_second": 77.364, | |
| "step": 480 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "eval_accuracy": 0.4011446409989594, | |
| "eval_accuracy_0": 0.7470489038785835, | |
| "eval_accuracy_1": 0.18309859154929578, | |
| "eval_accuracy_2": 0.3375912408759124, | |
| "eval_loss": 0.7574263215065002, | |
| "eval_runtime": 24.6349, | |
| "eval_samples_per_second": 78.019, | |
| "eval_steps_per_second": 78.019, | |
| "step": 960 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "eval_accuracy": 0.40790842872008326, | |
| "eval_accuracy_0": 0.8026981450252951, | |
| "eval_accuracy_1": 0.18693982074263765, | |
| "eval_accuracy_2": 0.2956204379562044, | |
| "eval_loss": 0.7730965614318848, | |
| "eval_runtime": 24.5617, | |
| "eval_samples_per_second": 78.252, | |
| "eval_steps_per_second": 78.252, | |
| "step": 1440 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "step": 1440, | |
| "total_flos": 2507409848941452.0, | |
| "train_loss": 0.7177374945746527, | |
| "train_runtime": 2670.6543, | |
| "train_samples_per_second": 17.28, | |
| "train_steps_per_second": 0.539 | |
| } | |
| ], | |
| "max_steps": 1440, | |
| "num_train_epochs": 3, | |
| "total_flos": 2507409848941452.0, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |