{ "best_metric": 0.43329915404319763, "best_model_checkpoint": "mobilebert_sa_GLUE_Experiment_sst2_256/checkpoint-527", "epoch": 6.0, "global_step": 3162, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "learning_rate": 4.9e-05, "loss": 0.4969, "step": 527 }, { "epoch": 1.0, "eval_accuracy": 0.801605504587156, "eval_loss": 0.43329915404319763, "eval_runtime": 1.9711, "eval_samples_per_second": 442.394, "eval_steps_per_second": 3.551, "step": 527 }, { "epoch": 2.0, "learning_rate": 4.8e-05, "loss": 0.2781, "step": 1054 }, { "epoch": 2.0, "eval_accuracy": 0.783256880733945, "eval_loss": 0.49986955523490906, "eval_runtime": 1.9746, "eval_samples_per_second": 441.601, "eval_steps_per_second": 3.545, "step": 1054 }, { "epoch": 3.0, "learning_rate": 4.7e-05, "loss": 0.2274, "step": 1581 }, { "epoch": 3.0, "eval_accuracy": 0.7924311926605505, "eval_loss": 0.4782297611236572, "eval_runtime": 1.9765, "eval_samples_per_second": 441.178, "eval_steps_per_second": 3.542, "step": 1581 }, { "epoch": 4.0, "learning_rate": 4.600000000000001e-05, "loss": 0.2, "step": 2108 }, { "epoch": 4.0, "eval_accuracy": 0.7935779816513762, "eval_loss": 0.5582388043403625, "eval_runtime": 1.9778, "eval_samples_per_second": 440.902, "eval_steps_per_second": 3.539, "step": 2108 }, { "epoch": 5.0, "learning_rate": 4.5e-05, "loss": 0.1835, "step": 2635 }, { "epoch": 5.0, "eval_accuracy": 0.7912844036697247, "eval_loss": 0.4966583251953125, "eval_runtime": 1.9757, "eval_samples_per_second": 441.36, "eval_steps_per_second": 3.543, "step": 2635 }, { "epoch": 6.0, "learning_rate": 4.4000000000000006e-05, "loss": 0.1708, "step": 3162 }, { "epoch": 6.0, "eval_accuracy": 0.7855504587155964, "eval_loss": 0.5061066746711731, "eval_runtime": 1.9793, "eval_samples_per_second": 440.565, "eval_steps_per_second": 3.537, "step": 3162 }, { "epoch": 6.0, "step": 3162, "total_flos": 1.0644300396232704e+16, "train_loss": 0.25946182453654976, "train_runtime": 2837.2785, "train_samples_per_second": 1186.859, "train_steps_per_second": 9.287 } ], "max_steps": 26350, "num_train_epochs": 50, "total_flos": 1.0644300396232704e+16, "trial_name": null, "trial_params": null }