{ "best_global_step": null, "best_metric": 1.4674878120422363, "best_model_checkpoint": "/home/haji80as/invariant-LM2/Meditron-7B-merged-server-10000/checkpoint-10000", "epoch": null, "eval_steps": 500, "global_step": 0, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "eval_loss": 1.4994444847106934, "eval_model_preparation_time": 0.0249, "eval_runtime": 667.7395, "eval_samples_per_second": 13.7, "eval_steps_per_second": 1.713, "step": 0 }, { "eval_loss": 1.4994444847106934, "eval_model_preparation_time": 0.0249, "eval_runtime": 667.7395, "eval_samples_per_second": 13.7, "eval_steps_per_second": 1.713, "step": 0 }, { "eval_loss": 1.4910725355148315, "eval_model_preparation_time": 0.0249, "eval_runtime": 667.2398, "eval_samples_per_second": 13.71, "eval_steps_per_second": 1.715, "step": 0 }, { "eval_loss": 1.4910725355148315, "eval_model_preparation_time": 0.0249, "eval_runtime": 667.2398, "eval_samples_per_second": 13.71, "eval_steps_per_second": 1.715, "step": 0 }, { "eval_loss": 1.4851367473602295, "eval_model_preparation_time": 0.0249, "eval_runtime": 667.3243, "eval_samples_per_second": 13.708, "eval_steps_per_second": 1.714, "step": 0 }, { "eval_loss": 1.4851367473602295, "eval_model_preparation_time": 0.0249, "eval_runtime": 667.3243, "eval_samples_per_second": 13.708, "eval_steps_per_second": 1.714, "step": 0 }, { "eval_loss": 1.4799472093582153, "eval_model_preparation_time": 0.0249, "eval_runtime": 671.5587, "eval_samples_per_second": 13.622, "eval_steps_per_second": 1.703, "step": 0 }, { "eval_loss": 1.4799472093582153, "eval_model_preparation_time": 0.0249, "eval_runtime": 671.5587, "eval_samples_per_second": 13.622, "eval_steps_per_second": 1.703, "step": 0 }, { "eval_loss": 1.4777600765228271, "eval_model_preparation_time": 0.0249, "eval_runtime": 670.9932, "eval_samples_per_second": 13.634, "eval_steps_per_second": 1.705, "step": 0 }, { "eval_loss": 1.4777600765228271, "eval_model_preparation_time": 0.0249, "eval_runtime": 670.9932, "eval_samples_per_second": 13.634, "eval_steps_per_second": 1.705, "step": 0 }, { "eval_loss": 1.475777506828308, "eval_model_preparation_time": 0.0249, "eval_runtime": 667.3706, "eval_samples_per_second": 13.708, "eval_steps_per_second": 1.714, "step": 0 }, { "eval_loss": 1.475777506828308, "eval_model_preparation_time": 0.0249, "eval_runtime": 667.3706, "eval_samples_per_second": 13.708, "eval_steps_per_second": 1.714, "step": 0 }, { "eval_loss": 1.4755457639694214, "eval_model_preparation_time": 0.0249, "eval_runtime": 667.3253, "eval_samples_per_second": 13.708, "eval_steps_per_second": 1.714, "step": 0 }, { "eval_loss": 1.4755457639694214, "eval_model_preparation_time": 0.0249, "eval_runtime": 667.3253, "eval_samples_per_second": 13.708, "eval_steps_per_second": 1.714, "step": 0 }, { "eval_loss": 1.4759819507598877, "eval_model_preparation_time": 0.0249, "eval_runtime": 668.1701, "eval_samples_per_second": 13.691, "eval_steps_per_second": 1.712, "step": 0 }, { "eval_loss": 1.4759819507598877, "eval_model_preparation_time": 0.0249, "eval_runtime": 668.1701, "eval_samples_per_second": 13.691, "eval_steps_per_second": 1.712, "step": 0 }, { "eval_loss": 1.4732918739318848, "eval_model_preparation_time": 0.0249, "eval_runtime": 672.4922, "eval_samples_per_second": 13.603, "eval_steps_per_second": 1.701, "step": 0 }, { "eval_loss": 1.4732918739318848, "eval_model_preparation_time": 0.0249, "eval_runtime": 672.4922, "eval_samples_per_second": 13.603, "eval_steps_per_second": 1.701, "step": 0 }, { "eval_loss": 1.474392294883728, "eval_model_preparation_time": 0.0249, "eval_runtime": 672.3492, "eval_samples_per_second": 13.606, "eval_steps_per_second": 1.701, "step": 0 }, { "eval_loss": 1.474392294883728, "eval_model_preparation_time": 0.0249, "eval_runtime": 672.3492, "eval_samples_per_second": 13.606, "eval_steps_per_second": 1.701, "step": 0 }, { "eval_loss": 1.4730381965637207, "eval_model_preparation_time": 0.0249, "eval_runtime": 667.5252, "eval_samples_per_second": 13.704, "eval_steps_per_second": 1.714, "step": 0 }, { "eval_loss": 1.4730381965637207, "eval_model_preparation_time": 0.0249, "eval_runtime": 667.5252, "eval_samples_per_second": 13.704, "eval_steps_per_second": 1.714, "step": 0 }, { "eval_loss": 1.471816062927246, "eval_model_preparation_time": 0.0249, "eval_runtime": 667.2797, "eval_samples_per_second": 13.709, "eval_steps_per_second": 1.714, "step": 0 }, { "eval_loss": 1.471816062927246, "eval_model_preparation_time": 0.0249, "eval_runtime": 667.2797, "eval_samples_per_second": 13.709, "eval_steps_per_second": 1.714, "step": 0 }, { "eval_loss": 1.4706984758377075, "eval_model_preparation_time": 0.0249, "eval_runtime": 667.7394, "eval_samples_per_second": 13.7, "eval_steps_per_second": 1.713, "step": 0 }, { "eval_loss": 1.4706984758377075, "eval_model_preparation_time": 0.0249, "eval_runtime": 667.7394, "eval_samples_per_second": 13.7, "eval_steps_per_second": 1.713, "step": 0 }, { "eval_loss": 1.4707434177398682, "eval_model_preparation_time": 0.0249, "eval_runtime": 671.0524, "eval_samples_per_second": 13.632, "eval_steps_per_second": 1.705, "step": 0 }, { "eval_loss": 1.4707434177398682, "eval_model_preparation_time": 0.0249, "eval_runtime": 671.0524, "eval_samples_per_second": 13.632, "eval_steps_per_second": 1.705, "step": 0 }, { "eval_loss": 1.4697192907333374, "eval_model_preparation_time": 0.0249, "eval_runtime": 667.4022, "eval_samples_per_second": 13.707, "eval_steps_per_second": 1.714, "step": 0 }, { "eval_loss": 1.4697192907333374, "eval_model_preparation_time": 0.0249, "eval_runtime": 667.4022, "eval_samples_per_second": 13.707, "eval_steps_per_second": 1.714, "step": 0 }, { "eval_loss": 1.4680581092834473, "eval_model_preparation_time": 0.0249, "eval_runtime": 667.3169, "eval_samples_per_second": 13.709, "eval_steps_per_second": 1.714, "step": 0 }, { "eval_loss": 1.4680581092834473, "eval_model_preparation_time": 0.0249, "eval_runtime": 667.3169, "eval_samples_per_second": 13.709, "eval_steps_per_second": 1.714, "step": 0 }, { "eval_loss": 1.4677343368530273, "eval_model_preparation_time": 0.0249, "eval_runtime": 667.6752, "eval_samples_per_second": 13.701, "eval_steps_per_second": 1.713, "step": 0 }, { "eval_loss": 1.4677343368530273, "eval_model_preparation_time": 0.0249, "eval_runtime": 667.6752, "eval_samples_per_second": 13.701, "eval_steps_per_second": 1.713, "step": 0 }, { "eval_loss": 1.4676560163497925, "eval_model_preparation_time": 0.0249, "eval_runtime": 674.8107, "eval_samples_per_second": 13.556, "eval_steps_per_second": 1.695, "step": 0 }, { "eval_loss": 1.4676560163497925, "eval_model_preparation_time": 0.0249, "eval_runtime": 674.8107, "eval_samples_per_second": 13.556, "eval_steps_per_second": 1.695, "step": 0 }, { "eval_loss": 1.4675045013427734, "eval_model_preparation_time": 0.0249, "eval_runtime": 672.511, "eval_samples_per_second": 13.603, "eval_steps_per_second": 1.701, "step": 0 }, { "eval_loss": 1.4675045013427734, "eval_model_preparation_time": 0.0249, "eval_runtime": 672.511, "eval_samples_per_second": 13.603, "eval_steps_per_second": 1.701, "step": 0 }, { "eval_loss": 1.4674878120422363, "eval_model_preparation_time": 0.0249, "eval_runtime": 667.5226, "eval_samples_per_second": 13.704, "eval_steps_per_second": 1.714, "step": 0 }, { "eval_loss": 1.4674878120422363, "eval_model_preparation_time": 0.0249, "eval_runtime": 667.5226, "eval_samples_per_second": 13.704, "eval_steps_per_second": 1.714, "step": 0 } ], "logging_steps": 500, "max_steps": 0, "num_input_tokens_seen": 0, "num_train_epochs": 0, "save_steps": 500, "stateful_callbacks": {}, "total_flos": 0, "train_batch_size": null, "trial_name": null, "trial_params": null }