[ { "epoch": 1, "train_loss": 0.2136226908833373, "lr": 9.045084971874738e-05, "val_loss": 0.14677325149273707, "val_loss_pos": NaN, "val_loss_neg": 0.14677325149273707, "val_n_pos": 0, "val_n_neg": 2160, "val_conditioning_accuracy": 0.537962962962963, "val_conditioning_gap": 6.71636889617528e-05, "val_conditioning_gap_pos": NaN, "val_conditioning_gap_neg": 6.71636889617528e-05, "val_adv_episode_alignment": 0.5, "val_alignment_on_success": 0.0, "val_alignment_on_failure": 1.0 }, { "epoch": 2, "train_loss": 0.12027364674882561, "lr": 5.920084971874737e-05, "val_loss": 0.11876977328992963, "val_loss_pos": NaN, "val_loss_neg": 0.11876977328992963, "val_n_pos": 0, "val_n_neg": 2144, "val_conditioning_accuracy": 0.0, "val_conditioning_gap": 0.0, "val_conditioning_gap_pos": NaN, "val_conditioning_gap_neg": 0.0, "val_adv_episode_alignment": 0.503731343283582, "val_alignment_on_success": 0.0, "val_alignment_on_failure": 1.0 }, { "epoch": 3, "train_loss": 0.09871727271139265, "lr": 3.125e-05, "val_loss": 0.0028377454727888107, "val_loss_pos": NaN, "val_loss_neg": 0.0028377454727888107, "val_n_pos": 0, "val_n_neg": 8, "val_conditioning_accuracy": 0.0, "val_conditioning_gap": 0.0, "val_conditioning_gap_pos": NaN, "val_conditioning_gap_neg": 0.0, "val_adv_episode_alignment": 1.0, "val_alignment_on_success": NaN, "val_alignment_on_failure": 1.0 }, { "epoch": 4, "train_loss": 0.08717213855802503, "lr": 8.63728757031316e-06, "val_loss": 0.1139170856033872, "val_loss_pos": NaN, "val_loss_neg": 0.1139170856033872, "val_n_pos": 0, "val_n_neg": 2128, "val_conditioning_accuracy": 0.0, "val_conditioning_gap": 0.0, "val_conditioning_gap_pos": NaN, "val_conditioning_gap_neg": 0.0, "val_adv_episode_alignment": 0.5075187969924813, "val_alignment_on_success": 0.0, "val_alignment_on_failure": 1.0 }, { "epoch": 5, "train_loss": 0.08140311014763038, "lr": 0.0, "val_loss": 0.001793158007785678, "val_loss_pos": NaN, "val_loss_neg": 0.001793158007785678, "val_n_pos": 0, "val_n_neg": 8, "val_conditioning_accuracy": 0.0, "val_conditioning_gap": 0.0, "val_conditioning_gap_pos": NaN, "val_conditioning_gap_neg": 0.0, "val_adv_episode_alignment": 1.0, "val_alignment_on_success": NaN, "val_alignment_on_failure": 1.0 } ]