{ "best_metric": 0.7296723842255801, "best_model_checkpoint": "/tmp/albrechtje/models/EuroBERT-610m-OnCoCo-DE-EN-cv5-4/checkpoint-4170", "epoch": 15.0, "eval_steps": 500, "global_step": 4170, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_accuracy": 0.6627697841726619, "eval_accuracy_at_2": 0.7760791366906474, "eval_f1_macro": 0.5673126678314325, "eval_f1_macro_at_2": 0.7091318813784219, "eval_f1_micro": 0.6627697841726619, "eval_f1_weighted": 0.63249956992534, "eval_f1_weighted_at_2": 0.7524547845490651, "eval_loss": 1.2793892621994019, "eval_precision_weighted": 0.669000429503669, "eval_recall_weighted": 0.6627697841726619, "eval_runtime": 1.7261, "eval_samples_per_second": 644.24, "eval_steps_per_second": 40.555, "step": 278 }, { "epoch": 2.0, "eval_accuracy": 0.72931654676259, "eval_accuracy_at_2": 0.8336330935251799, "eval_f1_macro": 0.6752844759784321, "eval_f1_macro_at_2": 0.7940592529446071, "eval_f1_micro": 0.72931654676259, "eval_f1_weighted": 0.7221504602673161, "eval_f1_weighted_at_2": 0.8291369609268844, "eval_loss": 1.0086288452148438, "eval_precision_weighted": 0.7405142921497202, "eval_recall_weighted": 0.72931654676259, "eval_runtime": 1.7288, "eval_samples_per_second": 643.233, "eval_steps_per_second": 40.491, "step": 556 }, { "epoch": 3.0, "eval_accuracy": 0.7212230215827338, "eval_accuracy_at_2": 0.8345323741007195, "eval_f1_macro": 0.6694806632511426, "eval_f1_macro_at_2": 0.7980059444324954, "eval_f1_micro": 0.7212230215827338, "eval_f1_weighted": 0.7132639102071889, "eval_f1_weighted_at_2": 0.8298102085427823, "eval_loss": 1.348330020904541, "eval_precision_weighted": 0.7421885381816703, "eval_recall_weighted": 0.7212230215827338, "eval_runtime": 1.727, "eval_samples_per_second": 643.898, "eval_steps_per_second": 40.533, "step": 834 }, { "epoch": 4.0, "eval_accuracy": 0.710431654676259, "eval_accuracy_at_2": 0.8201438848920863, "eval_f1_macro": 0.6428369535361947, "eval_f1_macro_at_2": 0.7724504347113151, "eval_f1_micro": 0.710431654676259, "eval_f1_weighted": 0.7023716437139816, "eval_f1_weighted_at_2": 0.8169418213636089, "eval_loss": 1.4498661756515503, "eval_precision_weighted": 0.7370210870156869, "eval_recall_weighted": 0.710431654676259, "eval_runtime": 1.7263, "eval_samples_per_second": 644.146, "eval_steps_per_second": 40.549, "step": 1112 }, { "epoch": 5.0, "eval_accuracy": 0.7526978417266187, "eval_accuracy_at_2": 0.8345323741007195, "eval_f1_macro": 0.7060210555194106, "eval_f1_macro_at_2": 0.7886937000135417, "eval_f1_micro": 0.7526978417266187, "eval_f1_weighted": 0.7445654944821934, "eval_f1_weighted_at_2": 0.8272173955832338, "eval_loss": 1.519242763519287, "eval_precision_weighted": 0.7635093083360639, "eval_recall_weighted": 0.7526978417266187, "eval_runtime": 1.7213, "eval_samples_per_second": 646.039, "eval_steps_per_second": 40.668, "step": 1390 }, { "epoch": 6.0, "eval_accuracy": 0.7607913669064749, "eval_accuracy_at_2": 0.8408273381294964, "eval_f1_macro": 0.7039156582368327, "eval_f1_macro_at_2": 0.8019994977140246, "eval_f1_micro": 0.7607913669064749, "eval_f1_weighted": 0.7482322239414279, "eval_f1_weighted_at_2": 0.8312668948558287, "eval_loss": 1.4991692304611206, "eval_precision_weighted": 0.7621139615324087, "eval_recall_weighted": 0.7607913669064749, "eval_runtime": 1.7258, "eval_samples_per_second": 644.344, "eval_steps_per_second": 40.561, "step": 1668 }, { "epoch": 7.0, "eval_accuracy": 0.7634892086330936, "eval_accuracy_at_2": 0.8471223021582733, "eval_f1_macro": 0.6955317878216288, "eval_f1_macro_at_2": 0.8166191291309608, "eval_f1_micro": 0.7634892086330936, "eval_f1_weighted": 0.7510041672314496, "eval_f1_weighted_at_2": 0.8393077322569914, "eval_loss": 1.458231806755066, "eval_precision_weighted": 0.7645201130407223, "eval_recall_weighted": 0.7634892086330936, "eval_runtime": 1.7249, "eval_samples_per_second": 644.66, "eval_steps_per_second": 40.581, "step": 1946 }, { "epoch": 8.0, "eval_accuracy": 0.7598920863309353, "eval_accuracy_at_2": 0.8390287769784173, "eval_f1_macro": 0.696096379087516, "eval_f1_macro_at_2": 0.7932741388611341, "eval_f1_micro": 0.7598920863309353, "eval_f1_weighted": 0.7495980185543826, "eval_f1_weighted_at_2": 0.8326274963561894, "eval_loss": 1.6272355318069458, "eval_precision_weighted": 0.7659418585582665, "eval_recall_weighted": 0.7598920863309353, "eval_runtime": 1.7261, "eval_samples_per_second": 644.237, "eval_steps_per_second": 40.555, "step": 2224 }, { "epoch": 9.0, "eval_accuracy": 0.7589928057553957, "eval_accuracy_at_2": 0.841726618705036, "eval_f1_macro": 0.6987893288312187, "eval_f1_macro_at_2": 0.7996666859632781, "eval_f1_micro": 0.7589928057553957, "eval_f1_weighted": 0.7497801021327636, "eval_f1_weighted_at_2": 0.8366448594401756, "eval_loss": 1.580078363418579, "eval_precision_weighted": 0.7588850641113337, "eval_recall_weighted": 0.7589928057553957, "eval_runtime": 1.7262, "eval_samples_per_second": 644.198, "eval_steps_per_second": 40.552, "step": 2502 }, { "epoch": 10.0, "eval_accuracy": 0.7634892086330936, "eval_accuracy_at_2": 0.8435251798561151, "eval_f1_macro": 0.7009618080826578, "eval_f1_macro_at_2": 0.8139765719876315, "eval_f1_micro": 0.7634892086330936, "eval_f1_weighted": 0.7525198049149984, "eval_f1_weighted_at_2": 0.835374733368227, "eval_loss": 1.601148247718811, "eval_precision_weighted": 0.7626619291141639, "eval_recall_weighted": 0.7634892086330936, "eval_runtime": 1.7254, "eval_samples_per_second": 644.475, "eval_steps_per_second": 40.569, "step": 2780 }, { "epoch": 11.0, "eval_accuracy": 0.7616906474820144, "eval_accuracy_at_2": 0.841726618705036, "eval_f1_macro": 0.7125412813321691, "eval_f1_macro_at_2": 0.8049568408480121, "eval_f1_micro": 0.7616906474820144, "eval_f1_weighted": 0.753426103516513, "eval_f1_weighted_at_2": 0.8365198042850269, "eval_loss": 1.5725866556167603, "eval_precision_weighted": 0.7661972661776627, "eval_recall_weighted": 0.7616906474820144, "eval_runtime": 1.7253, "eval_samples_per_second": 644.51, "eval_steps_per_second": 40.572, "step": 3058 }, { "epoch": 12.0, "eval_accuracy": 0.7661870503597122, "eval_accuracy_at_2": 0.835431654676259, "eval_f1_macro": 0.7147133534539337, "eval_f1_macro_at_2": 0.7909847693173496, "eval_f1_micro": 0.7661870503597122, "eval_f1_weighted": 0.7528325022460537, "eval_f1_weighted_at_2": 0.8258195847328804, "eval_loss": 1.6502783298492432, "eval_precision_weighted": 0.7591421634449557, "eval_recall_weighted": 0.7661870503597122, "eval_runtime": 1.7262, "eval_samples_per_second": 644.207, "eval_steps_per_second": 40.553, "step": 3336 }, { "epoch": 13.0, "eval_accuracy": 0.7661870503597122, "eval_accuracy_at_2": 0.8381294964028777, "eval_f1_macro": 0.7157676063067756, "eval_f1_macro_at_2": 0.8066775674645668, "eval_f1_micro": 0.7661870503597122, "eval_f1_weighted": 0.7547889054147703, "eval_f1_weighted_at_2": 0.8293209101204917, "eval_loss": 1.6077083349227905, "eval_precision_weighted": 0.7655113318987471, "eval_recall_weighted": 0.7661870503597122, "eval_runtime": 1.7261, "eval_samples_per_second": 644.238, "eval_steps_per_second": 40.555, "step": 3614 }, { "epoch": 14.0, "eval_accuracy": 0.7652877697841727, "eval_accuracy_at_2": 0.8399280575539568, "eval_f1_macro": 0.7251318101032391, "eval_f1_macro_at_2": 0.8095146409316828, "eval_f1_micro": 0.7652877697841727, "eval_f1_weighted": 0.7535442727856384, "eval_f1_weighted_at_2": 0.8318093197662693, "eval_loss": 1.6115399599075317, "eval_precision_weighted": 0.7652284840584932, "eval_recall_weighted": 0.7652877697841727, "eval_runtime": 1.7263, "eval_samples_per_second": 644.149, "eval_steps_per_second": 40.549, "step": 3892 }, { "epoch": 15.0, "eval_accuracy": 0.7661870503597122, "eval_accuracy_at_2": 0.8408273381294964, "eval_f1_macro": 0.7296723842255801, "eval_f1_macro_at_2": 0.810034366402201, "eval_f1_micro": 0.7661870503597122, "eval_f1_weighted": 0.7540657431253593, "eval_f1_weighted_at_2": 0.8327842029609481, "eval_loss": 1.6192994117736816, "eval_precision_weighted": 0.764688174461808, "eval_recall_weighted": 0.7661870503597122, "eval_runtime": 1.7258, "eval_samples_per_second": 644.337, "eval_steps_per_second": 40.561, "step": 4170 } ], "logging_steps": 277.0, "max_steps": 4448, "num_input_tokens_seen": 0, "num_train_epochs": 16, "save_steps": 500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": false }, "attributes": {} } }, "total_flos": 1.046065690987632e+16, "train_batch_size": 16, "trial_name": null, "trial_params": null }