cognia-wav2vec / checkpoint-350 /trainer_state.json
Artyomorax's picture
Add wav2vec fine-tuned model files
288c286
Raw
History Blame
6.37 kB
{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 14.0,
"eval_steps": 500,
"global_step": 350,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.4032258064516129,
"grad_norm": 15.945989608764648,
"learning_rate": 5.4e-07,
"loss": 2.942,
"step": 10
},
{
"epoch": 0.8064516129032258,
"grad_norm": 15.050374984741211,
"learning_rate": 1.14e-06,
"loss": 3.345,
"step": 20
},
{
"epoch": 1.2016129032258065,
"grad_norm": 9.487156867980957,
"learning_rate": 1.74e-06,
"loss": 2.6443,
"step": 30
},
{
"epoch": 1.6048387096774195,
"grad_norm": 14.825271606445312,
"learning_rate": 2.34e-06,
"loss": 3.0528,
"step": 40
},
{
"epoch": 2.0,
"grad_norm": 15.298517227172852,
"learning_rate": 2.9400000000000002e-06,
"loss": 2.2951,
"step": 50
},
{
"epoch": 2.403225806451613,
"grad_norm": 13.529952049255371,
"learning_rate": 3.54e-06,
"loss": 2.3061,
"step": 60
},
{
"epoch": 2.806451612903226,
"grad_norm": 12.780255317687988,
"learning_rate": 4.14e-06,
"loss": 1.828,
"step": 70
},
{
"epoch": 3.2016129032258065,
"grad_norm": 4.392550468444824,
"learning_rate": 4.74e-06,
"loss": 1.7883,
"step": 80
},
{
"epoch": 3.6048387096774195,
"grad_norm": 6.868764400482178,
"learning_rate": 5.34e-06,
"loss": 1.3883,
"step": 90
},
{
"epoch": 4.0,
"grad_norm": 11.529573440551758,
"learning_rate": 5.940000000000001e-06,
"loss": 1.2804,
"step": 100
},
{
"epoch": 4.403225806451613,
"grad_norm": 3.888104200363159,
"learning_rate": 6.54e-06,
"loss": 1.1184,
"step": 110
},
{
"epoch": 4.806451612903226,
"grad_norm": 5.543831825256348,
"learning_rate": 7.14e-06,
"loss": 0.8838,
"step": 120
},
{
"epoch": 5.201612903225806,
"grad_norm": 3.6435844898223877,
"learning_rate": 7.74e-06,
"loss": 0.7359,
"step": 130
},
{
"epoch": 5.604838709677419,
"grad_norm": 3.873931407928467,
"learning_rate": 8.340000000000001e-06,
"loss": 0.6677,
"step": 140
},
{
"epoch": 6.0,
"grad_norm": 6.526176929473877,
"learning_rate": 8.939999999999999e-06,
"loss": 0.5343,
"step": 150
},
{
"epoch": 6.403225806451613,
"grad_norm": 2.3237783908843994,
"learning_rate": 9.54e-06,
"loss": 0.4596,
"step": 160
},
{
"epoch": 6.806451612903226,
"grad_norm": 3.2708520889282227,
"learning_rate": 1.0140000000000001e-05,
"loss": 0.371,
"step": 170
},
{
"epoch": 7.201612903225806,
"grad_norm": 1.420652985572815,
"learning_rate": 1.074e-05,
"loss": 0.397,
"step": 180
},
{
"epoch": 7.604838709677419,
"grad_norm": 2.8168821334838867,
"learning_rate": 1.134e-05,
"loss": 0.2335,
"step": 190
},
{
"epoch": 8.0,
"grad_norm": 0.872466504573822,
"learning_rate": 1.1940000000000001e-05,
"loss": 0.2535,
"step": 200
},
{
"epoch": 8.403225806451612,
"grad_norm": 1.6869771480560303,
"learning_rate": 1.254e-05,
"loss": 0.1642,
"step": 210
},
{
"epoch": 8.806451612903226,
"grad_norm": 8.301424026489258,
"learning_rate": 1.314e-05,
"loss": 0.112,
"step": 220
},
{
"epoch": 9.201612903225806,
"grad_norm": 0.7436397671699524,
"learning_rate": 1.374e-05,
"loss": 0.1257,
"step": 230
},
{
"epoch": 9.60483870967742,
"grad_norm": 1.891860842704773,
"learning_rate": 1.434e-05,
"loss": 0.0623,
"step": 240
},
{
"epoch": 10.0,
"grad_norm": 0.5202131867408752,
"learning_rate": 1.4940000000000001e-05,
"loss": 0.0572,
"step": 250
},
{
"epoch": 10.403225806451612,
"grad_norm": 0.0677497610449791,
"learning_rate": 1.554e-05,
"loss": 0.0212,
"step": 260
},
{
"epoch": 10.806451612903226,
"grad_norm": 0.07801195234060287,
"learning_rate": 1.614e-05,
"loss": 0.0243,
"step": 270
},
{
"epoch": 11.201612903225806,
"grad_norm": 0.11515898257493973,
"learning_rate": 1.6740000000000002e-05,
"loss": 0.0321,
"step": 280
},
{
"epoch": 11.60483870967742,
"grad_norm": 0.11826858669519424,
"learning_rate": 1.734e-05,
"loss": 0.0254,
"step": 290
},
{
"epoch": 12.0,
"grad_norm": 0.13558819890022278,
"learning_rate": 1.794e-05,
"loss": 0.014,
"step": 300
},
{
"epoch": 12.403225806451612,
"grad_norm": 0.03777763620018959,
"learning_rate": 1.854e-05,
"loss": 0.0301,
"step": 310
},
{
"epoch": 12.806451612903226,
"grad_norm": 0.0405518114566803,
"learning_rate": 1.914e-05,
"loss": 0.0027,
"step": 320
},
{
"epoch": 13.201612903225806,
"grad_norm": 0.03762541711330414,
"learning_rate": 1.974e-05,
"loss": 0.0026,
"step": 330
},
{
"epoch": 13.60483870967742,
"grad_norm": 0.06563286483287811,
"learning_rate": 2.0340000000000002e-05,
"loss": 0.0279,
"step": 340
},
{
"epoch": 14.0,
"grad_norm": 0.12380703538656235,
"learning_rate": 2.094e-05,
"loss": 0.0063,
"step": 350
}
],
"logging_steps": 10,
"max_steps": 375,
"num_input_tokens_seen": 0,
"num_train_epochs": 15,
"save_steps": 50,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": false
},
"attributes": {}
}
},
"total_flos": 1.651986705536446e+17,
"train_batch_size": 4,
"trial_name": null,
"trial_params": null
}