kiddothe2b committed on Nov 24, 2022

Commit

f928948

1 Parent(s): f78ff50

Training in progress, step 350000

Browse files

Files changed (20) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/rng_state_4.pth +1 -1
last-checkpoint/rng_state_5.pth +1 -1
last-checkpoint/rng_state_6.pth +1 -1
last-checkpoint/rng_state_7.pth +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +311 -3
last-checkpoint/training_args.bin +1 -1
pytorch_model.bin +1 -1
runs/Nov11_11-14-20_t1v-n-088af867-w-0/events.out.tfevents.1668165319.t1v-n-088af867-w-0.346597.0 +2 -2
runs/Nov17_09-03-22_t1v-n-088af867-w-0/1668675880.4394102/events.out.tfevents.1668675880.t1v-n-088af867-w-0.91101.1 +3 -0
runs/Nov17_09-03-22_t1v-n-088af867-w-0/events.out.tfevents.1668675880.t1v-n-088af867-w-0.91101.0 +3 -0
runs/Nov21_18-14-51_t1v-n-088af867-w-0/1669054551.8620195/events.out.tfevents.1669054551.t1v-n-088af867-w-0.42571.1 +3 -0
runs/Nov21_18-14-51_t1v-n-088af867-w-0/events.out.tfevents.1669054551.t1v-n-088af867-w-0.42571.0 +3 -0
training_args.bin +1 -1

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:07a6b46aa8152383b0a50bd07b07a176c831d5337ddec91d8b5b5aba89b5b543
 size 996067161

 version https://git-lfs.github.com/spec/v1
+oid sha256:e61ee14a21dfb599f1c63f3e0e8686eb244cce7311c2a2b967485c15ff52a3f8
 size 996067161

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b2517996d5c4c4163884506060e457650dff4618ff3814b55dc92b5b3c209528
 size 498046827

 version https://git-lfs.github.com/spec/v1
+oid sha256:e1fddf171aaf7fcd5407c99cb8a97835dce9ceccd14ee70ed5b23a17af12fdf3
 size 498046827

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b06f062cec2bd581a5223b4bd92c5f2dcf09d9cd3cfe1d2d70466080b2e9546a
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:036eb5eec66f4acc5bf94747270222b9c5a69b86c3f623f9e981140d862a7ab4
 size 13611

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d998162d48f4ee450ef4bf13d9e047fd62295bbe3f16a4efd05adea28896f336
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:9fcbaab8f44aa44b57133d3d5819bbf91b8fc92df692100e5583bb214e77939c
 size 13611

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b06f062cec2bd581a5223b4bd92c5f2dcf09d9cd3cfe1d2d70466080b2e9546a
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:036eb5eec66f4acc5bf94747270222b9c5a69b86c3f623f9e981140d862a7ab4
 size 13611

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:372875e5805e9be2c35e094a3a6b2332849035b4c4b7dbcec07d8d9b728521d7
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:74cd3be6cc3a9e9a714d813672381da6434030e8445f48465040931d56dcaba6
 size 13611

last-checkpoint/rng_state_4.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b06f062cec2bd581a5223b4bd92c5f2dcf09d9cd3cfe1d2d70466080b2e9546a
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:673bcbb9d666bc7c835ef864763b55aa80db016b301aae7e39ae8a0cb0efb86a
 size 13611

last-checkpoint/rng_state_5.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:372875e5805e9be2c35e094a3a6b2332849035b4c4b7dbcec07d8d9b728521d7
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:74cd3be6cc3a9e9a714d813672381da6434030e8445f48465040931d56dcaba6
 size 13611

last-checkpoint/rng_state_6.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b06f062cec2bd581a5223b4bd92c5f2dcf09d9cd3cfe1d2d70466080b2e9546a
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:673bcbb9d666bc7c835ef864763b55aa80db016b301aae7e39ae8a0cb0efb86a
 size 13611

last-checkpoint/rng_state_7.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:305632a8833b49b3167aa1319ddc125408cf66a7d459afebacacaa7cdcedb877
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:036eb5eec66f4acc5bf94747270222b9c5a69b86c3f623f9e981140d862a7ab4
 size 13611

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4d41c6734c2aef1f60ed0fbc886cbc351448520889799ebfa66c14f8f9e99059
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:f8f220426de5a076dbb6f66f54955d3a3fc0acbab10b1bd60cf9472b552bfdca
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 1.032937,
-  "global_step": 300000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -1854,11 +1854,319 @@
       "eval_samples_per_second": 492.503,
       "eval_steps_per_second": 1.97,
       "step": 300000
     }
   ],
   "max_steps": 1000000,
   "num_train_epochs": 9223372036854775807,
-  "total_flos": 5.0546812649472e+18,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 1.08296,
+  "global_step": 350000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 492.503,
       "eval_steps_per_second": 1.97,
       "step": 300000
+    },
+    {
+      "epoch": 1.03,
+      "learning_rate": 8.37422439088976e-05,
+      "loss": 0.894,
+      "step": 301000
+    },
+    {
+      "epoch": 1.03,
+      "learning_rate": 8.362004023673474e-05,
+      "loss": 0.8804,
+      "step": 302000
+    },
+    {
+      "epoch": 1.04,
+      "learning_rate": 8.349746890119826e-05,
+      "loss": 0.8663,
+      "step": 303000
+    },
+    {
+      "epoch": 1.04,
+      "learning_rate": 8.337453124270863e-05,
+      "loss": 0.8767,
+      "step": 304000
+    },
+    {
+      "epoch": 1.04,
+      "learning_rate": 8.32512286056924e-05,
+      "loss": 0.8697,
+      "step": 305000
+    },
+    {
+      "epoch": 1.04,
+      "learning_rate": 8.31275623385675e-05,
+      "loss": 0.876,
+      "step": 306000
+    },
+    {
+      "epoch": 1.04,
+      "learning_rate": 8.300353379372834e-05,
+      "loss": 0.8752,
+      "step": 307000
+    },
+    {
+      "epoch": 1.04,
+      "learning_rate": 8.287914432753123e-05,
+      "loss": 0.8711,
+      "step": 308000
+    },
+    {
+      "epoch": 1.04,
+      "learning_rate": 8.275439530027948e-05,
+      "loss": 0.8526,
+      "step": 309000
+    },
+    {
+      "epoch": 1.04,
+      "learning_rate": 8.262928807620843e-05,
+      "loss": 0.8794,
+      "step": 310000
+    },
+    {
+      "epoch": 1.04,
+      "learning_rate": 8.250382402347065e-05,
+      "loss": 0.8671,
+      "step": 311000
+    },
+    {
+      "epoch": 1.04,
+      "learning_rate": 8.237800451412095e-05,
+      "loss": 0.8772,
+      "step": 312000
+    },
+    {
+      "epoch": 1.05,
+      "learning_rate": 8.225183092410128e-05,
+      "loss": 0.8786,
+      "step": 313000
+    },
+    {
+      "epoch": 1.05,
+      "learning_rate": 8.212530463322583e-05,
+      "loss": 0.8704,
+      "step": 314000
+    },
+    {
+      "epoch": 1.05,
+      "learning_rate": 8.199842702516583e-05,
+      "loss": 0.8801,
+      "step": 315000
+    },
+    {
+      "epoch": 1.05,
+      "learning_rate": 8.18711994874345e-05,
+      "loss": 0.8728,
+      "step": 316000
+    },
+    {
+      "epoch": 1.05,
+      "learning_rate": 8.174362341137177e-05,
+      "loss": 0.8628,
+      "step": 317000
+    },
+    {
+      "epoch": 1.05,
+      "learning_rate": 8.161570019212921e-05,
+      "loss": 0.8591,
+      "step": 318000
+    },
+    {
+      "epoch": 1.05,
+      "learning_rate": 8.148743122865463e-05,
+      "loss": 0.8793,
+      "step": 319000
+    },
+    {
+      "epoch": 1.05,
+      "learning_rate": 8.135881792367686e-05,
+      "loss": 0.8958,
+      "step": 320000
+    },
+    {
+      "epoch": 1.05,
+      "learning_rate": 8.12298616836904e-05,
+      "loss": 0.8768,
+      "step": 321000
+    },
+    {
+      "epoch": 1.05,
+      "learning_rate": 8.110056391894005e-05,
+      "loss": 0.8882,
+      "step": 322000
+    },
+    {
+      "epoch": 1.06,
+      "learning_rate": 8.097092604340542e-05,
+      "loss": 0.8954,
+      "step": 323000
+    },
+    {
+      "epoch": 1.06,
+      "learning_rate": 8.084094947478556e-05,
+      "loss": 0.9074,
+      "step": 324000
+    },
+    {
+      "epoch": 1.06,
+      "learning_rate": 8.07106356344834e-05,
+      "loss": 0.894,
+      "step": 325000
+    },
+    {
+      "epoch": 1.06,
+      "learning_rate": 8.057998594759022e-05,
+      "loss": 0.8978,
+      "step": 326000
+    },
+    {
+      "epoch": 1.06,
+      "learning_rate": 8.044900184287007e-05,
+      "loss": 0.9071,
+      "step": 327000
+    },
+    {
+      "epoch": 1.06,
+      "learning_rate": 8.031768475274413e-05,
+      "loss": 0.9107,
+      "step": 328000
+    },
+    {
+      "epoch": 1.06,
+      "learning_rate": 8.018603611327504e-05,
+      "loss": 0.8774,
+      "step": 329000
+    },
+    {
+      "epoch": 1.06,
+      "learning_rate": 8.005405736415126e-05,
+      "loss": 0.8975,
+      "step": 330000
+    },
+    {
+      "epoch": 1.06,
+      "learning_rate": 7.992174994867123e-05,
+      "loss": 0.8813,
+      "step": 331000
+    },
+    {
+      "epoch": 1.06,
+      "learning_rate": 7.978911531372765e-05,
+      "loss": 0.869,
+      "step": 332000
+    },
+    {
+      "epoch": 1.07,
+      "learning_rate": 7.965615490979163e-05,
+      "loss": 0.8809,
+      "step": 333000
+    },
+    {
+      "epoch": 1.07,
+      "learning_rate": 7.952287019089685e-05,
+      "loss": 0.8669,
+      "step": 334000
+    },
+    {
+      "epoch": 1.07,
+      "learning_rate": 7.938926261462366e-05,
+      "loss": 0.8675,
+      "step": 335000
+    },
+    {
+      "epoch": 1.07,
+      "learning_rate": 7.925533364208309e-05,
+      "loss": 0.8748,
+      "step": 336000
+    },
+    {
+      "epoch": 1.07,
+      "learning_rate": 7.912108473790092e-05,
+      "loss": 0.883,
+      "step": 337000
+    },
+    {
+      "epoch": 1.07,
+      "learning_rate": 7.898651737020166e-05,
+      "loss": 0.8941,
+      "step": 338000
+    },
+    {
+      "epoch": 1.07,
+      "learning_rate": 7.88516330105925e-05,
+      "loss": 0.8876,
+      "step": 339000
+    },
+    {
+      "epoch": 1.07,
+      "learning_rate": 7.871643313414718e-05,
+      "loss": 0.8878,
+      "step": 340000
+    },
+    {
+      "epoch": 1.07,
+      "learning_rate": 7.858091921938988e-05,
+      "loss": 0.8908,
+      "step": 341000
+    },
+    {
+      "epoch": 1.07,
+      "learning_rate": 7.844509274827907e-05,
+      "loss": 0.8878,
+      "step": 342000
+    },
+    {
+      "epoch": 1.08,
+      "learning_rate": 7.830895520619128e-05,
+      "loss": 0.8865,
+      "step": 343000
+    },
+    {
+      "epoch": 1.08,
+      "learning_rate": 7.817250808190483e-05,
+      "loss": 0.8842,
+      "step": 344000
+    },
+    {
+      "epoch": 1.08,
+      "learning_rate": 7.803575286758364e-05,
+      "loss": 0.8879,
+      "step": 345000
+    },
+    {
+      "epoch": 1.08,
+      "learning_rate": 7.789869105876083e-05,
+      "loss": 0.8964,
+      "step": 346000
+    },
+    {
+      "epoch": 1.08,
+      "learning_rate": 7.776132415432234e-05,
+      "loss": 0.8836,
+      "step": 347000
+    },
+    {
+      "epoch": 1.08,
+      "learning_rate": 7.762365365649067e-05,
+      "loss": 0.8834,
+      "step": 348000
+    },
+    {
+      "epoch": 1.08,
+      "learning_rate": 7.748568107080832e-05,
+      "loss": 0.8907,
+      "step": 349000
+    },
+    {
+      "epoch": 1.08,
+      "learning_rate": 7.734740790612136e-05,
+      "loss": 0.8899,
+      "step": 350000
+    },
+    {
+      "epoch": 1.08,
+      "eval_loss": 0.8285813331604004,
+      "eval_runtime": 24.9856,
+      "eval_samples_per_second": 400.23,
+      "eval_steps_per_second": 1.601,
+      "step": 350000
     }
   ],
   "max_steps": 1000000,
   "num_train_epochs": 9223372036854775807,
+  "total_flos": 5.897119717969625e+18,
   "trial_name": null,
   "trial_params": null
 }

last-checkpoint/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3b4ff5810bc5e548a89007cef7a8f26eae082bc23f1a60b2fb29c87071c0fb01
 size 3375

 version https://git-lfs.github.com/spec/v1
+oid sha256:225de94e6547ae8e2d8e5b9a0e34c719612311b29038a27f9107115c46808f63
 size 3375

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b2517996d5c4c4163884506060e457650dff4618ff3814b55dc92b5b3c209528
 size 498046827

 version https://git-lfs.github.com/spec/v1
+oid sha256:e1fddf171aaf7fcd5407c99cb8a97835dce9ceccd14ee70ed5b23a17af12fdf3
 size 498046827

runs/Nov11_11-14-20_t1v-n-088af867-w-0/events.out.tfevents.1668165319.t1v-n-088af867-w-0.346597.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c4c444c4e8e903f12d92ca730d51afacf1008416ca703be4c9290ba2b7d54fe2
-size 53355

 version https://git-lfs.github.com/spec/v1
+oid sha256:5f584155741b1ac1c66f2deec1a86eb4dec91ffb6ede4b340e14a38064332a51
+size 61035

runs/Nov17_09-03-22_t1v-n-088af867-w-0/1668675880.4394102/events.out.tfevents.1668675880.t1v-n-088af867-w-0.91101.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:84092474497834ded5ff6a628c5df8f98b1991b6bf66a6e9c229275fb3983810
+size 5419

runs/Nov17_09-03-22_t1v-n-088af867-w-0/events.out.tfevents.1668675880.t1v-n-088af867-w-0.91101.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:77d571d78f4fe0979689c970eb58513ff26e9e28f757dd306ffedcec3e98b4b2
+size 3748

runs/Nov21_18-14-51_t1v-n-088af867-w-0/1669054551.8620195/events.out.tfevents.1669054551.t1v-n-088af867-w-0.42571.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6eadbd757619674b78bab6f3a98c1ced53a048c7440ccbd25ca0e2ad1b0441cf
+size 5419

runs/Nov21_18-14-51_t1v-n-088af867-w-0/events.out.tfevents.1669054551.t1v-n-088af867-w-0.42571.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1b0ad7fd9cf05d0068da00ee4295784721aa3d2aa25d542d74eb8a8ae739909e
+size 12024

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3b4ff5810bc5e548a89007cef7a8f26eae082bc23f1a60b2fb29c87071c0fb01
 size 3375

 version https://git-lfs.github.com/spec/v1
+oid sha256:225de94e6547ae8e2d8e5b9a0e34c719612311b29038a27f9107115c46808f63
 size 3375