Training in progress, step 700, checkpoint

Files changed (12) hide show

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:66afc3d85ad47b5d1be06689a9b95f35b8263c4de56db57e5cfd8d012608c40e
 size 157308096

 version https://git-lfs.github.com/spec/v1
+oid sha256:9a1f81a979d83b45699d06c02548b57bebc286653c14630be8ee51d9cc5c577e
 size 157308096

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8ef1ef269010fe272a9f4a5e0950e3907565d11e25dfb20a60ba52cc2a2fff63
 size 314671226

 version https://git-lfs.github.com/spec/v1
+oid sha256:a0ae3487fe4662796b3ef6fb9ff96387b0a9e31b8352da8696a25b00f6e815ac
 size 314671226

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1e556ea43a786747c49d91b2115ae288f4685b49c5654d937010d3646b45c410
 size 15920

 version https://git-lfs.github.com/spec/v1
+oid sha256:05ecbb654eb9d520c9c2d628b7c67906fa27497fded38c4cf23920970bfa2f6b
 size 15920

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7d145daf5de0e6e4c7cbe7d6a7b1a99ea6f5f5ab11a6634c9aadfa0a197734f7
 size 15920

 version https://git-lfs.github.com/spec/v1
+oid sha256:1b5492d8ec76ce628fd257523d91584ac91c687d7ea1ef2f0e8152c0e20ff570
 size 15920

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:06bf7f6ea338a69748630c269d4a8a93e783dd8580aa6c2270050a5a582ea155
 size 15920

 version https://git-lfs.github.com/spec/v1
+oid sha256:b646aee243f6a8534b782828cbcd0f3e047db163dadc7361bc3510d59b8e71cf
 size 15920

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4cd09ab162c4e59c55c2354c8b16b608f3087657c3a30bbee7c948d03c127c6e
 size 15920

 version https://git-lfs.github.com/spec/v1
+oid sha256:50c34f5a01db989b610d43301c05aead10d5b35628396f8db1cc4a1d0c93327b
 size 15920

last-checkpoint/rng_state_4.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1d0bcf2622bc32729c628f01a8656e80557929a1b51b9e03fd6b69a2095c11b5
 size 15920

 version https://git-lfs.github.com/spec/v1
+oid sha256:34d6715ef9bcf8c2d160c0febb1f11b92784391c975eac88d5f405cd379e27cd
 size 15920

last-checkpoint/rng_state_5.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b78837eb56314b91782e18192080e140c41a96eba3e74e928fd1a51476f0794b
 size 15920

 version https://git-lfs.github.com/spec/v1
+oid sha256:4c88ab604f34281ba33dfad57ff22ed29b0aa7a757641052333954f5a008950b
 size 15920

last-checkpoint/rng_state_6.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f8acf23010bf65cb2135d18157640ac2eb32bcd1c4a2b8f6e7cab3039ba5e39a
 size 15920

 version https://git-lfs.github.com/spec/v1
+oid sha256:e6afe8bc07a4e18b43b02dd293c71e31b6e675d9f7b575c366a286e2778648d2
 size 15920

last-checkpoint/rng_state_7.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:da77b547a2231c986b747c834bd4bc2fd5e52598053621c5953c3169941a1558
 size 15920

 version https://git-lfs.github.com/spec/v1
+oid sha256:f21ad02873b1f5ad245ca6efdc40bd8b5a8d297e45f987f2c2e5e4688b02ba94
 size 15920

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:65344ffcca5c2927ab748ec8325cda6b2e302939be48ec00a6dafd7a65462e37
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:4efe5ad5ff1c774830ba0cbe5db77e2469a801b3e1c8c9f7575364d9145f02c7
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.7509386733416771,
   "eval_steps": 100,
-  "global_step": 600,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -62,6 +62,14 @@
       "eval_samples_per_second": 5.997,
       "eval_steps_per_second": 0.375,
       "step": 600
     }
   ],
   "logging_steps": 500,
@@ -81,7 +89,7 @@
       "attributes": {}
     }
   },
-  "total_flos": 6.851404845023232e+17,
   "train_batch_size": 2,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.8760951188986232,
   "eval_steps": 100,
+  "global_step": 700,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 5.997,
       "eval_steps_per_second": 0.375,
       "step": 600
+    },
+    {
+      "epoch": 0.8760951188986232,
+      "eval_loss": 0.015957491472363472,
+      "eval_runtime": 5.3181,
+      "eval_samples_per_second": 6.017,
+      "eval_steps_per_second": 0.376,
+      "step": 700
     }
   ],
   "logging_steps": 500,
       "attributes": {}
     }
   },
+  "total_flos": 7.993305652527104e+17,
   "train_batch_size": 2,
   "trial_name": null,
   "trial_params": null