evgmaslov commited on
Commit
ef57025
·
verified ·
1 Parent(s): 3463562

Training in progress, step 700, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:66afc3d85ad47b5d1be06689a9b95f35b8263c4de56db57e5cfd8d012608c40e
3
  size 157308096
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a1f81a979d83b45699d06c02548b57bebc286653c14630be8ee51d9cc5c577e
3
  size 157308096
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8ef1ef269010fe272a9f4a5e0950e3907565d11e25dfb20a60ba52cc2a2fff63
3
  size 314671226
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0ae3487fe4662796b3ef6fb9ff96387b0a9e31b8352da8696a25b00f6e815ac
3
  size 314671226
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1e556ea43a786747c49d91b2115ae288f4685b49c5654d937010d3646b45c410
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05ecbb654eb9d520c9c2d628b7c67906fa27497fded38c4cf23920970bfa2f6b
3
  size 15920
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7d145daf5de0e6e4c7cbe7d6a7b1a99ea6f5f5ab11a6634c9aadfa0a197734f7
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b5492d8ec76ce628fd257523d91584ac91c687d7ea1ef2f0e8152c0e20ff570
3
  size 15920
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:06bf7f6ea338a69748630c269d4a8a93e783dd8580aa6c2270050a5a582ea155
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b646aee243f6a8534b782828cbcd0f3e047db163dadc7361bc3510d59b8e71cf
3
  size 15920
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4cd09ab162c4e59c55c2354c8b16b608f3087657c3a30bbee7c948d03c127c6e
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:50c34f5a01db989b610d43301c05aead10d5b35628396f8db1cc4a1d0c93327b
3
  size 15920
last-checkpoint/rng_state_4.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1d0bcf2622bc32729c628f01a8656e80557929a1b51b9e03fd6b69a2095c11b5
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:34d6715ef9bcf8c2d160c0febb1f11b92784391c975eac88d5f405cd379e27cd
3
  size 15920
last-checkpoint/rng_state_5.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b78837eb56314b91782e18192080e140c41a96eba3e74e928fd1a51476f0794b
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c88ab604f34281ba33dfad57ff22ed29b0aa7a757641052333954f5a008950b
3
  size 15920
last-checkpoint/rng_state_6.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f8acf23010bf65cb2135d18157640ac2eb32bcd1c4a2b8f6e7cab3039ba5e39a
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e6afe8bc07a4e18b43b02dd293c71e31b6e675d9f7b575c366a286e2778648d2
3
  size 15920
last-checkpoint/rng_state_7.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:da77b547a2231c986b747c834bd4bc2fd5e52598053621c5953c3169941a1558
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f21ad02873b1f5ad245ca6efdc40bd8b5a8d297e45f987f2c2e5e4688b02ba94
3
  size 15920
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:65344ffcca5c2927ab748ec8325cda6b2e302939be48ec00a6dafd7a65462e37
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4efe5ad5ff1c774830ba0cbe5db77e2469a801b3e1c8c9f7575364d9145f02c7
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.7509386733416771,
5
  "eval_steps": 100,
6
- "global_step": 600,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -62,6 +62,14 @@
62
  "eval_samples_per_second": 5.997,
63
  "eval_steps_per_second": 0.375,
64
  "step": 600
 
 
 
 
 
 
 
 
65
  }
66
  ],
67
  "logging_steps": 500,
@@ -81,7 +89,7 @@
81
  "attributes": {}
82
  }
83
  },
84
- "total_flos": 6.851404845023232e+17,
85
  "train_batch_size": 2,
86
  "trial_name": null,
87
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.8760951188986232,
5
  "eval_steps": 100,
6
+ "global_step": 700,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
62
  "eval_samples_per_second": 5.997,
63
  "eval_steps_per_second": 0.375,
64
  "step": 600
65
+ },
66
+ {
67
+ "epoch": 0.8760951188986232,
68
+ "eval_loss": 0.015957491472363472,
69
+ "eval_runtime": 5.3181,
70
+ "eval_samples_per_second": 6.017,
71
+ "eval_steps_per_second": 0.376,
72
+ "step": 700
73
  }
74
  ],
75
  "logging_steps": 500,
 
89
  "attributes": {}
90
  }
91
  },
92
+ "total_flos": 7.993305652527104e+17,
93
  "train_batch_size": 2,
94
  "trial_name": null,
95
  "trial_params": null