Training in progress, step 41200, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
|
@@ -1339,6 +1339,10 @@ You can finetune this model on your own dataset.
|
|
| 1339 |
| 0.7227 | 40900 | 0.3322 |
|
| 1340 |
| 0.7236 | 40950 | 0.3424 |
|
| 1341 |
| 0.7245 | 41000 | 0.2834 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1342 |
|
| 1343 |
</details>
|
| 1344 |
|
|
|
|
| 1339 |
| 0.7227 | 40900 | 0.3322 |
|
| 1340 |
| 0.7236 | 40950 | 0.3424 |
|
| 1341 |
| 0.7245 | 41000 | 0.2834 |
|
| 1342 |
+
| 0.7254 | 41050 | 0.2776 |
|
| 1343 |
+
| 0.7263 | 41100 | 0.2924 |
|
| 1344 |
+
| 0.7271 | 41150 | 0.3982 |
|
| 1345 |
+
| 0.7280 | 41200 | 0.3379 |
|
| 1346 |
|
| 1347 |
</details>
|
| 1348 |
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 90864192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:822f3843e5d129c0bef56a9f39c1ba41bc1fa63adfc0cc1868ef514ec0e5351b
|
| 3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 180609210
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:086abfb2bf298dfb180a5caff3f861d5e6d3d3f4b12f1b97c28016e45648410e
|
| 3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4b9af559530a0818383bd31a393ecc6f9d55de4b1055f24c5ea4deb160850318
|
| 3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:360bf556a97129543cdfd5bc8f9267eddea0b0255ab50b0df912124a90a12812
|
| 3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:be053631e025ff40e9a33566316f50efe9d70bdf16e7a6393f50270033d19672
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -5748,6 +5748,34 @@
|
|
| 5748 |
"learning_rate": 1.532170976419077e-05,
|
| 5749 |
"loss": 0.2834,
|
| 5750 |
"step": 41000
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 5751 |
}
|
| 5752 |
],
|
| 5753 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.7280309589864112,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 41200,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 5748 |
"learning_rate": 1.532170976419077e-05,
|
| 5749 |
"loss": 0.2834,
|
| 5750 |
"step": 41000
|
| 5751 |
+
},
|
| 5752 |
+
{
|
| 5753 |
+
"epoch": 0.7253803608347618,
|
| 5754 |
+
"grad_norm": 2.0050973892211914,
|
| 5755 |
+
"learning_rate": 1.5272623745852232e-05,
|
| 5756 |
+
"loss": 0.2776,
|
| 5757 |
+
"step": 41050
|
| 5758 |
+
},
|
| 5759 |
+
{
|
| 5760 |
+
"epoch": 0.7262638935519782,
|
| 5761 |
+
"grad_norm": 1.4293886423110962,
|
| 5762 |
+
"learning_rate": 1.5223537727513695e-05,
|
| 5763 |
+
"loss": 0.2924,
|
| 5764 |
+
"step": 41100
|
| 5765 |
+
},
|
| 5766 |
+
{
|
| 5767 |
+
"epoch": 0.7271474262691947,
|
| 5768 |
+
"grad_norm": 1.5391188859939575,
|
| 5769 |
+
"learning_rate": 1.5174451709175158e-05,
|
| 5770 |
+
"loss": 0.3982,
|
| 5771 |
+
"step": 41150
|
| 5772 |
+
},
|
| 5773 |
+
{
|
| 5774 |
+
"epoch": 0.7280309589864112,
|
| 5775 |
+
"grad_norm": 1.4493207931518555,
|
| 5776 |
+
"learning_rate": 1.5125365690836625e-05,
|
| 5777 |
+
"loss": 0.3379,
|
| 5778 |
+
"step": 41200
|
| 5779 |
}
|
| 5780 |
],
|
| 5781 |
"logging_steps": 50,
|