guyhadad01 commited on
Commit
3291cc1
·
verified ·
1 Parent(s): 1fb2235

Training in progress, step 41200, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1339,6 +1339,10 @@ You can finetune this model on your own dataset.
1339
  | 0.7227 | 40900 | 0.3322 |
1340
  | 0.7236 | 40950 | 0.3424 |
1341
  | 0.7245 | 41000 | 0.2834 |
 
 
 
 
1342
 
1343
  </details>
1344
 
 
1339
  | 0.7227 | 40900 | 0.3322 |
1340
  | 0.7236 | 40950 | 0.3424 |
1341
  | 0.7245 | 41000 | 0.2834 |
1342
+ | 0.7254 | 41050 | 0.2776 |
1343
+ | 0.7263 | 41100 | 0.2924 |
1344
+ | 0.7271 | 41150 | 0.3982 |
1345
+ | 0.7280 | 41200 | 0.3379 |
1346
 
1347
  </details>
1348
 
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1bad5fe2e60c5aa24260d1942f5fd36c57da4fa95b5377f04b02dcc5ceb9e653
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:822f3843e5d129c0bef56a9f39c1ba41bc1fa63adfc0cc1868ef514ec0e5351b
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8fece1064662d61321c117cc1d24216b16971ad97b1195b94af13fb853181101
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:086abfb2bf298dfb180a5caff3f861d5e6d3d3f4b12f1b97c28016e45648410e
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7d73c58855bdaef926976cbbf2d9665190e116bcc636d4b89a717f6e32bf6a98
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b9af559530a0818383bd31a393ecc6f9d55de4b1055f24c5ea4deb160850318
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2a4677c24f01289fca4e4e6cb6d863cf74dbec8f2665874e2aeb1133c6e53329
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:360bf556a97129543cdfd5bc8f9267eddea0b0255ab50b0df912124a90a12812
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d9861609e13b6dfba877602ae0e61dca8ad368849f8b20c6f7958302bb7e1b3b
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be053631e025ff40e9a33566316f50efe9d70bdf16e7a6393f50270033d19672
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.7244968281175452,
6
  "eval_steps": 500,
7
- "global_step": 41000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -5748,6 +5748,34 @@
5748
  "learning_rate": 1.532170976419077e-05,
5749
  "loss": 0.2834,
5750
  "step": 41000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5751
  }
5752
  ],
5753
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.7280309589864112,
6
  "eval_steps": 500,
7
+ "global_step": 41200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
5748
  "learning_rate": 1.532170976419077e-05,
5749
  "loss": 0.2834,
5750
  "step": 41000
5751
+ },
5752
+ {
5753
+ "epoch": 0.7253803608347618,
5754
+ "grad_norm": 2.0050973892211914,
5755
+ "learning_rate": 1.5272623745852232e-05,
5756
+ "loss": 0.2776,
5757
+ "step": 41050
5758
+ },
5759
+ {
5760
+ "epoch": 0.7262638935519782,
5761
+ "grad_norm": 1.4293886423110962,
5762
+ "learning_rate": 1.5223537727513695e-05,
5763
+ "loss": 0.2924,
5764
+ "step": 41100
5765
+ },
5766
+ {
5767
+ "epoch": 0.7271474262691947,
5768
+ "grad_norm": 1.5391188859939575,
5769
+ "learning_rate": 1.5174451709175158e-05,
5770
+ "loss": 0.3982,
5771
+ "step": 41150
5772
+ },
5773
+ {
5774
+ "epoch": 0.7280309589864112,
5775
+ "grad_norm": 1.4493207931518555,
5776
+ "learning_rate": 1.5125365690836625e-05,
5777
+ "loss": 0.3379,
5778
+ "step": 41200
5779
  }
5780
  ],
5781
  "logging_steps": 50,