guyhadad01 committed on
Commit
34441e4
·
verified ·
1 Parent(s): 1768eba

Training in progress, step 37000, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1253,6 +1253,10 @@ You can finetune this model on your own dataset.
1253
  | 0.6485 | 36700 | 0.3111 |
1254
  | 0.6494 | 36750 | 0.3299 |
1255
  | 0.6503 | 36800 | 0.3994 |
 
 
 
 
1256
 
1257
 
1258
  ### Framework Versions
 
1253
  | 0.6485 | 36700 | 0.3111 |
1254
  | 0.6494 | 36750 | 0.3299 |
1255
  | 0.6503 | 36800 | 0.3994 |
1256
+ | 0.6512 | 36850 | 0.3595 |
1257
+ | 0.6520 | 36900 | 0.3572 |
1258
+ | 0.6529 | 36950 | 0.3085 |
1259
+ | 0.6538 | 37000 | 0.2647 |
1260
 
1261
 
1262
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a4bf73f234398da4bc2354c62f35d8522fb992fe0cc8508b01e537eeb46ba200
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5aa3e074a25abb8c340316265b8419fb45e38d5ea71e4312b6d0194cb38cc86b
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:deab99f5ed27bec630b2e3f842027b1cc6d0187c2406e2f581cb275f3a90e563
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a86c17b77d1cfac3584af9a6619882b78c1f9bc7dcb85e0259432165076b9f36
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b55608d8af777fe7d98d4ef8f564bad9679b83c0050069b201bb564a1ddf9edd
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3da82f98ab298f77c390cd353b9bced87815dd73e91293360907ff091eb61d4e
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e7ed611a4947df61c53bc83c6d678cf93c3033600c02343412dcb7919a293d43
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:952a0b2337ddfcc5838b84a78a584c51460d6072b3d324731f0a62584e450719
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0a56ae9bbdefa7bba62bf8ab81e508fcd56be09ecc92cd7e39c632b1b315132f
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a249cc3fbdfe88ea20fb6dbfcb1191ec424d82ef41e7dafc1d1c85f14b5994e9
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.6502800798713576,
6
  "eval_steps": 500,
7
- "global_step": 36800,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -5160,6 +5160,34 @@
5160
  "learning_rate": 1.9442971863894287e-05,
5161
  "loss": 0.3994,
5162
  "step": 36800
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5163
  }
5164
  ],
5165
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.6538142107402237,
6
  "eval_steps": 500,
7
+ "global_step": 37000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
5160
  "learning_rate": 1.9442971863894287e-05,
5161
  "loss": 0.3994,
5162
  "step": 36800
5163
+ },
5164
+ {
5165
+ "epoch": 0.6511636125885741,
5166
+ "grad_norm": 2.2977466583251953,
5167
+ "learning_rate": 1.9393885845555755e-05,
5168
+ "loss": 0.3595,
5169
+ "step": 36850
5170
+ },
5171
+ {
5172
+ "epoch": 0.6520471453057907,
5173
+ "grad_norm": 1.6370161771774292,
5174
+ "learning_rate": 1.9344799827217217e-05,
5175
+ "loss": 0.3572,
5176
+ "step": 36900
5177
+ },
5178
+ {
5179
+ "epoch": 0.6529306780230072,
5180
+ "grad_norm": 1.4357324838638306,
5181
+ "learning_rate": 1.9295713808878678e-05,
5182
+ "loss": 0.3085,
5183
+ "step": 36950
5184
+ },
5185
+ {
5186
+ "epoch": 0.6538142107402237,
5187
+ "grad_norm": 1.8057055473327637,
5188
+ "learning_rate": 1.9246627790540143e-05,
5189
+ "loss": 0.2647,
5190
+ "step": 37000
5191
  }
5192
  ],
5193
  "logging_steps": 50,