Training in progress, step 37000, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
|
@@ -1253,6 +1253,10 @@ You can finetune this model on your own dataset.
|
|
| 1253 |
| 0.6485 | 36700 | 0.3111 |
|
| 1254 |
| 0.6494 | 36750 | 0.3299 |
|
| 1255 |
| 0.6503 | 36800 | 0.3994 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1256 |
|
| 1257 |
|
| 1258 |
### Framework Versions
|
|
|
|
| 1253 |
| 0.6485 | 36700 | 0.3111 |
|
| 1254 |
| 0.6494 | 36750 | 0.3299 |
|
| 1255 |
| 0.6503 | 36800 | 0.3994 |
|
| 1256 |
+
| 0.6512 | 36850 | 0.3595 |
|
| 1257 |
+
| 0.6520 | 36900 | 0.3572 |
|
| 1258 |
+
| 0.6529 | 36950 | 0.3085 |
|
| 1259 |
+
| 0.6538 | 37000 | 0.2647 |
|
| 1260 |
|
| 1261 |
|
| 1262 |
### Framework Versions
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 90864192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5aa3e074a25abb8c340316265b8419fb45e38d5ea71e4312b6d0194cb38cc86b
|
| 3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 180609210
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a86c17b77d1cfac3584af9a6619882b78c1f9bc7dcb85e0259432165076b9f36
|
| 3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3da82f98ab298f77c390cd353b9bced87815dd73e91293360907ff091eb61d4e
|
| 3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:952a0b2337ddfcc5838b84a78a584c51460d6072b3d324731f0a62584e450719
|
| 3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a249cc3fbdfe88ea20fb6dbfcb1191ec424d82ef41e7dafc1d1c85f14b5994e9
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -5160,6 +5160,34 @@
|
|
| 5160 |
"learning_rate": 1.9442971863894287e-05,
|
| 5161 |
"loss": 0.3994,
|
| 5162 |
"step": 36800
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 5163 |
}
|
| 5164 |
],
|
| 5165 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.6538142107402237,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 37000,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 5160 |
"learning_rate": 1.9442971863894287e-05,
|
| 5161 |
"loss": 0.3994,
|
| 5162 |
"step": 36800
|
| 5163 |
+
},
|
| 5164 |
+
{
|
| 5165 |
+
"epoch": 0.6511636125885741,
|
| 5166 |
+
"grad_norm": 2.2977466583251953,
|
| 5167 |
+
"learning_rate": 1.9393885845555755e-05,
|
| 5168 |
+
"loss": 0.3595,
|
| 5169 |
+
"step": 36850
|
| 5170 |
+
},
|
| 5171 |
+
{
|
| 5172 |
+
"epoch": 0.6520471453057907,
|
| 5173 |
+
"grad_norm": 1.6370161771774292,
|
| 5174 |
+
"learning_rate": 1.9344799827217217e-05,
|
| 5175 |
+
"loss": 0.3572,
|
| 5176 |
+
"step": 36900
|
| 5177 |
+
},
|
| 5178 |
+
{
|
| 5179 |
+
"epoch": 0.6529306780230072,
|
| 5180 |
+
"grad_norm": 1.4357324838638306,
|
| 5181 |
+
"learning_rate": 1.9295713808878678e-05,
|
| 5182 |
+
"loss": 0.3085,
|
| 5183 |
+
"step": 36950
|
| 5184 |
+
},
|
| 5185 |
+
{
|
| 5186 |
+
"epoch": 0.6538142107402237,
|
| 5187 |
+
"grad_norm": 1.8057055473327637,
|
| 5188 |
+
"learning_rate": 1.9246627790540143e-05,
|
| 5189 |
+
"loss": 0.2647,
|
| 5190 |
+
"step": 37000
|
| 5191 |
}
|
| 5192 |
],
|
| 5193 |
"logging_steps": 50,
|