Backfill manifest for add_sorl_abs1_500K
Browse files
add_sorl_abs1_500K/train_config.json
CHANGED
@@ -15,5 +15,14 @@
 "output_dir": "ckpt/sweep_20260406_1652/add_sorl1_500000",
 "device": "cuda",
 "push_to_hub": true,
-"no_wandb": false
+"no_wandb": false,
+"n_params": 167871744,
+"run_name": "add_sorl_abs1_500K",
+"git_commit": "pre-manifest",
+"timestamp": "2026-04-06",
+"tokenizer": "Qwen/Qwen3-0.6B",
+"dataset_repo": "thoughtworks/arithmetic-sorl-data",
+"dataset_config": "add_6digit",
+"model_repo": "thoughtworks/arithmetic-sorl",
+"trainer_version": "v6"
 }