{
  "train_file": "data/synthetic/train.jsonl",
  "validation_file": "data/synthetic/validation.jsonl",
  "test_file": null,
  "output_dir": "artifacts/tiny-router",
  "encoder_name": "microsoft/deberta-v3-small",
  "device": "auto",
  "feature_mode": "full_interaction",
  "pooling_type": "attention",
  "use_head_dependencies": true,
  "dependency_hidden_dim": 32,
  "max_length": 128,
  "recency_max": 3600,
  "batch_size": 32,
  "epochs": 20,
  "encoder_lr": 2e-05,
  "head_lr": 0.0001,
  "weight_decay": 0.01,
  "warmup_ratio": 0.1,
  "dropout": 0.1,
  "seed": 13,
  "patience": 2,
  "mixed_precision": false,
  "confidence_threshold": 0.8,
  "head_loss_weights": "{}"
}