{
  "activation": "swiglu",
  "bias": false,
  "dim_feedforward": 3072,
  "dpt_features": 128,
  "dpt_out_channels": [
    96,
    192,
    384,
    768
  ],
  "dpt_out_layers": null,
  "dropout": 0.0,
  "include_alpha": false,
  "latent_dim": 768,
  "norm_first": true,
  "norm_type": "rms_norm",
  "num_heads": 6,
  "num_layers": 12,
  "num_register_tokens": 16,
  "patch_size": 8,
  "pe_type": "rope",
  "qk_norm": true,
  "rope_double_max_freq": false,
  "rope_type": "triangle",
  "texture_channels": 13,
  "texture_encode_patch_size": 32,
  "texture_encoder_norm_type": "rms_norm",
  "turn_to_cam_coord": true,
  "use_dpt_decoder": true,
  "use_ldr": false,
  "use_vn_encoder": true,
  "vdir_num_freqs": 0,
  "vdir_pe_type": "nerf",
  "vertex_pe_num_freqs": 12,
  "view_indep_qk_norm": true,
  "view_transformer_ffn_hidden_dim": 3072,
  "view_transformer_include_self_attn": true,
  "view_transformer_latent_dim": 768,
  "view_transformer_n_heads": 6,
  "view_transformer_n_layers": 6,
  "view_transformer_use_swin_attn": false,
  "vn_encoder_norm_type": "rms_norm",
  "vn_pe_num_freqs": 6
}