| """Contains different Gaussian predictors. |
| |
| For licensing see accompanying LICENSE file. |
| Copyright (C) 2025 Apple Inc. All Rights Reserved. |
| """ |
|
|
| from __future__ import annotations |
|
|
| from sharp.models.monodepth import ( |
| create_monodepth_adaptor, |
| create_monodepth_dpt, |
| ) |
|
|
| from .alignment import create_alignment |
| from .composer import GaussianComposer |
| from .gaussian_decoder import create_gaussian_decoder |
| from .heads import DirectPredictionHead |
| from .initializer import create_initializer |
| from .params import PredictorParams |
| from .predictor import RGBGaussianPredictor |
|
|
|
|
| def create_predictor(params: PredictorParams) -> RGBGaussianPredictor: |
| """Create gaussian predictor model specified by name.""" |
| if params.gaussian_decoder.stride < params.initializer.stride: |
| raise ValueError( |
| "We donot expected gaussian_decoder has higher resolution than initializer." |
| ) |
|
|
| scale_factor = params.gaussian_decoder.stride // params.initializer.stride |
| gaussian_composer = GaussianComposer( |
| delta_factor=params.delta_factor, |
| min_scale=params.min_scale, |
| max_scale=params.max_scale, |
| color_activation_type=params.color_activation_type, |
| opacity_activation_type=params.opacity_activation_type, |
| color_space=params.color_space, |
| scale_factor=scale_factor, |
| base_scale_on_predicted_mean=params.base_scale_on_predicted_mean, |
| ) |
| if params.num_monodepth_layers > 1 and params.initializer.num_layers != 2: |
| raise KeyError("We only support num_layers = 2 when num_monodepth_layers > 1.") |
|
|
| monodepth_model = create_monodepth_dpt(params.monodepth) |
| monodepth_adaptor = create_monodepth_adaptor( |
| monodepth_model, |
| params.monodepth_adaptor, |
| params.num_monodepth_layers, |
| params.sorting_monodepth, |
| ) |
|
|
| if params.num_monodepth_layers == 2: |
| monodepth_adaptor.replicate_head(params.num_monodepth_layers) |
|
|
| gaussian_decoder = create_gaussian_decoder( |
| params.gaussian_decoder, |
| dims_depth_features=monodepth_adaptor.get_feature_dims(), |
| ) |
| initializer = create_initializer( |
| params.initializer, |
| ) |
| prediction_head = DirectPredictionHead( |
| feature_dim=gaussian_decoder.dim_out, num_layers=initializer.num_layers |
| ) |
| decoder_dim = monodepth_model.decoder.dims_decoder[-1] |
| return RGBGaussianPredictor( |
| init_model=initializer, |
| feature_model=gaussian_decoder, |
| prediction_head=prediction_head, |
| monodepth_model=monodepth_adaptor, |
| gaussian_composer=gaussian_composer, |
| scale_map_estimator=create_alignment(params.depth_alignment, depth_decoder_dim=decoder_dim), |
| ) |
|
|
|
|
| __all__ = [ |
| "PredictorParams", |
| "create_predictor", |
| ] |
|
|