|
cond_image_size: 512 |
|
|
|
image_tokenizer_cls: tsr.models.tokenizers.image.DINOSingleImageTokenizer |
|
image_tokenizer: |
|
pretrained_model_name_or_path: "facebook/dino-vitb16" |
|
|
|
tokenizer_cls: tsr.models.tokenizers.triplane.Triplane1DTokenizer |
|
tokenizer: |
|
plane_size: 32 |
|
num_channels: 1024 |
|
|
|
backbone_cls: tsr.models.transformer.transformer_1d.Transformer1D |
|
backbone: |
|
in_channels: ${tokenizer.num_channels} |
|
num_attention_heads: 16 |
|
attention_head_dim: 64 |
|
num_layers: 16 |
|
cross_attention_dim: 768 |
|
|
|
post_processor_cls: tsr.models.network_utils.TriplaneUpsampleNetwork |
|
post_processor: |
|
in_channels: 1024 |
|
out_channels: 40 |
|
|
|
decoder_cls: tsr.models.network_utils.NeRFMLP |
|
decoder: |
|
in_channels: 120 |
|
n_neurons: 64 |
|
n_hidden_layers: 9 |
|
activation: silu |
|
|
|
renderer_cls: tsr.models.nerf_renderer.TriplaneNeRFRenderer |
|
renderer: |
|
radius: 0.87 |
|
feature_reduction: concat |
|
density_activation: exp |
|
density_bias: -1.0 |
|
num_samples_per_ray: 128 |