mirror of
https://github.com/facebookresearch/pytorch3d.git
synced 2025-07-31 10:52:50 +08:00
Summary: Copy code from NeRF for loading LLFF data and blender synthetic data, and create dataset objects for them Reviewed By: shapovalov Differential Revision: D35581039 fbshipit-source-id: af7a6f3e9a42499700693381b5b147c991f57e5d
368 lines
9.6 KiB
YAML
368 lines
9.6 KiB
YAML
generic_model_args:
|
|
mask_images: true
|
|
mask_depths: true
|
|
render_image_width: 400
|
|
render_image_height: 400
|
|
mask_threshold: 0.5
|
|
output_rasterized_mc: false
|
|
bg_color:
|
|
- 0.0
|
|
- 0.0
|
|
- 0.0
|
|
num_passes: 1
|
|
chunk_size_grid: 4096
|
|
render_features_dimensions: 3
|
|
tqdm_trigger_threshold: 16
|
|
n_train_target_views: 1
|
|
sampling_mode_training: mask_sample
|
|
sampling_mode_evaluation: full_grid
|
|
raysampler_class_type: AdaptiveRaySampler
|
|
renderer_class_type: MultiPassEmissionAbsorptionRenderer
|
|
image_feature_extractor_class_type: null
|
|
view_pooler_enabled: false
|
|
implicit_function_class_type: NeuralRadianceFieldImplicitFunction
|
|
loss_weights:
|
|
loss_rgb_mse: 1.0
|
|
loss_prev_stage_rgb_mse: 1.0
|
|
loss_mask_bce: 0.0
|
|
loss_prev_stage_mask_bce: 0.0
|
|
log_vars:
|
|
- loss_rgb_psnr_fg
|
|
- loss_rgb_psnr
|
|
- loss_rgb_mse
|
|
- loss_rgb_huber
|
|
- loss_depth_abs
|
|
- loss_depth_abs_fg
|
|
- loss_mask_neg_iou
|
|
- loss_mask_bce
|
|
- loss_mask_beta_prior
|
|
- loss_eikonal
|
|
- loss_density_tv
|
|
- loss_depth_neg_penalty
|
|
- loss_autodecoder_norm
|
|
- loss_prev_stage_rgb_mse
|
|
- loss_prev_stage_rgb_psnr_fg
|
|
- loss_prev_stage_rgb_psnr
|
|
- loss_prev_stage_mask_bce
|
|
- objective
|
|
- epoch
|
|
- sec/it
|
|
sequence_autodecoder_args:
|
|
encoding_dim: 0
|
|
n_instances: 0
|
|
init_scale: 1.0
|
|
ignore_input: false
|
|
raysampler_AdaptiveRaySampler_args:
|
|
image_width: 400
|
|
image_height: 400
|
|
sampling_mode_training: mask_sample
|
|
sampling_mode_evaluation: full_grid
|
|
n_pts_per_ray_training: 64
|
|
n_pts_per_ray_evaluation: 64
|
|
n_rays_per_image_sampled_from_mask: 1024
|
|
stratified_point_sampling_training: true
|
|
stratified_point_sampling_evaluation: false
|
|
scene_extent: 8.0
|
|
scene_center:
|
|
- 0.0
|
|
- 0.0
|
|
- 0.0
|
|
raysampler_NearFarRaySampler_args:
|
|
image_width: 400
|
|
image_height: 400
|
|
sampling_mode_training: mask_sample
|
|
sampling_mode_evaluation: full_grid
|
|
n_pts_per_ray_training: 64
|
|
n_pts_per_ray_evaluation: 64
|
|
n_rays_per_image_sampled_from_mask: 1024
|
|
stratified_point_sampling_training: true
|
|
stratified_point_sampling_evaluation: false
|
|
min_depth: 0.1
|
|
max_depth: 8.0
|
|
renderer_LSTMRenderer_args:
|
|
num_raymarch_steps: 10
|
|
init_depth: 17.0
|
|
init_depth_noise_std: 0.0005
|
|
hidden_size: 16
|
|
n_feature_channels: 256
|
|
verbose: false
|
|
renderer_MultiPassEmissionAbsorptionRenderer_args:
|
|
raymarcher_class_type: EmissionAbsorptionRaymarcher
|
|
n_pts_per_ray_fine_training: 64
|
|
n_pts_per_ray_fine_evaluation: 64
|
|
stratified_sampling_coarse_training: true
|
|
stratified_sampling_coarse_evaluation: false
|
|
append_coarse_samples_to_fine: true
|
|
density_noise_std_train: 0.0
|
|
return_weights: false
|
|
raymarcher_CumsumRaymarcher_args:
|
|
surface_thickness: 1
|
|
bg_color:
|
|
- 0.0
|
|
background_opacity: 0.0
|
|
density_relu: true
|
|
blend_output: false
|
|
raymarcher_EmissionAbsorptionRaymarcher_args:
|
|
surface_thickness: 1
|
|
bg_color:
|
|
- 0.0
|
|
background_opacity: 10000000000.0
|
|
density_relu: true
|
|
blend_output: false
|
|
renderer_SignedDistanceFunctionRenderer_args:
|
|
render_features_dimensions: 3
|
|
ray_tracer_args:
|
|
object_bounding_sphere: 1.0
|
|
sdf_threshold: 5.0e-05
|
|
line_search_step: 0.5
|
|
line_step_iters: 1
|
|
sphere_tracing_iters: 10
|
|
n_steps: 100
|
|
n_secant_steps: 8
|
|
ray_normal_coloring_network_args:
|
|
feature_vector_size: 3
|
|
mode: idr
|
|
d_in: 9
|
|
d_out: 3
|
|
dims:
|
|
- 512
|
|
- 512
|
|
- 512
|
|
- 512
|
|
weight_norm: true
|
|
n_harmonic_functions_dir: 0
|
|
pooled_feature_dim: 0
|
|
bg_color:
|
|
- 0.0
|
|
soft_mask_alpha: 50.0
|
|
image_feature_extractor_ResNetFeatureExtractor_args:
|
|
name: resnet34
|
|
pretrained: true
|
|
stages:
|
|
- 1
|
|
- 2
|
|
- 3
|
|
- 4
|
|
normalize_image: true
|
|
image_rescale: 0.16
|
|
first_max_pool: true
|
|
proj_dim: 32
|
|
l2_norm: true
|
|
add_masks: true
|
|
add_images: true
|
|
global_average_pool: false
|
|
feature_rescale: 1.0
|
|
view_pooler_args:
|
|
feature_aggregator_class_type: AngleWeightedReductionFeatureAggregator
|
|
view_sampler_args:
|
|
masked_sampling: false
|
|
sampling_mode: bilinear
|
|
feature_aggregator_AngleWeightedIdentityFeatureAggregator_args:
|
|
exclude_target_view: true
|
|
exclude_target_view_mask_features: true
|
|
concatenate_output: true
|
|
weight_by_ray_angle_gamma: 1.0
|
|
min_ray_angle_weight: 0.1
|
|
feature_aggregator_AngleWeightedReductionFeatureAggregator_args:
|
|
exclude_target_view: true
|
|
exclude_target_view_mask_features: true
|
|
concatenate_output: true
|
|
reduction_functions:
|
|
- AVG
|
|
- STD
|
|
weight_by_ray_angle_gamma: 1.0
|
|
min_ray_angle_weight: 0.1
|
|
feature_aggregator_IdentityFeatureAggregator_args:
|
|
exclude_target_view: true
|
|
exclude_target_view_mask_features: true
|
|
concatenate_output: true
|
|
feature_aggregator_ReductionFeatureAggregator_args:
|
|
exclude_target_view: true
|
|
exclude_target_view_mask_features: true
|
|
concatenate_output: true
|
|
reduction_functions:
|
|
- AVG
|
|
- STD
|
|
implicit_function_IdrFeatureField_args:
|
|
feature_vector_size: 3
|
|
d_in: 3
|
|
d_out: 1
|
|
dims:
|
|
- 512
|
|
- 512
|
|
- 512
|
|
- 512
|
|
- 512
|
|
- 512
|
|
- 512
|
|
- 512
|
|
geometric_init: true
|
|
bias: 1.0
|
|
skip_in: []
|
|
weight_norm: true
|
|
n_harmonic_functions_xyz: 0
|
|
pooled_feature_dim: 0
|
|
encoding_dim: 0
|
|
implicit_function_NeRFormerImplicitFunction_args:
|
|
n_harmonic_functions_xyz: 10
|
|
n_harmonic_functions_dir: 4
|
|
n_hidden_neurons_dir: 128
|
|
latent_dim: 0
|
|
input_xyz: true
|
|
xyz_ray_dir_in_camera_coords: false
|
|
color_dim: 3
|
|
transformer_dim_down_factor: 2.0
|
|
n_hidden_neurons_xyz: 80
|
|
n_layers_xyz: 2
|
|
append_xyz:
|
|
- 1
|
|
implicit_function_NeuralRadianceFieldImplicitFunction_args:
|
|
n_harmonic_functions_xyz: 10
|
|
n_harmonic_functions_dir: 4
|
|
n_hidden_neurons_dir: 128
|
|
latent_dim: 0
|
|
input_xyz: true
|
|
xyz_ray_dir_in_camera_coords: false
|
|
color_dim: 3
|
|
transformer_dim_down_factor: 1.0
|
|
n_hidden_neurons_xyz: 256
|
|
n_layers_xyz: 8
|
|
append_xyz:
|
|
- 5
|
|
implicit_function_SRNHyperNetImplicitFunction_args:
|
|
hypernet_args:
|
|
n_harmonic_functions: 3
|
|
n_hidden_units: 256
|
|
n_layers: 2
|
|
n_hidden_units_hypernet: 256
|
|
n_layers_hypernet: 1
|
|
in_features: 3
|
|
out_features: 256
|
|
latent_dim_hypernet: 0
|
|
latent_dim: 0
|
|
xyz_in_camera_coords: false
|
|
pixel_generator_args:
|
|
n_harmonic_functions: 4
|
|
n_hidden_units: 256
|
|
n_hidden_units_color: 128
|
|
n_layers: 2
|
|
in_features: 256
|
|
out_features: 3
|
|
ray_dir_in_camera_coords: false
|
|
implicit_function_SRNImplicitFunction_args:
|
|
raymarch_function_args:
|
|
n_harmonic_functions: 3
|
|
n_hidden_units: 256
|
|
n_layers: 2
|
|
in_features: 3
|
|
out_features: 256
|
|
latent_dim: 0
|
|
xyz_in_camera_coords: false
|
|
raymarch_function: null
|
|
pixel_generator_args:
|
|
n_harmonic_functions: 4
|
|
n_hidden_units: 256
|
|
n_hidden_units_color: 128
|
|
n_layers: 2
|
|
in_features: 256
|
|
out_features: 3
|
|
ray_dir_in_camera_coords: false
|
|
solver_args:
|
|
breed: adam
|
|
weight_decay: 0.0
|
|
lr_policy: multistep
|
|
lr: 0.0005
|
|
gamma: 0.1
|
|
momentum: 0.9
|
|
betas:
|
|
- 0.9
|
|
- 0.999
|
|
milestones: []
|
|
max_epochs: 1000
|
|
data_source_args:
|
|
dataset_map_provider_class_type: ???
|
|
data_loader_map_provider_class_type: SequenceDataLoaderMapProvider
|
|
dataset_map_provider_BlenderDatasetMapProvider_args:
|
|
base_dir: ???
|
|
object_name: ???
|
|
path_manager_factory_class_type: PathManagerFactory
|
|
n_known_frames_for_test: null
|
|
path_manager_factory_PathManagerFactory_args:
|
|
silence_logs: true
|
|
dataset_map_provider_JsonIndexDatasetMapProvider_args:
|
|
category: ???
|
|
task_str: singlesequence
|
|
dataset_root: ''
|
|
n_frames_per_sequence: -1
|
|
test_on_train: false
|
|
restrict_sequence_name: []
|
|
test_restrict_sequence_id: -1
|
|
assert_single_seq: false
|
|
only_test_set: false
|
|
dataset_class_type: JsonIndexDataset
|
|
path_manager_factory_class_type: PathManagerFactory
|
|
dataset_JsonIndexDataset_args:
|
|
limit_to: 0
|
|
limit_sequences_to: 0
|
|
exclude_sequence: []
|
|
limit_category_to: []
|
|
load_images: true
|
|
load_depths: true
|
|
load_depth_masks: true
|
|
load_masks: true
|
|
load_point_clouds: false
|
|
max_points: 0
|
|
mask_images: false
|
|
mask_depths: false
|
|
image_height: 800
|
|
image_width: 800
|
|
box_crop: true
|
|
box_crop_mask_thr: 0.4
|
|
box_crop_context: 0.3
|
|
remove_empty_masks: true
|
|
seed: 0
|
|
sort_frames: false
|
|
path_manager_factory_PathManagerFactory_args:
|
|
silence_logs: true
|
|
dataset_map_provider_LlffDatasetMapProvider_args:
|
|
base_dir: ???
|
|
object_name: ???
|
|
path_manager_factory_class_type: PathManagerFactory
|
|
n_known_frames_for_test: null
|
|
path_manager_factory_PathManagerFactory_args:
|
|
silence_logs: true
|
|
data_loader_map_provider_SequenceDataLoaderMapProvider_args:
|
|
batch_size: 1
|
|
num_workers: 0
|
|
dataset_len: 1000
|
|
dataset_len_val: 1
|
|
images_per_seq_options:
|
|
- 2
|
|
sample_consecutive_frames: false
|
|
consecutive_frames_max_gap: 0
|
|
consecutive_frames_max_gap_seconds: 0.1
|
|
architecture: generic
|
|
detect_anomaly: false
|
|
eval_only: false
|
|
exp_dir: ./data/default_experiment/
|
|
exp_idx: 0
|
|
gpu_idx: 0
|
|
metric_print_interval: 5
|
|
resume: true
|
|
resume_epoch: -1
|
|
seed: 0
|
|
store_checkpoints: true
|
|
store_checkpoints_purge: 1
|
|
test_interval: -1
|
|
test_when_finished: false
|
|
validation_interval: 1
|
|
visdom_env: ''
|
|
visdom_port: 8097
|
|
visdom_server: http://127.0.0.1
|
|
visualize_interval: 1000
|
|
clip_grad: 0.0
|
|
hydra:
|
|
run:
|
|
dir: .
|
|
output_subdir: null
|