# experiment.yaml
# Settings for the generic model. Each `*_class_type` key names one
# implementation; the `<role>_<ClassName>_args` mappings later in this section
# appear to hold the arguments for each candidate class
# (NOTE(review): confirm against the config consumer).
generic_model_args:
  mask_images: true
  mask_depths: true
  # Render size; both raysampler_*_args mappings in this section repeat 400x400.
  render_image_width: 400
  render_image_height: 400
  mask_threshold: 0.5
  output_rasterized_mc: false
  # Three components, all zero.
  bg_color: [0.0, 0.0, 0.0]
  num_passes: 1
  chunk_size_grid: 4096
  render_features_dimensions: 3
  tqdm_trigger_threshold: 16
  n_train_target_views: 1
  # The same two sampling modes are repeated in both raysampler_*_args mappings.
  sampling_mode_training: mask_sample
  sampling_mode_evaluation: full_grid
  # Implementation choices for this experiment.
  raysampler_class_type: AdaptiveRaySampler
  renderer_class_type: MultiPassEmissionAbsorptionRenderer
  # No image feature extractor is named, and view pooling is switched off.
  image_feature_extractor_class_type: null
  view_pooler_enabled: false
  implicit_function_class_type: NeuralRadianceFieldImplicitFunction
  # Per-loss weights. Only the two RGB MSE terms are non-zero; both mask BCE
  # terms are weighted 0.0. All four names also appear in log_vars.
  loss_weights:
    loss_rgb_mse: 1.0
    loss_prev_stage_rgb_mse: 1.0
    loss_mask_bce: 0.0
    loss_prev_stage_mask_bce: 0.0
  # Names of the quantities to log. The list holds more loss names than
  # loss_weights assigns a weight to.
  # NOTE(review): entry order is left exactly as found in case the consumer
  # depends on it — confirm.
  log_vars:
  - loss_rgb_psnr_fg
  - loss_rgb_psnr
  - loss_rgb_mse
  - loss_rgb_huber
  - loss_depth_abs
  - loss_depth_abs_fg
  - loss_mask_neg_iou
  - loss_mask_bce
  - loss_mask_beta_prior
  - loss_eikonal
  - loss_density_tv
  - loss_depth_neg_penalty
  - loss_autodecoder_norm
  # Entries with the `prev_stage` infix mirror four of the names above.
  - loss_prev_stage_rgb_mse
  - loss_prev_stage_rgb_psnr_fg
  - loss_prev_stage_rgb_psnr
  - loss_prev_stage_mask_bce
  # Entries that do not carry the `loss_` prefix.
  - objective
  - epoch
  - sec/it
  # Sequence autodecoder arguments. encoding_dim and n_instances are both 0
  # here (presumably leaving the autodecoder inactive — TODO confirm).
  sequence_autodecoder_args:
    encoding_dim: 0
    n_instances: 0
    init_scale: 1.0
    ignore_input: false
  # Arguments for AdaptiveRaySampler, the class named by raysampler_class_type.
  # Image size and sampling modes repeat the values set at the top of
  # generic_model_args.
  raysampler_AdaptiveRaySampler_args:
    image_width: 400
    image_height: 400
    sampling_mode_training: mask_sample
    sampling_mode_evaluation: full_grid
    # Same per-ray point count for training and evaluation.
    n_pts_per_ray_training: 64
    n_pts_per_ray_evaluation: 64
    n_rays_per_image_sampled_from_mask: 1024
    # Stratified point sampling is on for training only.
    stratified_point_sampling_training: true
    stratified_point_sampling_evaluation: false
    # Scene described by an extent and a center at the origin; the NearFar
    # sampler mapping uses min_depth/max_depth in place of these two keys.
    scene_extent: 8.0
    scene_center: [0.0, 0.0, 0.0]
  # Arguments for NearFarRaySampler. raysampler_class_type names
  # AdaptiveRaySampler, so this mapping is presumably unused in this
  # experiment (TODO confirm). Its first nine keys carry the same values as
  # raysampler_AdaptiveRaySampler_args.
  raysampler_NearFarRaySampler_args:
    image_width: 400
    image_height: 400
    sampling_mode_training: mask_sample
    sampling_mode_evaluation: full_grid
    n_pts_per_ray_training: 64
    n_pts_per_ray_evaluation: 64
    n_rays_per_image_sampled_from_mask: 1024
    stratified_point_sampling_training: true
    stratified_point_sampling_evaluation: false
    # Explicit depth bounds, used here instead of scene_extent/scene_center.
    min_depth: 0.1
    max_depth: 8.0
  # Arguments for LSTMRenderer. renderer_class_type names
  # MultiPassEmissionAbsorptionRenderer, so this mapping is presumably unused
  # in this experiment (TODO confirm).
  renderer_LSTMRenderer_args:
    num_raymarch_steps: 10
    init_depth: 17.0
    init_depth_noise_std: 0.0005
    hidden_size: 16
    n_feature_channels: 256
    verbose: false
  # Arguments for the renderer named by renderer_class_type.
  renderer_MultiPassEmissionAbsorptionRenderer_args:
    # Names one of the two raymarcher_*_args mappings nested below.
    raymarcher_class_type: EmissionAbsorptionRaymarcher
    n_pts_per_ray_fine_training: 64
    n_pts_per_ray_fine_evaluation: 64
    # Stratified coarse sampling is on for training only.
    stratified_sampling_coarse_training: true
    stratified_sampling_coarse_evaluation: false
    append_coarse_samples_to_fine: true
    density_noise_std_train: 0.0
    return_weights: false

    # Single-component bg_color, unlike the three-component bg_color at the top
    # of generic_model_args.
    raymarcher_EmissionAbsorptionRaymarcher_args:
      surface_thickness: 1
      bg_color: [0.0]
      background_opacity: 10000000000.0
      density_relu: true
      blend_output: false

    # Same values as the mapping above except for background_opacity.
    raymarcher_CumsumRaymarcher_args:
      surface_thickness: 1
      bg_color: [0.0]
      background_opacity: 0.0
      density_relu: true
      blend_output: false
  # Arguments for SignedDistanceFunctionRenderer. renderer_class_type names
  # MultiPassEmissionAbsorptionRenderer, so this mapping is presumably unused
  # in this experiment (TODO confirm).
  renderer_SignedDistanceFunctionRenderer_args:
    render_features_dimensions: 3

    ray_tracer_args:
      object_bounding_sphere: 1.0
      sdf_threshold: 5.0e-05
      line_search_step: 0.5
      line_step_iters: 1
      sphere_tracing_iters: 10
      n_steps: 100
      n_secant_steps: 8

    ray_normal_coloring_network_args:
      feature_vector_size: 3
      mode: idr
      d_in: 9
      d_out: 3
      # Four entries of 512.
      dims: [512, 512, 512, 512]
      weight_norm: true
      n_harmonic_functions_dir: 0
      pooled_feature_dim: 0

    # Single-component background color.
    bg_color: [0.0]
    soft_mask_alpha: 50.0
  # Arguments for ResNetFeatureExtractor. image_feature_extractor_class_type
  # is null at the top of generic_model_args, so this mapping is presumably
  # unused in this experiment (TODO confirm).
  image_feature_extractor_ResNetFeatureExtractor_args:
    name: resnet34
    pretrained: true
    # Stage indices 1 through 4.
    stages: [1, 2, 3, 4]
    normalize_image: true
    image_rescale: 0.16
    first_max_pool: true
    proj_dim: 32
    l2_norm: true
    add_masks: true
    add_images: true
    global_average_pool: false
    feature_rescale: 1.0
  # View pooler arguments. view_pooler_enabled is false at the top of
  # generic_model_args, so this mapping is presumably unused in this
  # experiment (TODO confirm).
  view_pooler_args:
    # Names one of the four feature_aggregator_*_args mappings below.
    feature_aggregator_class_type: AngleWeightedReductionFeatureAggregator

    view_sampler_args:
      masked_sampling: false
      sampling_mode: bilinear

    # All four aggregator mappings share the same three boolean flags.
    feature_aggregator_IdentityFeatureAggregator_args:
      exclude_target_view: true
      exclude_target_view_mask_features: true
      concatenate_output: true

    # The Reduction variants add reduction_functions.
    feature_aggregator_ReductionFeatureAggregator_args:
      exclude_target_view: true
      exclude_target_view_mask_features: true
      concatenate_output: true
      reduction_functions: [AVG, STD]

    # The AngleWeighted variants add the two ray-angle weighting keys.
    feature_aggregator_AngleWeightedReductionFeatureAggregator_args:
      exclude_target_view: true
      exclude_target_view_mask_features: true
      concatenate_output: true
      reduction_functions: [AVG, STD]
      weight_by_ray_angle_gamma: 1.0
      min_ray_angle_weight: 0.1

    feature_aggregator_AngleWeightedIdentityFeatureAggregator_args:
      exclude_target_view: true
      exclude_target_view_mask_features: true
      concatenate_output: true
      weight_by_ray_angle_gamma: 1.0
      min_ray_angle_weight: 0.1
  # Arguments for IdrFeatureField. implicit_function_class_type names
  # NeuralRadianceFieldImplicitFunction, so this mapping is presumably unused
  # in this experiment (TODO confirm).
  implicit_function_IdrFeatureField_args:
    feature_vector_size: 3
    d_in: 3
    d_out: 1
    # Eight entries of 512.
    dims: [512, 512, 512, 512, 512, 512, 512, 512]
    geometric_init: true
    bias: 1.0
    # Empty list.
    skip_in: []
    weight_norm: true
    n_harmonic_functions_xyz: 0
    pooled_feature_dim: 0
    encoding_dim: 0
  # Arguments for the implicit function named by implicit_function_class_type.
  # Uses the same key set as implicit_function_NeRFormerImplicitFunction_args.
  implicit_function_NeuralRadianceFieldImplicitFunction_args:
    n_harmonic_functions_xyz: 10
    n_harmonic_functions_dir: 4
    n_hidden_neurons_dir: 128
    latent_dim: 0
    input_xyz: true
    xyz_ray_dir_in_camera_coords: false
    color_dim: 3
    transformer_dim_down_factor: 1.0
    n_hidden_neurons_xyz: 256
    n_layers_xyz: 8
    # Single entry.
    append_xyz: [5]
  # Arguments for NeRFormerImplicitFunction. implicit_function_class_type
  # names NeuralRadianceFieldImplicitFunction, so this mapping is presumably
  # unused in this experiment (TODO confirm).
  implicit_function_NeRFormerImplicitFunction_args:
    n_harmonic_functions_xyz: 10
    n_harmonic_functions_dir: 4
    n_hidden_neurons_dir: 128
    latent_dim: 0
    input_xyz: true
    xyz_ray_dir_in_camera_coords: false
    color_dim: 3
    # The remaining four values are where this mapping differs from
    # implicit_function_NeuralRadianceFieldImplicitFunction_args.
    transformer_dim_down_factor: 2.0
    n_hidden_neurons_xyz: 80
    n_layers_xyz: 2
    append_xyz: [1]
  # Arguments for SRNImplicitFunction. implicit_function_class_type names
  # NeuralRadianceFieldImplicitFunction, so this mapping is presumably unused
  # in this experiment (TODO confirm).
  implicit_function_SRNImplicitFunction_args:
    raymarch_function_args:
      n_harmonic_functions: 3
      n_hidden_units: 256
      n_layers: 2
      in_features: 3
      # Same number as pixel_generator_args.in_features below.
      out_features: 256
      latent_dim: 0
      xyz_in_camera_coords: false
      raymarch_function: null
    pixel_generator_args:
      n_harmonic_functions: 4
      n_hidden_units: 256
      n_hidden_units_color: 128
      n_layers: 2
      in_features: 256
      out_features: 3
      ray_dir_in_camera_coords: false
  # Arguments for SRNHyperNetImplicitFunction. implicit_function_class_type
  # names NeuralRadianceFieldImplicitFunction, so this mapping is presumably
  # unused in this experiment (TODO confirm).
  implicit_function_SRNHyperNetImplicitFunction_args:
    hypernet_args:
      n_harmonic_functions: 3
      n_hidden_units: 256
      n_layers: 2
      n_hidden_units_hypernet: 256
      n_layers_hypernet: 1
      in_features: 3
      # Same number as pixel_generator_args.in_features below.
      out_features: 256
      latent_dim_hypernet: 0
      latent_dim: 0
      xyz_in_camera_coords: false
    # Carries the same values as the pixel_generator_args mapping inside
    # implicit_function_SRNImplicitFunction_args.
    pixel_generator_args:
      n_harmonic_functions: 4
      n_hidden_units: 256
      n_hidden_units_color: 128
      n_layers: 2
      in_features: 256
      out_features: 3
      ray_dir_in_camera_coords: false
# Optimizer and learning-rate schedule settings.
solver_args:
  breed: adam
  weight_decay: 0.0
  # The policy is `multistep`, but the milestones list below is empty, so this
  # file lists no steps at which gamma would be applied.
  lr_policy: multistep
  lr: 0.0005
  gamma: 0.1
  # NOTE(review): momentum is presumably only read for breeds other than
  # adam — confirm.
  momentum: 0.9
  betas: [0.9, 0.999]
  milestones: []
  max_epochs: 1000
# Dataset and data-loader settings. `???` is OmegaConf's marker for a mandatory
# value that has not been set: dataset_map_provider_class_type and category
# must be supplied (e.g. by an override) before they are read.
data_source_args:
  dataset_map_provider_class_type: ???
  data_loader_map_provider_class_type: SequenceDataLoaderMapProvider

  # The only dataset map provider with arguments in this file.
  dataset_map_provider_JsonIndexDatasetMapProvider_args:
    category: ???
    task_str: singlesequence
    # Empty string.
    dataset_root: ''
    # NOTE(review): the -1 values below look like "no limit / not set"
    # sentinels — confirm with the consumer.
    limit_to: -1
    limit_sequences_to: -1
    n_frames_per_sequence: -1
    test_on_train: false
    load_point_clouds: false
    # Both masking flags are false here, while generic_model_args sets its own
    # mask_images / mask_depths to true.
    mask_images: false
    mask_depths: false
    restrict_sequence_name: []
    test_restrict_sequence_id: -1
    assert_single_seq: false
    only_test_set: false
    aux_dataset_kwargs:
      box_crop: true
      box_crop_context: 0.3
      # 800x800 here versus 400x400 for render_image_* in generic_model_args.
      image_width: 800
      image_height: 800
      remove_empty_masks: true
    path_manager: null

  # Arguments for the loader named by data_loader_map_provider_class_type.
  data_loader_map_provider_SequenceDataLoaderMapProvider_args:
    batch_size: 1
    num_workers: 0
    dataset_len: 1000
    dataset_len_val: 1
    # Single entry.
    images_per_seq_options: [2]
    sample_consecutive_frames: false
    consecutive_frames_max_gap: 0
    consecutive_frames_max_gap_seconds: 0.1
# Flat run-level settings for the experiment.
architecture: generic
detect_anomaly: false
eval_only: false
# Relative path.
exp_dir: ./data/default_experiment/
exp_idx: 0
gpu_idx: 0
metric_print_interval: 5
# NOTE(review): resume_epoch -1 and test_interval -1 look like sentinel
# values — confirm their meaning with the consumer.
resume: true
resume_epoch: -1
seed: 0
store_checkpoints: true
store_checkpoints_purge: 1
test_interval: -1
test_when_finished: false
validation_interval: 1
# Visdom connection settings; the environment name is an empty string and the
# server is a loopback address.
visdom_env: ''
visdom_port: 8097
visdom_server: http://127.0.0.1
visualize_interval: 1000
clip_grad: 0.0
# Hydra's own settings: the run directory is set to `.` and output_subdir to
# null (per the Hydra docs, a null output_subdir disables creation of the
# `.hydra` config-dump subdirectory).
hydra:
  run:
    dir: .
  output_subdir: null