nbv_reconstruction/configs/server/train_config.yaml

95 lines
2.0 KiB
YAML
Raw Normal View History

2024-08-22 22:28:20 +08:00
runner:
general:
seed: 0
2024-09-12 15:11:09 +08:00
device: cuda
2024-08-22 22:28:20 +08:00
cuda_visible_devices: "0,1,2,3,4,5,6,7"
2024-09-12 15:11:09 +08:00
parallel: False
2024-08-22 22:28:20 +08:00
experiment:
2024-09-12 15:11:09 +08:00
name: test_overfit
2024-08-22 22:28:20 +08:00
root_dir: "experiments"
use_checkpoint: False
epoch: -1 # -1 stands for last epoch
2024-09-12 15:11:09 +08:00
max_epochs: 5000
save_checkpoint_interval: 1
test_first: False
2024-08-22 22:28:20 +08:00
train:
optimizer:
type: Adam
lr: 0.0001
losses:
2024-09-12 15:11:09 +08:00
- gf_loss
dataset: OmniObject3d_train
test:
frequency: 3 # test frequency
2024-08-22 22:28:20 +08:00
dataset_list:
2024-09-12 15:11:09 +08:00
- OmniObject3d_test
pipeline: nbv_reconstruction_pipeline
2024-08-22 22:28:20 +08:00
2024-09-12 15:11:09 +08:00
dataset:
2024-09-02 18:21:38 +08:00
OmniObject3d_train:
2024-09-13 09:40:08 +00:00
root_dir: "../data/sample_for_training/scenes"
2024-09-12 15:11:09 +08:00
source: nbv_reconstruction_dataset
2024-09-13 09:40:08 +00:00
split_file: "../data/sample_for_training/OmniObject3d_train.txt"
ratio: 1.0
batch_size: 1
num_workers: 12
2024-09-12 15:11:09 +08:00
pts_num: 4096
2024-09-02 18:21:38 +08:00
OmniObject3d_test:
2024-09-13 09:40:08 +00:00
root_dir: "../data/sample_for_training/scenes"
2024-09-12 15:11:09 +08:00
source: nbv_reconstruction_dataset
2024-09-13 09:40:08 +00:00
split_file: "../data/sample_for_training/OmniObject3d_train.txt"
eval_list:
- pose_diff
2024-09-12 15:11:09 +08:00
ratio: 0.1
batch_size: 1
num_workers: 1
2024-09-12 15:11:09 +08:00
pts_num: 4096
2024-09-12 15:11:09 +08:00
pipeline:
nbv_reconstruction_pipeline:
pts_encoder: pointnet_encoder
seq_encoder: transformer_seq_encoder
pose_encoder: pose_encoder
view_finder: gf_view_finder
module:
pointnet_encoder:
in_dim: 3
out_dim: 1024
global_feat: True
feature_transform: False
transformer_seq_encoder:
pts_embed_dim: 1024
pose_embed_dim: 256
2024-09-13 09:40:08 +00:00
num_heads: 4
ffn_dim: 256
num_layers: 3
output_dim: 2048
gf_view_finder:
2024-09-12 15:11:09 +08:00
t_feat_dim: 128
pose_feat_dim: 256
2024-09-13 09:40:08 +00:00
main_feat_dim: 2048
regression_head: Rx_Ry_and_T
pose_mode: rot_matrix
per_point_feature: False
sample_mode: ode
sampling_steps: 500
sde_mode: ve
2024-08-22 22:28:20 +08:00
pose_encoder:
pose_dim: 9
2024-09-12 15:11:09 +08:00
out_dim: 256
loss_function:
gf_loss:
evaluation_method:
pose_diff: