mirror of
https://github.com/deepseek-ai/DreamCraft3D
synced 2024-12-04 18:15:11 +00:00
166 lines
4.5 KiB
YAML
166 lines
4.5 KiB
YAML
|
name: "dreamcraft3d-texture"
|
||
|
tag: "${rmspace:${system.prompt_processor.prompt},_}"
|
||
|
exp_root_dir: "outputs"
|
||
|
seed: 0
|
||
|
|
||
|
data_type: "single-image-datamodule"
|
||
|
data:
|
||
|
image_path: ./load/images/hamburger_rgba.png
|
||
|
height: 1024
|
||
|
width: 1024
|
||
|
default_elevation_deg: 0.0
|
||
|
default_azimuth_deg: 0.0
|
||
|
default_camera_distance: 3.8
|
||
|
default_fovy_deg: 20.0
|
||
|
requires_depth: false
|
||
|
requires_normal: false
|
||
|
use_mixed_camera_config: false
|
||
|
random_camera:
|
||
|
height: 1024
|
||
|
width: 1024
|
||
|
batch_size: 1
|
||
|
eval_height: 1024
|
||
|
eval_width: 1024
|
||
|
eval_batch_size: 1
|
||
|
elevation_range: [-10, 45]
|
||
|
azimuth_range: [-180, 180]
|
||
|
camera_distance_range: [3.8, 3.8]
|
||
|
fovy_range: [20.0, 20.0] # Zero123 has fixed fovy
|
||
|
progressive_until: 0
|
||
|
camera_perturb: 0.0
|
||
|
center_perturb: 0.0
|
||
|
up_perturb: 0.0
|
||
|
eval_elevation_deg: ${data.default_elevation_deg}
|
||
|
eval_camera_distance: ${data.default_camera_distance}
|
||
|
eval_fovy_deg: ${data.default_fovy_deg}
|
||
|
batch_uniform_azimuth: false
|
||
|
n_val_views: 40
|
||
|
n_test_views: 120
|
||
|
|
||
|
system_type: "dreamcraft3d-system"
|
||
|
system:
|
||
|
stage: texture
|
||
|
use_mixed_camera_config: ${data.use_mixed_camera_config}
|
||
|
geometry_convert_from: ???
|
||
|
geometry_convert_inherit_texture: true
|
||
|
geometry_type: "tetrahedra-sdf-grid"
|
||
|
geometry:
|
||
|
radius: 2.0 # consistent with coarse
|
||
|
isosurface_resolution: 128
|
||
|
isosurface_deformable_grid: true
|
||
|
isosurface_remove_outliers: true
|
||
|
pos_encoding_config:
|
||
|
otype: HashGrid
|
||
|
n_levels: 16
|
||
|
n_features_per_level: 2
|
||
|
log2_hashmap_size: 19
|
||
|
base_resolution: 16
|
||
|
per_level_scale: 1.447269237440378 # max resolution 4096
|
||
|
fix_geometry: true
|
||
|
|
||
|
material_type: "no-material"
|
||
|
material:
|
||
|
n_output_dims: 3
|
||
|
|
||
|
background_type: "solid-color-background"
|
||
|
|
||
|
renderer_type: "nvdiff-rasterizer"
|
||
|
renderer:
|
||
|
context_type: cuda
|
||
|
|
||
|
prompt_processor_type: "stable-diffusion-prompt-processor"
|
||
|
prompt_processor:
|
||
|
pretrained_model_name_or_path: "stabilityai/stable-diffusion-2-1-base"
|
||
|
prompt: ???
|
||
|
front_threshold: 30.
|
||
|
back_threshold: 30.
|
||
|
|
||
|
guidance_type: "stable-diffusion-bsd-guidance"
|
||
|
guidance:
|
||
|
pretrained_model_name_or_path: "stabilityai/stable-diffusion-2-1-base"
|
||
|
pretrained_model_name_or_path_lora: "stabilityai/stable-diffusion-2-1-base"
|
||
|
# pretrained_model_name_or_path_lora: "stabilityai/stable-diffusion-2-1"
|
||
|
guidance_scale: 2.0
|
||
|
min_step_percent: 0.05
|
||
|
max_step_percent: [0, 0.5, 0.2, 5000]
|
||
|
only_pretrain_step: 1000
|
||
|
|
||
|
# guidance_3d_type: "stable-zero123-guidance"
|
||
|
# guidance_3d:
|
||
|
# pretrained_model_name_or_path: "./load/zero123/stable_zero123.ckpt"
|
||
|
# pretrained_config: "./load/zero123/sd-objaverse-finetune-c_concat-256.yaml"
|
||
|
# cond_image_path: ${data.image_path}
|
||
|
# cond_elevation_deg: ${data.default_elevation_deg}
|
||
|
# cond_azimuth_deg: ${data.default_azimuth_deg}
|
||
|
# cond_camera_distance: ${data.default_camera_distance}
|
||
|
# guidance_scale: 5.0
|
||
|
# min_step_percent: 0.2 # (start_iter, start_val, end_val, end_iter)
|
||
|
# max_step_percent: 0.5
|
||
|
|
||
|
# control_guidance_type: "stable-diffusion-controlnet-reg-guidance"
|
||
|
# control_guidance:
|
||
|
# min_step_percent: 0.1
|
||
|
# max_step_percent: 0.5
|
||
|
# control_prompt_processor_type: "stable-diffusion-prompt-processor"
|
||
|
# control_prompt_processor:
|
||
|
# pretrained_model_name_or_path: "SG161222/Realistic_Vision_V2.0"
|
||
|
# prompt: ${system.prompt_processor.prompt}
|
||
|
# front_threshold: 30.
|
||
|
# back_threshold: 30.
|
||
|
|
||
|
freq:
|
||
|
n_ref: 2
|
||
|
ref_only_steps: 0
|
||
|
ref_or_guidance: "alternate"
|
||
|
no_diff_steps: -1
|
||
|
guidance_eval: 0
|
||
|
|
||
|
loggers:
|
||
|
wandb:
|
||
|
enable: false
|
||
|
project: "threestudio"
|
||
|
|
||
|
loss:
|
||
|
lambda_sd: 0.01
|
||
|
lambda_lora: 0.1
|
||
|
lambda_pretrain: 0.1
|
||
|
lambda_3d_sd: 0.0
|
||
|
lambda_rgb: 1000.
|
||
|
lambda_mask: 100.
|
||
|
lambda_mask_binary: 0.0
|
||
|
lambda_depth: 0.0
|
||
|
lambda_depth_rel: 0.0
|
||
|
lambda_normal: 0.0
|
||
|
lambda_normal_smooth: 0.0
|
||
|
lambda_3d_normal_smooth: 0.0
|
||
|
lambda_z_variance: 0.0
|
||
|
lambda_reg: 0.0
|
||
|
|
||
|
optimizer:
|
||
|
name: AdamW
|
||
|
args:
|
||
|
betas: [0.9, 0.99]
|
||
|
eps: 1.e-4
|
||
|
params:
|
||
|
geometry.encoding:
|
||
|
lr: 0.01
|
||
|
geometry.feature_network:
|
||
|
lr: 0.001
|
||
|
guidance.train_unet:
|
||
|
lr: 0.00001
|
||
|
guidance.train_unet_lora:
|
||
|
lr: 0.00001
|
||
|
|
||
|
trainer:
|
||
|
max_steps: 5000
|
||
|
log_every_n_steps: 1
|
||
|
num_sanity_val_steps: 0
|
||
|
val_check_interval: 200
|
||
|
enable_progress_bar: true
|
||
|
precision: 32
|
||
|
strategy: "ddp_find_unused_parameters_true"
|
||
|
|
||
|
checkpoint:
|
||
|
save_last: true
|
||
|
save_top_k: -1
|
||
|
every_n_train_steps: ${trainer.max_steps}
|