Skip to content

Commit

Permalink
Effstabledreamfusion (#504)
Browse files Browse the repository at this point in the history
* Modified camera data module

* modified masking logic and shape adjust in SD input

* (Working)new sampling maskand SD loss edits

* Changing the subsampling a bit, not better results

* new exp with upsampling before SDS

* refactoring

---------

Co-authored-by: jadevaibhav <25821637+jadevaibhav@users.noreply.github.com>
  • Loading branch information
DSaurus and jadevaibhav authored Oct 2, 2024
1 parent a80b37a commit c16d083
Show file tree
Hide file tree
Showing 7 changed files with 706 additions and 1 deletion.
2 changes: 2 additions & 0 deletions .gitignore
Original file line number Diff line number Diff line change
Expand Up @@ -55,6 +55,8 @@ coverage.xml
.pytest_cache/
cover/

# Slurm logs
slurm*
# Translations
*.mo
*.pot
Expand Down
115 changes: 115 additions & 0 deletions configs/dreamfusion-sd-eff.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,115 @@
name: "dreamfusion-sd"
tag: "${rmspace:${system.prompt_processor.prompt},_}"
exp_root_dir: "outputs"
seed: 0

data_type: "eff-random-camera-datamodule"
data:
batch_size: 1
width: 128
height: 128
sample_width: 64
sample_height: 64
camera_distance_range: [1.5, 2.0]
fovy_range: [40, 70]
elevation_range: [-10, 45]
light_sample_strategy: "dreamfusion"
eval_camera_distance: 2.0
eval_fovy_deg: 70.

system_type: "efficient-dreamfusion-system"
system:
geometry_type: "implicit-volume"
geometry:
radius: 2.0
normal_type: "analytic"

# the density initialization proposed in the DreamFusion paper
# does not work very well
# density_bias: "blob_dreamfusion"
# density_activation: exp
# density_blob_scale: 5.
# density_blob_std: 0.2

# use Magic3D density initialization instead
density_bias: "blob_magic3d"
density_activation: softplus
density_blob_scale: 10.
density_blob_std: 0.5

# coarse to fine hash grid encoding
# to ensure smooth analytic normals
pos_encoding_config:
otype: ProgressiveBandHashGrid
n_levels: 16
n_features_per_level: 2
log2_hashmap_size: 19
base_resolution: 16
per_level_scale: 1.447269237440378 # max resolution 4096
start_level: 8 # resolution ~200
start_step: 2000
update_steps: 500

material_type: "diffuse-with-point-light-material"
material:
ambient_only_steps: 2001
albedo_activation: sigmoid

background_type: "neural-environment-map-background"
background:
color_activation: sigmoid

renderer_type: "nerf-volume-renderer"
renderer:
radius: ${system.geometry.radius}
num_samples_per_ray: 512

prompt_processor_type: "stable-diffusion-prompt-processor"
prompt_processor:
pretrained_model_name_or_path: "stabilityai/stable-diffusion-2-1-base"
prompt: ???

guidance_type: "stable-diffusion-guidance"
guidance:
pretrained_model_name_or_path: "stabilityai/stable-diffusion-2-1-base"
guidance_scale: 100.
weighting_strategy: sds
min_step_percent: 0.02
max_step_percent: 0.98

loggers:
wandb:
enable: false
project: "threestudio"
name: None

loss:
lambda_sds: 1.
lambda_orient: [0, 10., 1000., 5000]
lambda_sparsity: 1.
lambda_opaque: 0.

optimizer:
name: Adam
args:
lr: 0.01
betas: [0.9, 0.99]
eps: 1.e-15
params:
geometry:
lr: 0.01
background:
lr: 0.001

trainer:
max_steps: 10000
log_every_n_steps: 1
num_sanity_val_steps: 0
val_check_interval: 200
enable_progress_bar: true
precision: 16-mixed

checkpoint:
save_last: true # save at each validation time
save_top_k: -1
every_n_train_steps: ${trainer.max_steps}
2 changes: 1 addition & 1 deletion threestudio/data/__init__.py
Original file line number Diff line number Diff line change
@@ -1 +1 @@
from . import co3d, image, multiview, uncond
from . import co3d, image, multiview, uncond, uncond_eff
Loading

0 comments on commit c16d083

Please sign in to comment.