Skip to content

Commit

Permalink
initial commit
Browse files Browse the repository at this point in the history
Co-authored-by: Yoonwoo Jeong <jeongyw12382@postech.ac.kr>
Co-authored-by: Jinwoo Lee <chopper.lee@kakaobrain.com>
Co-authored-by: Chiheon Kim <chiheon.kim@kakaobrain.com>
Co-authored-by: Minsu Cho <mscho@postech.ac.kr>
Co-authored-by: Doyup Lee <doyup.lee@kakaobrain.com>
  • Loading branch information
5 people committed Jan 16, 2024
1 parent 2352f8d commit 5a20d0c
Show file tree
Hide file tree
Showing 211 changed files with 156,575 additions and 0 deletions.
15 changes: 15 additions & 0 deletions .github/workflows/black.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,15 @@
name: Run black
on: [pull_request]

jobs:
lint:
runs-on: ubuntu-latest
steps:
- uses: actions/checkout@v3
- name: Install venv
run: |
sudo apt-get -y install python3.10-venv
- uses: psf/black@stable
with:
options: "--check --verbose -l88"
src: "./sgm ./scripts ./main.py"
27 changes: 27 additions & 0 deletions .github/workflows/test-build.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,27 @@
name: Build package

on:
push:
branches: [ main ]
pull_request:

jobs:
build:
name: Build
runs-on: ubuntu-latest
strategy:
fail-fast: false
matrix:
python-version: ["3.8", "3.10"]
requirements-file: ["pt2", "pt13"]
steps:
- uses: actions/checkout@v2
- name: Set up Python ${{ matrix.python-version }}
uses: actions/setup-python@v2
with:
python-version: ${{ matrix.python-version }}
- name: Install dependencies
run: |
python -m pip install --upgrade pip
pip install -r requirements/${{ matrix.requirements-file }}.txt
pip install .
34 changes: 34 additions & 0 deletions .github/workflows/test-inference.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,34 @@
name: Test inference

on:
pull_request:
push:
branches:
- main

jobs:
test:
name: "Test inference"
# This action is designed only to run on the Stability research cluster at this time, so many assumptions are made about the environment
if: github.repository == 'stability-ai/generative-models'
runs-on: [self-hosted, slurm, g40]
steps:
- uses: actions/checkout@v3
- name: "Symlink checkpoints"
run: ln -s ${{vars.SGM_CHECKPOINTS_PATH}} checkpoints
- name: "Setup python"
uses: actions/setup-python@v4
with:
python-version: "3.10"
- name: "Install Hatch"
run: pip install hatch
- name: "Run inference tests"
run: hatch run ci:test-inference --junit-xml test-results.xml
- name: Surface failing tests
if: always()
uses: pmeier/pytest-results-action@main
with:
path: test-results.xml
summary: true
display-options: fEX
fail-on-empty: true
3 changes: 3 additions & 0 deletions .gitmodules
Original file line number Diff line number Diff line change
@@ -0,0 +1,3 @@
[submodule "thirdparty/carvekit"]
path = thirdparty/carvekit
url = https://github.com/OPHoperHPO/image-background-remove-tool.git
2 changes: 2 additions & 0 deletions .project-root
Original file line number Diff line number Diff line change
@@ -0,0 +1,2 @@
# this file is required for inferring the project root directory
# do not delete
160 changes: 160 additions & 0 deletions 3drec/configs/nvsadapter.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,160 @@
name: "nvsadapter"
tag: "${data.random_camera.height}_${rmspace:${basename:${data.image_path}},_}_prog${data.random_camera.progressive_until}"
exp_root_dir: "./outputs"
seed: 0

data_type: "single-image-datamodule"
data: # threestudio/data/image.py -> SingleImageDataModuleConfig
image_path: ./load/images/hamburger_rgba.png
height: [128, 128, 512]
width: [128, 128, 512]
resolution_milestones: [2000, 5000]
default_elevation_deg: 0.0
default_azimuth_deg: 0.0
default_camera_distance: 1.5
default_fovy_deg: 49.1
requires_depth: ${cmaxgt0orcmaxgt0:${system.loss.lambda_depth},${system.loss.lambda_depth_rel}}
requires_normal: ${cmaxgt0:${system.loss.lambda_normal}}
random_camera: # threestudio/data/uncond.py -> RandomCameraDataModuleConfig
height: [64, 64, 256]
width: [64, 64, 256]
batch_size: [16, 16, 8] # nvs-adapter, must be times of num query
resolution_milestones: ${data.resolution_milestones} # nvs-adapter
eval_height: 512
eval_width: 512
eval_batch_size: 1
elevation_range: [-10, 80]
azimuth_range: [-180, 180]
camera_distance_range: [ 1.5, 1.5 ]
fovy_range: [49.1, 49.1] # objaverse dataset has fixed fovyq
progressive_until: 0
camera_perturb: 0.0
center_perturb: 0.0
up_perturb: 0.0
light_position_perturb: 1.0
light_distance_range: [7.5, 10.0]
eval_elevation_deg: 15
eval_camera_distance: ${data.default_camera_distance}
eval_fovy_deg: ${data.default_fovy_deg}
light_sample_strategy: "dreamfusion"
batch_uniform_azimuth: False
n_val_views: 30
n_test_views: 120

system_type: "nvsadapter-system"
system:
geometry_type: "implicit-volume"
geometry:
radius: 1.0
normal_type: "analytic"

# the density initialization proposed in the DreamFusion paper
# does not work very well
# density_bias: "blob_dreamfusion"
# density_activation: exp
# density_blob_scale: 5.
# density_blob_std: 0.2

# use Magic3D density initialization instead
density_bias: "blob_magic3d"
density_activation: softplus
density_blob_scale: 10.
density_blob_std: 0.5

# coarse to fine hash grid encoding
# to ensure smooth analytic normals
pos_encoding_config:
otype: HashGrid
n_levels: 16
n_features_per_level: 2
log2_hashmap_size: 19
base_resolution: 16
per_level_scale: 1.447269237440378 # max resolution 4096
mlp_network_config:
otype: "VanillaMLP"
activation: "ReLU"
output_activation: "none"
n_neurons: 64
n_hidden_layers: 2

material_type: "diffuse-with-point-light-material"
material:
ambient_only_steps: 100000
textureless_prob: 0.05
albedo_activation: sigmoid

# background_type: "neural-environment-map-background"
# background:
# color_activation: sigmoid

background_type: "solid-color-background" # unused

renderer_type: "nerf-volume-renderer"
renderer:
radius: ${system.geometry.radius}
num_samples_per_ray: 512
return_comp_normal: ${gt0:${system.loss.lambda_normal_smooth}}
return_normal_perturb: ${gt0:${system.loss.lambda_3d_normal_smooth}}

prompt_processor_type: "dummy-prompt-processor" # Zero123 doesn't use prompts
prompt_processor:
pretrained_model_name_or_path: ""
prompt: ""

guidance_type: "nvsadapter-guidance"
guidance:
pretrained_model_name_or_path: "../checkpoints/base_query_4_step_200000.ckpt"
pretrained_config: "../checkpoints/base_query_4.yaml"
cond_image_path: ${data.image_path}
cond_elevation_deg: ${data.default_elevation_deg}
cond_azimuth_deg: ${data.default_azimuth_deg}
cond_camera_distance: ${data.default_camera_distance}
cond_fovy_deg: ${data.default_fovy_deg}
guidance_scale: 3.0
min_step_percent: 0.02
max_step_percent: [0, 0.98, 0.5, 5000] # (start_iter, start_val, end_val, end_iter)
#max_step_percent: 0.98
num_query: 4

freq:
ref_only_steps: 0
guidance_eval: 0

loggers:
wandb:
enable: false
project: "threestudio"
name: None

loss:
lambda_sds: 0.1
lambda_rgb: 500.
lambda_mask: 50.
lambda_depth: 0. # 0.05
lambda_depth_rel: 0. # [0, 0, 0.05, 100]
lambda_normal: 0. # [0, 0, 0.05, 100]
lambda_normal_smooth: 8.0
lambda_3d_normal_smooth: 8.0
lambda_orient: 1.0
lambda_sparsity: 1.0 # should be tweaked for every model
lambda_opaque: 0.1

optimizer:
name: AdamW
args:
lr: 0.01
betas: [0.9, 0.99]
eps: 1.e-8

trainer:
max_steps: 8000
log_every_n_steps: 1
num_sanity_val_steps: 0
val_check_interval: 200
enable_progress_bar: true
precision: 16-mixed

checkpoint:
save_last: true # save at each validation time
save_top_k: -1
every_n_train_steps: 200 # ${trainer.max_steps}
Loading

0 comments on commit 5a20d0c

Please sign in to comment.