mirror of
https://hf-mirror.com/wushuang98/Direct3D-S2
synced 2026-04-02 18:12:54 +08:00
Upload 5 files
This commit is contained in:
161
direct3d-s2-v-1-0/config.yaml
Normal file
161
direct3d-s2-v-1-0/config.yaml
Normal file
@ -0,0 +1,161 @@
|
|||||||
|
dense_vae:
|
||||||
|
target: direct3d_s2.models.autoencoders.dense_vae.DenseShapeVAE
|
||||||
|
params:
|
||||||
|
use_checkpoint: true
|
||||||
|
embed_dim: 8
|
||||||
|
in_channels: 1
|
||||||
|
out_channels: 1
|
||||||
|
model_channels_encoder: [32, 128, 512]
|
||||||
|
num_res_blocks_encoder: 2
|
||||||
|
num_res_blocks_middle_encoder: 2
|
||||||
|
model_channels_decoder: [512, 128, 64]
|
||||||
|
num_res_blocks_decoder: 4
|
||||||
|
num_res_blocks_middle_decoder: 4
|
||||||
|
use_fp16: true
|
||||||
|
latents_scale: 1.0
|
||||||
|
latents_shift: 0.0
|
||||||
|
|
||||||
|
dense_dit:
|
||||||
|
target: direct3d_s2.models.transformers.dense_dit.DenseDiT
|
||||||
|
params:
|
||||||
|
resolution: 16
|
||||||
|
in_channels: 8
|
||||||
|
out_channels: 8
|
||||||
|
model_channels: 1024
|
||||||
|
cond_channels: 1024
|
||||||
|
num_blocks: 24
|
||||||
|
num_heads: 16
|
||||||
|
mlp_ratio: 4
|
||||||
|
patch_size: 1
|
||||||
|
pe_mode: ape
|
||||||
|
qk_rms_norm: true
|
||||||
|
use_checkpoint: true
|
||||||
|
use_fp16: true
|
||||||
|
latent_shape: [8, 16, 16, 16]
|
||||||
|
|
||||||
|
dense_image_encoder:
|
||||||
|
target: direct3d_s2.models.conditioner.DinoEncoder
|
||||||
|
params:
|
||||||
|
model: facebookresearch/dinov2
|
||||||
|
version: dinov2_vitl14_reg
|
||||||
|
size: 518
|
||||||
|
|
||||||
|
dense_scheduler:
|
||||||
|
target: diffusers.schedulers.FlowMatchEulerDiscreteScheduler
|
||||||
|
params:
|
||||||
|
num_train_timesteps: 1000
|
||||||
|
shift: 6.0
|
||||||
|
|
||||||
|
sparse_vae_512:
|
||||||
|
target: direct3d_s2.models.autoencoders.ss_vae.SparseSDFVAE
|
||||||
|
params:
|
||||||
|
use_checkpoint: true
|
||||||
|
embed_dim: 16
|
||||||
|
num_head_channels_encoder: 64
|
||||||
|
model_channels_encoder: 512
|
||||||
|
num_heads_encoder: 8
|
||||||
|
num_blocks_encoder: 4
|
||||||
|
num_head_channels_decoder: 64
|
||||||
|
model_channels_decoder: 512
|
||||||
|
num_heads_decoder: 8
|
||||||
|
num_blocks_decoder: 4
|
||||||
|
resolution: 64
|
||||||
|
out_channels: 1
|
||||||
|
use_fp16: true
|
||||||
|
latents_scale: 1.0
|
||||||
|
latents_shift: 0.0
|
||||||
|
|
||||||
|
sparse_dit_512:
|
||||||
|
target: direct3d_s2.models.transformers.sparse_dit.SparseDiT
|
||||||
|
params:
|
||||||
|
resolution: 64
|
||||||
|
in_channels: 16
|
||||||
|
out_channels: 16
|
||||||
|
model_channels: 1024
|
||||||
|
cond_channels: 1024
|
||||||
|
num_blocks: 24
|
||||||
|
num_heads: 32
|
||||||
|
num_kv_heads: 2
|
||||||
|
compression_block_size: 4
|
||||||
|
selection_block_size: 8
|
||||||
|
topk: 32
|
||||||
|
compression_version: v2
|
||||||
|
pe_mode: ape
|
||||||
|
factor: 1.0
|
||||||
|
sparse_conditions: true
|
||||||
|
qk_rms_norm: true
|
||||||
|
use_shift: true
|
||||||
|
use_checkpoint: true
|
||||||
|
use_fp16: true
|
||||||
|
|
||||||
|
sparse_scheduler_512:
|
||||||
|
target: diffusers.schedulers.FlowMatchEulerDiscreteScheduler
|
||||||
|
params:
|
||||||
|
num_train_timesteps: 1000
|
||||||
|
shift: 6.0
|
||||||
|
|
||||||
|
sparse_vae_1024:
|
||||||
|
target: direct3d_s2.models.autoencoders.ss_vae.SparseSDFVAE
|
||||||
|
params:
|
||||||
|
use_checkpoint: true
|
||||||
|
embed_dim: 16
|
||||||
|
num_head_channels_encoder: 64
|
||||||
|
model_channels_encoder: 512
|
||||||
|
num_heads_encoder: 8
|
||||||
|
num_blocks_encoder: 4
|
||||||
|
num_head_channels_decoder: 64
|
||||||
|
model_channels_decoder: 512
|
||||||
|
num_heads_decoder: 8
|
||||||
|
num_blocks_decoder: 4
|
||||||
|
resolution: 128
|
||||||
|
out_channels: 1
|
||||||
|
use_fp16: true
|
||||||
|
latents_scale: 1.0
|
||||||
|
latents_shift: 0.0
|
||||||
|
chunk_size: 4
|
||||||
|
|
||||||
|
sparse_dit_1024:
|
||||||
|
target: direct3d_s2.models.transformers.sparse_dit.SparseDiT
|
||||||
|
params:
|
||||||
|
resolution: 128
|
||||||
|
in_channels: 16
|
||||||
|
out_channels: 16
|
||||||
|
model_channels: 1024
|
||||||
|
cond_channels: 1024
|
||||||
|
num_blocks: 24
|
||||||
|
num_heads: 32
|
||||||
|
num_kv_heads: 2
|
||||||
|
compression_block_size: 4
|
||||||
|
selection_block_size: 8
|
||||||
|
topk: 8
|
||||||
|
compression_version: v2
|
||||||
|
pe_mode: ape
|
||||||
|
factor: 0.5
|
||||||
|
sparse_conditions: true
|
||||||
|
qk_rms_norm: true
|
||||||
|
use_shift: true
|
||||||
|
use_checkpoint: true
|
||||||
|
use_fp16: true
|
||||||
|
|
||||||
|
sparse_scheduler_1024:
|
||||||
|
target: diffusers.schedulers.FlowMatchEulerDiscreteScheduler
|
||||||
|
params:
|
||||||
|
num_train_timesteps: 1000
|
||||||
|
shift: 8.0
|
||||||
|
|
||||||
|
sparse_image_encoder:
|
||||||
|
target: direct3d_s2.models.conditioner.DinoEncoder
|
||||||
|
params:
|
||||||
|
model: facebookresearch/dinov2
|
||||||
|
version: dinov2_vitl14_reg
|
||||||
|
size: 518
|
||||||
|
|
||||||
|
refiner:
|
||||||
|
target: direct3d_s2.models.refiner.unet_refiner.Voxel_RefinerXL
|
||||||
|
params:
|
||||||
|
in_channels: 1
|
||||||
|
out_channels: 1
|
||||||
|
layers_per_block: 2
|
||||||
|
layers_mid_block: 2
|
||||||
|
patch_size: 192
|
||||||
|
use_fp16: true
|
||||||
BIN
direct3d-s2-v-1-0/model_dense.ckpt
(Stored with Git LFS)
Normal file
BIN
direct3d-s2-v-1-0/model_dense.ckpt
(Stored with Git LFS)
Normal file
Binary file not shown.
BIN
direct3d-s2-v-1-0/model_refiner.ckpt
(Stored with Git LFS)
Normal file
BIN
direct3d-s2-v-1-0/model_refiner.ckpt
(Stored with Git LFS)
Normal file
Binary file not shown.
BIN
direct3d-s2-v-1-0/model_sparse_1024.ckpt
(Stored with Git LFS)
Normal file
BIN
direct3d-s2-v-1-0/model_sparse_1024.ckpt
(Stored with Git LFS)
Normal file
Binary file not shown.
BIN
direct3d-s2-v-1-0/model_sparse_512.ckpt
(Stored with Git LFS)
Normal file
BIN
direct3d-s2-v-1-0/model_sparse_512.ckpt
(Stored with Git LFS)
Normal file
Binary file not shown.
Reference in New Issue
Block a user