Aluren committed on
Commit
e6ab9cd
·
verified ·
1 Parent(s): de26657

Upload 10 files

Browse files
feature_extractor_1/preprocessor_config.json ADDED
@@ -0,0 +1,44 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_valid_processor_keys": [
3
+ "images",
4
+ "do_resize",
5
+ "size",
6
+ "resample",
7
+ "do_center_crop",
8
+ "crop_size",
9
+ "do_rescale",
10
+ "rescale_factor",
11
+ "do_normalize",
12
+ "image_mean",
13
+ "image_std",
14
+ "do_convert_rgb",
15
+ "return_tensors",
16
+ "data_format",
17
+ "input_data_format"
18
+ ],
19
+ "crop_size": {
20
+ "height": 224,
21
+ "width": 224
22
+ },
23
+ "do_center_crop": true,
24
+ "do_convert_rgb": true,
25
+ "do_normalize": true,
26
+ "do_rescale": true,
27
+ "do_resize": true,
28
+ "image_mean": [
29
+ 0.485,
30
+ 0.456,
31
+ 0.406
32
+ ],
33
+ "image_processor_type": "BitImageProcessor",
34
+ "image_std": [
35
+ 0.229,
36
+ 0.224,
37
+ 0.225
38
+ ],
39
+ "resample": 3,
40
+ "rescale_factor": 0.00392156862745098,
41
+ "size": {
42
+ "shortest_edge": 256
43
+ }
44
+ }
image_encoder_1/config.json ADDED
@@ -0,0 +1,60 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "/mnt/pfs/users/dengken/hugging_face/models--facebook--dinov2-large/snapshots/47b73eefe95e8d44ec3623f8890bd894b6ea2d6c",
3
+ "apply_layernorm": true,
4
+ "architectures": [
5
+ "Dinov2Model"
6
+ ],
7
+ "attention_probs_dropout_prob": 0.0,
8
+ "drop_path_rate": 0.0,
9
+ "hidden_act": "gelu",
10
+ "hidden_dropout_prob": 0.0,
11
+ "hidden_size": 1024,
12
+ "image_size": 518,
13
+ "initializer_range": 0.02,
14
+ "layer_norm_eps": 1e-06,
15
+ "layerscale_value": 1.0,
16
+ "mlp_ratio": 4,
17
+ "model_type": "dinov2",
18
+ "num_attention_heads": 16,
19
+ "num_channels": 3,
20
+ "num_hidden_layers": 24,
21
+ "out_features": [
22
+ "stage24"
23
+ ],
24
+ "out_indices": [
25
+ 24
26
+ ],
27
+ "patch_size": 14,
28
+ "qkv_bias": true,
29
+ "reshape_hidden_states": true,
30
+ "stage_names": [
31
+ "stem",
32
+ "stage1",
33
+ "stage2",
34
+ "stage3",
35
+ "stage4",
36
+ "stage5",
37
+ "stage6",
38
+ "stage7",
39
+ "stage8",
40
+ "stage9",
41
+ "stage10",
42
+ "stage11",
43
+ "stage12",
44
+ "stage13",
45
+ "stage14",
46
+ "stage15",
47
+ "stage16",
48
+ "stage17",
49
+ "stage18",
50
+ "stage19",
51
+ "stage20",
52
+ "stage21",
53
+ "stage22",
54
+ "stage23",
55
+ "stage24"
56
+ ],
57
+ "torch_dtype": "float32",
58
+ "transformers_version": "4.41.0",
59
+ "use_swiglu_ffn": false
60
+ }
image_encoder_1/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:399fba97a95f22c36834418bc69373364a99af3a1153da1c0fb31db567c92e23
3
+ size 1217522888
model_index.json ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "DetailGen3DPipeline",
3
+ "_diffusers_version": "0.32.0.dev0",
4
+ "feature_extractor_1": [
5
+ "transformers",
6
+ "BitImageProcessor"
7
+ ],
8
+ "image_encoder_1": [
9
+ "transformers",
10
+ "Dinov2Model"
11
+ ],
12
+ "noise_scheduler": [
13
+ "diffusers",
14
+ "DDPMScheduler"
15
+ ],
16
+ "scheduler": [
17
+ "detailgen3d.schedulers.scheduling_rectified_flow",
18
+ "RectifiedFlowScheduler"
19
+ ],
20
+ "transformer": [
21
+ "detailgen3d.models.transformers.detailgen3d_transformers",
22
+ "DetailGen3DDiTModel"
23
+ ],
24
+ "vae": [
25
+ "detailgen3d.models.autoencoders.autoencoder_kl_triposg",
26
+ "TripoSGVAEModel"
27
+ ]
28
+ }
noise_scheduler/scheduler_config.json ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "DDPMScheduler",
3
+ "_diffusers_version": "0.32.0.dev0",
4
+ "beta_end": 0.012,
5
+ "beta_schedule": "scaled_linear",
6
+ "beta_start": 0.00085,
7
+ "clip_sample": false,
8
+ "clip_sample_range": 1.0,
9
+ "dynamic_thresholding_ratio": 0.995,
10
+ "num_train_timesteps": 1000,
11
+ "prediction_type": "epsilon",
12
+ "rescale_betas_zero_snr": false,
13
+ "sample_max_value": 1.0,
14
+ "steps_offset": 1,
15
+ "thresholding": false,
16
+ "timestep_spacing": "leading",
17
+ "trained_betas": null,
18
+ "variance_type": "fixed_small"
19
+ }
scheduler/scheduler_config.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "RectifiedFlowScheduler",
3
+ "_diffusers_version": "0.32.0.dev0",
4
+ "num_train_timesteps": 1000,
5
+ "shift": 1.0,
6
+ "use_dynamic_shifting": false
7
+ }
transformer/config.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "DetailGen3DDiTModel",
3
+ "_diffusers_version": "0.32.0.dev0",
4
+ "cross_attention_dim": 1024,
5
+ "in_channels": 64,
6
+ "num_attention_heads": 12,
7
+ "num_layers": 24,
8
+ "width": 768
9
+ }
transformer/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bcc7abf6b049b91d8e4a93e8914a1df819b3f8edc352cdce67054e251f3a2c5f
3
+ size 1474293920
vae/config.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "Tripo2VAEModel",
3
+ "_diffusers_version": "0.32.0.dev0",
4
+ "embed_frequency": 8,
5
+ "embed_include_pi": false,
6
+ "embedding_type": "frequency",
7
+ "in_channels": 3,
8
+ "latent_channels": 64,
9
+ "num_attention_heads": 8,
10
+ "num_layers_decoder": 16,
11
+ "num_layers_encoder": 8,
12
+ "width_decoder": 1024,
13
+ "width_encoder": 512
14
+ }
vae/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:488d39edc7a7d3cd4d94baea243c4ed583ed830b3b5f0ae781ad6a00aa8d7369
3
+ size 970685468