kkail8 committed on
Commit
0894495
·
verified ·
1 Parent(s): c950fd3

Upload folder using huggingface_hub

Browse files
config.json ADDED
@@ -0,0 +1,59 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "VASTDiT3"
4
+ ],
5
+ "audio_hidden_size": 1152,
6
+ "audio_in_channels": 8,
7
+ "audio_input_size": [
8
+ null,
9
+ null
10
+ ],
11
+ "audio_patch_size": [
12
+ 4,
13
+ 1
14
+ ],
15
+ "caption_channels": 4096,
16
+ "class_dropout_prob": 0.1,
17
+ "depth": 28,
18
+ "drop_path": 0.0,
19
+ "enable_flash_attn": true,
20
+ "enable_layernorm_kernel": false,
21
+ "enable_sequence_parallelism": false,
22
+ "freeze_audio_branch": true,
23
+ "freeze_video_branch": true,
24
+ "freeze_y_embedder": true,
25
+ "hidden_size": 1152,
26
+ "in_channels": 4,
27
+ "input_size": [
28
+ null,
29
+ null,
30
+ null
31
+ ],
32
+ "input_sq_size": 512,
33
+ "mlp_ratio": 4.0,
34
+ "model_max_length": 300,
35
+ "model_type": "VASTDiT3",
36
+ "num_heads": 16,
37
+ "only_infer_audio": false,
38
+ "only_train_audio": false,
39
+ "only_train_temporal": false,
40
+ "patch_size": [
41
+ 1,
42
+ 2,
43
+ 2
44
+ ],
45
+ "pred_sigma": true,
46
+ "qk_norm": true,
47
+ "skip_y_embedder": false,
48
+ "spatial_prior_len": 32,
49
+ "st_prior_channel": 128,
50
+ "temporal_prior_len": 32,
51
+ "torch_dtype": "bfloat16",
52
+ "train_st_prior_attn": true,
53
+ "train_va_cross_attn": true,
54
+ "transformers_version": "4.39.3",
55
+ "weight_init_from": [
56
+ "./checkpoints/JavisDiT-audio-v0",
57
+ "./checkpoints/OpenSora-STDiT-v3/model.safetensors"
58
+ ]
59
+ }
pytorch_model-00001.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b7d7f3e974f97aa3f0baada67acf3dea7e0f07170b25c3a5bd711fbcc97957c
3
+ size 1070739616
pytorch_model-00002.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44aa3a44fea82c261141ce239bf5eb543df43d49f60786894c35ed1c4f062877
3
+ size 1070893412
pytorch_model-00003.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:687337c9c2e91acc40cfb05ac5e320f1319227ad73fd6485bb59b36f7feb9237
3
+ size 1072626064
pytorch_model-00004.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2992414f3a9f0350c7dd16da8147fe0135f24b3f632ef27a509c38862c04f149
3
+ size 1073558938
pytorch_model-00005.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f3adf60c440ffad9c09c8b04df0fbb3e35ddce5f448520e311d9f02b0ef9001
3
+ size 1073642040
pytorch_model-00006.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff17a37ad45e5c7f3b8d1f4e2875e68b3804515e6e45c01e3745ebd0796ae58a
3
+ size 1073723768
pytorch_model-00007.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6fe6d177f16105770036ab4c2011cb99af48691ba27cc450d925ddd44a2c158f
3
+ size 1010299692
pytorch_model.bin.index.json ADDED
The diff for this file is too large to render. See raw diff