JeffreyXiang committed on
Commit
f8e8cf0
·
verified ·
1 Parent(s): 6b928b8

Upload 6 files

Browse files
README.md CHANGED
@@ -1,3 +1,16 @@
1
- ---
2
- license: mit
3
- ---
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: trellis
3
+ pipeline_tag: text-to-3d
4
+ license: mit
5
+ language:
6
+ - en
7
+ ---
8
+ # TRELLIS Text Base
9
+
10
+ <!-- Provide a quick summary of what the model is/does. -->
11
+
12
+ The text-conditioned version of TRELLIS with model size B, a large 3D generative model. It was introduced in the paper [Structured 3D Latents for Scalable and Versatile 3D Generation](https://huggingface.co/papers/2412.01506).
13
+
14
+ Project page: https://trellis3d.github.io/
15
+
16
+ Code: https://github.com/Microsoft/TRELLIS
ckpts/slat_flow_txt_dit_B_64l8p2_fp16.json ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "name": "SLatFlowModel",
3
+ "args": {
4
+ "resolution": 64,
5
+ "in_channels": 8,
6
+ "out_channels": 8,
7
+ "model_channels": 768,
8
+ "cond_channels": 768,
9
+ "num_blocks": 12,
10
+ "num_heads": 12,
11
+ "mlp_ratio": 4,
12
+ "patch_size": 2,
13
+ "num_io_res_blocks": 2,
14
+ "io_block_channels": [128],
15
+ "pe_mode": "ape",
16
+ "qk_rms_norm": true,
17
+ "use_fp16": true
18
+ }
19
+ }
ckpts/slat_flow_txt_dit_B_64l8p2_fp16.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:36312c77a150947041638c0a1eb382be73d5381e086ea0bfa2ba9525af4408ad
3
+ size 372419896
ckpts/ss_flow_txt_dit_B_16l8_fp16.json ADDED
@@ -0,0 +1,17 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "name": "SparseStructureFlowModel",
3
+ "args": {
4
+ "resolution": 16,
5
+ "in_channels": 8,
6
+ "out_channels": 8,
7
+ "model_channels": 768,
8
+ "cond_channels": 768,
9
+ "num_blocks": 12,
10
+ "num_heads": 12,
11
+ "mlp_ratio": 4,
12
+ "patch_size": 1,
13
+ "pe_mode": "ape",
14
+ "qk_rms_norm": true,
15
+ "use_fp16": true
16
+ }
17
+ }
ckpts/ss_flow_txt_dit_B_16l8_fp16.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9fa7a2c5deae18307ebfcb29c955b11130e4eb1a88de05c384104c493dee3ff
3
+ size 327736456
pipeline.json ADDED
@@ -0,0 +1,60 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "name": "TrellisTextTo3DPipeline",
3
+ "args": {
4
+ "models": {
5
+ "sparse_structure_decoder": "JeffreyXiang/TRELLIS-image-large/ckpts/ss_dec_conv3d_16l8_fp16",
6
+ "sparse_structure_flow_model": "ckpts/ss_flow_txt_dit_B_16l8_fp16",
7
+ "slat_decoder_gs": "JeffreyXiang/TRELLIS-image-large/ckpts/slat_dec_gs_swin8_B_64l8gs32_fp16",
8
+ "slat_decoder_rf": "JeffreyXiang/TRELLIS-image-large/ckpts/slat_dec_rf_swin8_B_64l8r16_fp16",
9
+ "slat_decoder_mesh": "JeffreyXiang/TRELLIS-image-large/ckpts/slat_dec_mesh_swin8_B_64l8m256c_fp16",
10
+ "slat_flow_model": "ckpts/slat_flow_txt_dit_B_64l8p2_fp16"
11
+ },
12
+ "sparse_structure_sampler": {
13
+ "name": "FlowEulerGuidanceIntervalSampler",
14
+ "args": {
15
+ "sigma_min": 1e-5
16
+ },
17
+ "params": {
18
+ "steps": 25,
19
+ "cfg_strength": 7.5,
20
+ "cfg_interval": [0.5, 0.95],
21
+ "rescale_t": 3.0
22
+ }
23
+ },
24
+ "slat_sampler": {
25
+ "name": "FlowEulerGuidanceIntervalSampler",
26
+ "args": {
27
+ "sigma_min": 1e-5
28
+ },
29
+ "params": {
30
+ "steps": 25,
31
+ "cfg_strength": 7.5,
32
+ "cfg_interval": [0.5, 0.95],
33
+ "rescale_t": 3.0
34
+ }
35
+ },
36
+ "slat_normalization": {
37
+ "mean": [
38
+ -2.1687545776367188,
39
+ -0.004347046371549368,
40
+ -0.13352349400520325,
41
+ -0.08418072760105133,
42
+ -0.5271206498146057,
43
+ 0.7238689064979553,
44
+ -1.1414450407028198,
45
+ 1.2039363384246826
46
+ ],
47
+ "std": [
48
+ 2.377650737762451,
49
+ 2.386378288269043,
50
+ 2.124418020248413,
51
+ 2.1748552322387695,
52
+ 2.663944721221924,
53
+ 2.371192216873169,
54
+ 2.6217446327209473,
55
+ 2.684523105621338
56
+ ]
57
+ },
58
+ "text_cond_model": "openai/clip-vit-large-patch14"
59
+ }
60
+ }