ghunkins committed on
Commit
7f6b706
1 Parent(s): ae09a3d

Upload HunyuanVideoPipeline

Browse files
model_index.json CHANGED
@@ -1,9 +1,10 @@
1
  {
2
  "_class_name": "HunyuanVideoPipeline",
3
  "_diffusers_version": "0.31.0",
 
4
  "scheduler": [
5
- "hyvideo",
6
- "FlowMatchDiscreteScheduler"
7
  ],
8
  "text_encoder": [
9
  "transformers",
@@ -22,11 +23,11 @@
22
  "CLIPTokenizer"
23
  ],
24
  "transformer": [
25
- "hyvideo",
26
  "HYVideoDiffusionTransformer"
27
  ],
28
  "vae": [
29
- "hyvideo",
30
  "AutoencoderKLCausal3D"
31
  ]
32
  }
 
1
  {
2
  "_class_name": "HunyuanVideoPipeline",
3
  "_diffusers_version": "0.31.0",
4
+ "_name_or_path": "magespace/hyvideo-diffusers",
5
  "scheduler": [
6
+ "diffusers",
7
+ "FlowMatchEulerDiscreteScheduler"
8
  ],
9
  "text_encoder": [
10
  "transformers",
 
23
  "CLIPTokenizer"
24
  ],
25
  "transformer": [
26
+ "hyvideo.modules.models",
27
  "HYVideoDiffusionTransformer"
28
  ],
29
  "vae": [
30
+ "hyvideo.vae.autoencoder_kl_causal_3d",
31
  "AutoencoderKLCausal3D"
32
  ]
33
  }
scheduler/scheduler_config.json CHANGED
@@ -1,9 +1,11 @@
1
  {
2
- "_class_name": "FlowMatchDiscreteScheduler",
3
  "_diffusers_version": "0.31.0",
4
- "n_tokens": null,
 
 
 
5
  "num_train_timesteps": 1000,
6
- "reverse": false,
7
  "shift": 7.0,
8
- "solver": "euler"
9
  }
 
1
  {
2
+ "_class_name": "FlowMatchEulerDiscreteScheduler",
3
  "_diffusers_version": "0.31.0",
4
+ "base_image_seq_len": 256,
5
+ "base_shift": 0.5,
6
+ "max_image_seq_len": 4096,
7
+ "max_shift": 1.15,
8
  "num_train_timesteps": 1000,
 
9
  "shift": 7.0,
10
+ "use_dynamic_shifting": false
11
  }
text_encoder/config.json CHANGED
@@ -1,4 +1,5 @@
1
  {
 
2
  "architectures": [
3
  "LlamaForCausalLM"
4
  ],
@@ -23,7 +24,7 @@
23
  "rope_theta": 500000.0,
24
  "tie_word_embeddings": false,
25
  "torch_dtype": "bfloat16",
26
- "transformers_version": "4.46.3",
27
  "use_cache": true,
28
  "vocab_size": 128320
29
  }
 
1
  {
2
+ "_name_or_path": "/root/.cache/huggingface/hub/models--magespace--hyvideo-diffusers/snapshots/ae09a3d1e5306c922f86a6aaf8db5b691947d204/text_encoder",
3
  "architectures": [
4
  "LlamaForCausalLM"
5
  ],
 
24
  "rope_theta": 500000.0,
25
  "tie_word_embeddings": false,
26
  "torch_dtype": "bfloat16",
27
+ "transformers_version": "4.47.0",
28
  "use_cache": true,
29
  "vocab_size": 128320
30
  }
text_encoder/generation_config.json CHANGED
@@ -2,5 +2,5 @@
2
  "_from_model_config": true,
3
  "bos_token_id": 128000,
4
  "eos_token_id": 128001,
5
- "transformers_version": "4.46.3"
6
  }
 
2
  "_from_model_config": true,
3
  "bos_token_id": 128000,
4
  "eos_token_id": 128001,
5
+ "transformers_version": "4.47.0"
6
  }
text_encoder_2/config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "openai/clip-vit-large-patch14",
3
  "architectures": [
4
  "CLIPTextModel"
5
  ],
@@ -20,6 +20,6 @@
20
  "pad_token_id": 1,
21
  "projection_dim": 768,
22
  "torch_dtype": "bfloat16",
23
- "transformers_version": "4.46.3",
24
  "vocab_size": 49408
25
  }
 
1
  {
2
+ "_name_or_path": "/root/.cache/huggingface/hub/models--magespace--hyvideo-diffusers/snapshots/ae09a3d1e5306c922f86a6aaf8db5b691947d204/text_encoder_2",
3
  "architectures": [
4
  "CLIPTextModel"
5
  ],
 
20
  "pad_token_id": 1,
21
  "projection_dim": 768,
22
  "torch_dtype": "bfloat16",
23
+ "transformers_version": "4.47.0",
24
  "vocab_size": 49408
25
  }
tokenizer/tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d2c593db4aa75b17a42c1f74d7cc38e257eaeed222e6a52674c65544165dcbaa
3
- size 17210098
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d1cb63338521d084aba234e273e56a3a0bb0e41f6438e205a2cbc1db8f02fd1f
3
+ size 17210368
tokenizer/tokenizer_config.json CHANGED
@@ -2080,6 +2080,7 @@
2080
  "chat_template": "{% set loop_messages = messages %}{% for message in loop_messages %}{% set content = '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n'+ message['content'] | trim + '<|eot_id|>' %}{% if loop.index0 == 0 %}{% set content = bos_token + content %}{% endif %}{{ content }}{% endfor %}{{ '<|start_header_id|>assistant<|end_header_id|>\n\n' }}",
2081
  "clean_up_tokenization_spaces": true,
2082
  "eos_token": "<|end_of_text|>",
 
2083
  "legacy": true,
2084
  "model_input_names": [
2085
  "input_ids",
 
2080
  "chat_template": "{% set loop_messages = messages %}{% for message in loop_messages %}{% set content = '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n'+ message['content'] | trim + '<|eot_id|>' %}{% if loop.index0 == 0 %}{% set content = bos_token + content %}{% endif %}{{ content }}{% endfor %}{{ '<|start_header_id|>assistant<|end_header_id|>\n\n' }}",
2081
  "clean_up_tokenization_spaces": true,
2082
  "eos_token": "<|end_of_text|>",
2083
+ "extra_special_tokens": {},
2084
  "legacy": true,
2085
  "model_input_names": [
2086
  "input_ids",
tokenizer_2/tokenizer_config.json CHANGED
@@ -23,6 +23,7 @@
23
  "do_lower_case": true,
24
  "eos_token": "<|endoftext|>",
25
  "errors": "replace",
 
26
  "max_length": 77,
27
  "model_max_length": 77,
28
  "pad_token": "<|endoftext|>",
 
23
  "do_lower_case": true,
24
  "eos_token": "<|endoftext|>",
25
  "errors": "replace",
26
+ "extra_special_tokens": {},
27
  "max_length": 77,
28
  "model_max_length": 77,
29
  "pad_token": "<|endoftext|>",
transformer/config.json CHANGED
@@ -1,6 +1,7 @@
1
  {
2
  "_class_name": "HYVideoDiffusionTransformer",
3
  "_diffusers_version": "0.31.0",
 
4
  "guidance_embed": true,
5
  "heads_num": 24,
6
  "hidden_size": 3072,
 
1
  {
2
  "_class_name": "HYVideoDiffusionTransformer",
3
  "_diffusers_version": "0.31.0",
4
+ "_name_or_path": "/root/.cache/huggingface/hub/models--magespace--hyvideo-diffusers/snapshots/ae09a3d1e5306c922f86a6aaf8db5b691947d204/transformer",
5
  "guidance_embed": true,
6
  "heads_num": 24,
7
  "hidden_size": 3072,
vae/config.json CHANGED
@@ -1,6 +1,7 @@
1
  {
2
  "_class_name": "AutoencoderKLCausal3D",
3
  "_diffusers_version": "0.31.0",
 
4
  "act_fn": "silu",
5
  "block_out_channels": [
6
  128,
 
1
  {
2
  "_class_name": "AutoencoderKLCausal3D",
3
  "_diffusers_version": "0.31.0",
4
+ "_name_or_path": "/root/.cache/huggingface/hub/models--magespace--hyvideo-diffusers/snapshots/ae09a3d1e5306c922f86a6aaf8db5b691947d204/vae",
5
  "act_fn": "silu",
6
  "block_out_channels": [
7
  128,