{
"ae": {
"model_id": "hunyuanvideo_15_vae",
"from_pretrained": "HunyuanVideo1.5/vae/diffusion_pytorch_model.safetensors",
"dtype": "float16",
"block_out_channels": [
128,
256,
512,
1024,
1024
],
"downsample_match_channel": true,
"ffactor_spatial": 16,
"ffactor_temporal": 4,
"in_channels": 3,
"latent_channels": 32,
"layers_per_block": 2,
"out_channels": 3,
"sample_size": 256,
"sample_tsize": 64,
"scaling_factor": 1.03682,
"shift_factor": null,
"upsample_match_channel": true,
"enable_tiling": true
},
"tokenizer": [
{
"autotokenizer_name": "hunyuan15MLLmTokenizer",
"hub_backend": "hf",
"from_pretrained": "HunyuanVideo1.5/text_encoder/llm",
"padding_side": "right",
"template_file_path": "examples/hunyuanvideo_1.5/template.json",
"template_id": "li-dit-encode-video-json",
"model_max_length": 300
},
{
"autotokenizer_name": "hunyuan15GlyphTokenizer",
"hub_backend": "hf",
"from_pretrained": "HunyuanVideo1.5/text_encoder/byt5-small",
"byt5_max_length": 256,
"color_ann_path": "HunyuanVideo1.5/text_encoder/Glyph-SDXL-v2/assets/color_idx.json",
"font_ann_path": "HunyuanVideo1.5/text_encoder/Glyph-SDXL-v2/assets/multilingual_10-lang_idx.json"
}
],
"text_encoder": [
{
"model_id": "Hunyuan15MLLmModel",
"dtype": "fp16",
"from_pretrained": "HunyuanVideo1.5/text_encoder/llm",
"hub_backend": "hf",
"use_attention_mask": true,
"hidden_state_skip_layer": 2,
"output_key": "hidden_states",
"template_file_path": "examples/hunyuanvideo_1.5/template.json",
"template_id": "li-dit-encode-video-json",
"low_cpu_mem_usage": true
},
{
"model_id": "Hunyuan15GlyphModel",
"dtype": "fp16",
"hub_backend": "hf",
"from_pretrained": "HunyuanVideo1.5/text_encoder/byt5-small",
"byt5_max_length": 256,
"hidden_state_skip_layer": 2,
"output_key": "hidden_states",
"byT5_ckpt_path": "HunyuanVideo1.5/text_encoder/Glyph-SDXL-v2/checkpoints/byt5_model.pt",
"color_ann_path": "HunyuanVideo1.5/text_encoder/Glyph-SDXL-v2/assets/color_idx.json",
"font_ann_path": "HunyuanVideo1.5/text_encoder/Glyph-SDXL-v2/assets/multilingual_10-lang_idx.json"
}
],
"predictor": {
"model_id": "hunyuanvideo15dit",
"from_pretrained": "HunyuanVideo1.5/transformer/720p_t2v/diffusion_pytorch_model.safetensors",
"dtype": "bf16",
"patch_size": [1, 1, 1],
"in_channels": 32,
"concat_condition": true,
"out_channels": 32,
"hidden_size": 2048,
"num_heads": 16,
"head_dim": 128,
"mlp_width_ratio": 4,
"mlp_act_type": "gelu_tanh",
"mm_double_blocks_depth": 54,
"mm_single_blocks_depth": 0,
"rope_dim_list": [16, 56, 56],
"qkv_bias": true,
"qk_norm": true,
"qk_norm_type": "rms",
"guidance_embed": false,
"use_meanflow": false,
"text_projection": "single_refiner",
"use_attention_mask": true,
"text_states_dim": 3584,
"text_states_dim_2": null,
"text_pool_type": null,
"rope_theta": 256,
"attn_mode": "flash2",
"attn_param": {
"win_size": [[3, 3, 3]],
"win_type": "fixed",
"win_ratio": 10,
"tile_size": [6, 8, 8],
"ssta_topk": 64,
"ssta_threshold": 0.0,
"ssta_lambda": 0.7,
"ssta_sampling_type": "importance",
"ssta_adaptive_pool": null,
"attn_sparse_type": "ssta",
"attn_pad_type": "zero",
"attn_use_text_mask": 1,
"attn_mask_share_within_head": 0
},
"glyph_byT5_v2": true,
"vision_projection": "linear",
"vision_states_dim": 1152,
"is_reshape_temporal_channels": false,
"use_cond_type_embedding": true,
"task_type": "t2v"
},
"diffusion": {
"model_id": "hunyuanvideo_15_diffusion",
"num_inference_timesteps": 50,
"shift": 5.0,
"reverse": true,
"solver": "euler",
"snr": "lognorm",
"sp_size": 8,
"dp_replicate": 1
},
"pipeline_config": {
"input_size": [
121,
480,
848
],
"guidance_scale": 6.0,
"guidance_rescale": 0.0,
"cpu_offload": false,
"aspect_ratio": "16:9",
"resolution": "480p",
"ideal_resolution": "480p",
"glyph_byT5_v2": true,
"flow_shift": 5.0,
"vision_num_semantic_tokens": 729,
"task": "t2v",
"use_attention_mask": true,
"seed": 42,
"use_meanflow": false,
"enable_offloading": true
},
"save_path": "./hunyuanvideo_t2v_samples/",
"prompt": "examples/hunyuanvideo_1.5/t2v/samples_prompts.txt",
"dtype": "bf16",
"device": "npu",
"pipeline_class": "HunyuanVideo15Pipeline",
"frame_interval": 1,
"fps": 24,
"use_prompt_preprocess": false
}