{
"predictor": {
"model_id": "videoditsparsei2v",
"from_pretrained": "./weights/sparsedit/sparsediti2v_mm.pth",
"dtype": "fp16",
"num_layers": 32,
"num_heads": 24,
"head_dim": 96,
"in_channels": 8,
"out_channels": 8,
"dropout": 0.0,
"cross_attention_dim": 2304,
"attention_q_bias": true,
"attention_k_bias": true,
"attention_v_bias": true,
"fa_layout": "sbh",
"patch_size_thw": [1, 2, 2],
"activation_fn": "gelu-approximate",
"norm_elementwise_affine": false,
"norm_eps": 1e-06,
"caption_channels": 4096,
"interpolation_scale": [1.0, 1.0, 1.0],
"sparse1d": true,
"sparse_n": 4
},
"ae": {
"model_id": "wfvae",
"from_pretrained": "./weights/vae/wfvae_mm.pt",
"dtype": "fp16",
"base_channels": 128,
"decoder_energy_flow_hidden_size": 128,
"decoder_num_resblocks": 2,
"dropout": 0.0,
"encoder_energy_flow_hidden_size": 64,
"encoder_num_resblocks": 2,
"latent_dim": 8,
"use_attention": true,
"norm_type": "aelayernorm",
"t_interpolation": "trilinear",
"vae_scale_factor": [4, 8, 8]
},
"text_encoder": {
"model_id": "MT5",
"hub_backend": "hf",
"from_pretrained": "./weights/google/mt5-xxl",
"dtype": "fp16"
},
"tokenizer": {
"hub_backend": "hf",
"autotokenizer_name": "AutoTokenizer",
"from_pretrained": "./weights/google/mt5-xxl",
"model_max_length": 512
},
"diffusion": {
"model_id": "EulerAncestralDiscrete",
"num_inference_steps": 100,
"guidance_scale": 7.5,
"prediction_type": "v_prediction",
"rescale_betas_zero_snr": true,
"device": "npu",
"timestep_spacing": "trailing"
},
"pipeline_config": {
"version": "v1.3",
"use_attention_mask": true,
"input_size": [93, 352, 640],
"model_type": "i2v"
},
"frame_interval": 1,
"save_path": "examples/opensoraplan1.3/i2v/samples/",
"fps": 18,
"prompt": "examples/opensoraplan1.3/i2v/cond_prompt.txt",
"use_prompt_preprocess": false,
"pipeline_class": "OpenSoraPlanPipeline",
"device": "npu",
"dtype": "fp16",
"conditional_pixel_values_path": "examples/opensoraplan1.3/i2v/cond_pix_path.txt",
"mask_type": "i2v",
"crop_for_hw": true,
"max_hxw": 236544
}