{
  "_comment": "Wan2.2 i2v MoE 4-step distill, fp8 e4m3 quantized. Built for 24 GB-class GPUs — cpu_offload keeps DIT layers swapping in block-by-block. Derived from LightX2V's configs/distill/wan22/wan_moe_i2v_distill_4090.json plus the quant scheme + ckpt overrides from wan_moe_i2v_distill_quant.json. high_noise_quantized_ckpt / low_noise_quantized_ckpt are filled in at runtime by server/video_models/wan22.py with absolute paths to the files downloaded into HF_HOME.",

  "infer_steps": 4,
  "target_video_length": 81,
  "text_len": 512,

  "resize_mode": "adaptive",
  "resolution": "480p",
  "target_height": 480,
  "target_width": 480,
  "fps": 16,

  "self_attn_1_type": "flash_attn3",
  "cross_attn_1_type": "flash_attn3",
  "cross_attn_2_type": "flash_attn3",

  "sample_guide_scale": [3.5, 3.5],
  "sample_shift": 5.0,
  "enable_cfg": false,

  "cpu_offload": true,
  "offload_granularity": "block",
  "lazy_load": true,
  "t5_cpu_offload": true,
  "vae_cpu_offload": false,

  "use_image_encoder": false,

  "boundary_step_index": 2,
  "denoising_step_list": [1000, 750, 500, 250],

  "dit_quantized": true,
  "dit_quant_scheme": "fp8-sgl",
  "t5_quantized": false
}