Force fp16 inputs to fp32 to avoid NaN output in timestep_transform

HangXu 2024-06-21 11:15:39 +03:00 committed by GitHub
parent 033c2b3c82
commit 04d2ee0182


@@ -15,6 +15,11 @@ def timestep_transform(
     scale=1.0,
     num_timesteps=1,
 ):
+    # Force fp16 input to fp32 to avoid nan output
+    for key in ["height", "width", "num_frames"]:
+        if model_kwargs[key].dtype == torch.float16:
+            model_kwargs[key] = model_kwargs[key].float()
+
     t = t / num_timesteps
     resolution = model_kwargs["height"] * model_kwargs["width"]
     ratio_space = (resolution / base_resolution).sqrt()
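
Why fp16 produces NaN here: float16 cannot represent values above 65504, so multiplying common video dimensions (e.g. 720 x 1280 = 921600) overflows to inf, and the downstream division and sqrt then propagate inf/NaN. A minimal sketch of the failure mode and the upcast fix applied by this commit (the resolution values are illustrative, not taken from the commit):

import torch

# float16 saturates above 65504, so height * width for a common
# video resolution overflows to inf.
height = torch.tensor(720.0, dtype=torch.float16)
width = torch.tensor(1280.0, dtype=torch.float16)

resolution_fp16 = height * width
print(resolution_fp16)                    # tensor(inf, dtype=torch.float16)

# inf then propagates through later arithmetic: inf / inf is nan.
print(resolution_fp16 / resolution_fp16)  # tensor(nan, dtype=torch.float16)

# The fix: upcast to fp32 before the arithmetic, as the diff does
# with .float() on the affected model_kwargs entries.
resolution_fp32 = height.float() * width.float()
print(resolution_fp32)                    # tensor(921600.)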