Merge pull request #523 from BurkeHulk/hotfix/fp16_nan_output

Force fp16 input to fp32 to avoid nan output in timestep_transform
This commit is contained in:
Zheng Zangwei (Alex Zheng) 2024-06-21 18:01:17 +08:00 committed by GitHub
commit 9b668e1c4e

View file

@@ -15,6 +15,11 @@ def timestep_transform(
scale=1.0,
num_timesteps=1,
):
# Force fp16 input to fp32 to avoid nan output
for key in ["height", "width", "num_frames"]:
if model_kwargs[key].dtype == torch.float16:
model_kwargs[key] = model_kwargs[key].float()
t = t / num_timesteps
resolution = model_kwargs["height"] * model_kwargs["width"]
ratio_space = (resolution / base_resolution).sqrt()