mirror of
https://github.com/hpcaitech/Open-Sora.git
synced 2026-04-10 21:01:26 +02:00
fix typo
This commit is contained in:
parent
2ca632a2d1
commit
bbc64bcb72
|
|
@ -12,7 +12,7 @@ dtype = "bf16"
|
||||||
|
|
||||||
model = dict(
|
model = dict(
|
||||||
type="STDiT3-XL/2",
|
type="STDiT3-XL/2",
|
||||||
from_pretrained="/home/guoxinying/open_source_video_ocean_V1/OpenSora-STDiT-v4",
|
from_pretrained="hpcaitech/OpenSora-STDiT-v4",
|
||||||
qk_norm=True,
|
qk_norm=True,
|
||||||
enable_flash_attn=True,
|
enable_flash_attn=True,
|
||||||
enable_layernorm_kernel=True,
|
enable_layernorm_kernel=True,
|
||||||
|
|
@ -22,7 +22,7 @@ model = dict(
|
||||||
)
|
)
|
||||||
vae = dict(
|
vae = dict(
|
||||||
type="OpenSoraVAE_V1_3",
|
type="OpenSoraVAE_V1_3",
|
||||||
from_pretrained="/home/guoxinying/open_source_video_ocean_V1/OpenSora-VAE-v1.3",
|
from_pretrained="hpcaitech/OpenSora-VAE-v1.3",
|
||||||
z_channels=16,
|
z_channels=16,
|
||||||
micro_batch_size=1,
|
micro_batch_size=1,
|
||||||
micro_batch_size_2d=4,
|
micro_batch_size_2d=4,
|
||||||
|
|
@ -35,7 +35,7 @@ vae = dict(
|
||||||
)
|
)
|
||||||
text_encoder = dict(
|
text_encoder = dict(
|
||||||
type="t5",
|
type="t5",
|
||||||
from_pretrained="/mnt/jfs-hdd/sora/checkpoints/pretrained_models/t5-v1_1-xxl",
|
from_pretrained="DeepFloyd/t5-v1_1-xxl",
|
||||||
model_max_length=300,
|
model_max_length=300,
|
||||||
)
|
)
|
||||||
scheduler = dict(
|
scheduler = dict(
|
||||||
|
|
|
||||||
|
|
@ -18,7 +18,7 @@ use_oscillation_guidance_for_image = True
|
||||||
|
|
||||||
model = dict(
|
model = dict(
|
||||||
type="STDiT3-XL/2",
|
type="STDiT3-XL/2",
|
||||||
from_pretrained="/home/guoxinying/open_source_video_ocean_V1/OpenSora-STDiT-v4",
|
from_pretrained="hpcaitech/OpenSora-STDiT-v4",
|
||||||
qk_norm=True,
|
qk_norm=True,
|
||||||
enable_flash_attn=True,
|
enable_flash_attn=True,
|
||||||
enable_layernorm_kernel=True,
|
enable_layernorm_kernel=True,
|
||||||
|
|
@ -29,7 +29,7 @@ model = dict(
|
||||||
)
|
)
|
||||||
vae = dict(
|
vae = dict(
|
||||||
type="OpenSoraVAE_V1_3",
|
type="OpenSoraVAE_V1_3",
|
||||||
from_pretrained="/home/guoxinying/open_source_video_ocean_V1/OpenSora-VAE-v1.3",
|
from_pretrained="hpcaitech/OpenSora-VAE-v1.3",
|
||||||
z_channels=16,
|
z_channels=16,
|
||||||
micro_batch_size=1,
|
micro_batch_size=1,
|
||||||
micro_batch_size_2d=4,
|
micro_batch_size_2d=4,
|
||||||
|
|
@ -42,7 +42,7 @@ vae = dict(
|
||||||
)
|
)
|
||||||
text_encoder = dict(
|
text_encoder = dict(
|
||||||
type="t5",
|
type="t5",
|
||||||
from_pretrained="/mnt/jfs-hdd/sora/checkpoints/pretrained_models/t5-v1_1-xxl",
|
from_pretrained="DeepFloyd/t5-v1_1-xxl",
|
||||||
model_max_length=300,
|
model_max_length=300,
|
||||||
)
|
)
|
||||||
scheduler = dict(
|
scheduler = dict(
|
||||||
|
|
|
||||||
|
|
@ -25,7 +25,7 @@ model = dict(
|
||||||
)
|
)
|
||||||
vae = dict(
|
vae = dict(
|
||||||
type="OpenSoraVAE_V1_3",
|
type="OpenSoraVAE_V1_3",
|
||||||
from_pretrained="/home/guoxinying/open_source_video_ocean_V1/OpenSora-VAE-v1.3",
|
from_pretrained="hpcaitech/OpenSora-VAE-v1.3",
|
||||||
z_channels=16,
|
z_channels=16,
|
||||||
micro_batch_size=1,
|
micro_batch_size=1,
|
||||||
micro_batch_size_2d=4,
|
micro_batch_size_2d=4,
|
||||||
|
|
|
||||||
|
|
@ -26,22 +26,16 @@ plugin = "zero2"
|
||||||
# Model settings
|
# Model settings
|
||||||
model = dict(
|
model = dict(
|
||||||
type="STDiT3-XL/2",
|
type="STDiT3-XL/2",
|
||||||
from_pretrained="outputs/0373-STDiT3-XL-2/epoch3-global_step36000/ema.pt",
|
from_pretrained=None,
|
||||||
qk_norm=True,
|
qk_norm=True,
|
||||||
enable_flash_attn=True,
|
enable_flash_attn=True,
|
||||||
enable_layernorm_kernel=True,
|
enable_layernorm_kernel=True,
|
||||||
adapt_16ch=True,
|
adapt_16ch=True,
|
||||||
skip_temporal=True,
|
skip_temporal=True,
|
||||||
)
|
)
|
||||||
# vae = dict(
|
|
||||||
# type="VideoAutoencoderKL",
|
|
||||||
# from_pretrained="PixArt-alpha/pixart_sigma_sdxlvae_T5_diffusers",
|
|
||||||
# subfolder="vae",
|
|
||||||
# scaling_factor=0.13025,
|
|
||||||
# )
|
|
||||||
vae = dict(
|
vae = dict(
|
||||||
type="OpenSoraVAE_V1_3",
|
type="OpenSoraVAE_V1_3",
|
||||||
from_pretrained="/home/guoxinying/open_source_video_ocean_V1/OpenSora-VAE-v1.3",
|
from_pretrained="hpcaitech/OpenSora-VAE-v1.3",
|
||||||
z_channels=16,
|
z_channels=16,
|
||||||
micro_batch_size=1,
|
micro_batch_size=1,
|
||||||
micro_batch_size_2d=4,
|
micro_batch_size_2d=4,
|
||||||
|
|
|
||||||
|
|
@ -63,7 +63,7 @@ model = dict(
|
||||||
)
|
)
|
||||||
vae = dict(
|
vae = dict(
|
||||||
type="OpenSoraVAE_V1_3",
|
type="OpenSoraVAE_V1_3",
|
||||||
from_pretrained="/home/guoxinying/open_source_video_ocean_V1/OpenSora-VAE-v1.3",
|
from_pretrained="hpcaitech/OpenSora-VAE-v1.3",
|
||||||
z_channels=16,
|
z_channels=16,
|
||||||
micro_batch_size=1,
|
micro_batch_size=1,
|
||||||
micro_batch_size_2d=4,
|
micro_batch_size_2d=4,
|
||||||
|
|
@ -76,7 +76,7 @@ vae = dict(
|
||||||
)
|
)
|
||||||
text_encoder = dict(
|
text_encoder = dict(
|
||||||
type="t5",
|
type="t5",
|
||||||
from_pretrained="pretrained_models/t5-v1_1-xxl",
|
from_pretrained="DeepFloyd/t5-v1_1-xxl",
|
||||||
model_max_length=300,
|
model_max_length=300,
|
||||||
shardformer=True,
|
shardformer=True,
|
||||||
)
|
)
|
||||||
|
|
|
||||||
|
|
@ -33,7 +33,7 @@ model = dict(
|
||||||
)
|
)
|
||||||
vae = dict(
|
vae = dict(
|
||||||
type="OpenSoraVAE_V1_3",
|
type="OpenSoraVAE_V1_3",
|
||||||
from_pretrained="/home/guoxinying/open_source_video_ocean_V1/OpenSora-VAE-v1.3",
|
from_pretrained="hpcaitech/OpenSora-VAE-v1.3",
|
||||||
z_channels=16,
|
z_channels=16,
|
||||||
micro_batch_size=1,
|
micro_batch_size=1,
|
||||||
micro_batch_size_2d=4,
|
micro_batch_size_2d=4,
|
||||||
|
|
|
||||||
|
|
@ -53,7 +53,7 @@ model = dict(
|
||||||
)
|
)
|
||||||
vae = dict(
|
vae = dict(
|
||||||
type="OpenSoraVAE_V1_3",
|
type="OpenSoraVAE_V1_3",
|
||||||
from_pretrained="/home/guoxinying/open_source_video_ocean_V1/OpenSora-VAE-v1.3",
|
from_pretrained="hpcaitech/OpenSora-VAE-v1.3",
|
||||||
z_channels=16,
|
z_channels=16,
|
||||||
micro_batch_size=1,
|
micro_batch_size=1,
|
||||||
micro_batch_size_2d=4,
|
micro_batch_size_2d=4,
|
||||||
|
|
|
||||||
|
|
@ -24,14 +24,14 @@ plugin = "zero2"
|
||||||
# Model settings
|
# Model settings
|
||||||
model = dict(
|
model = dict(
|
||||||
type="STDiT3-XL/2",
|
type="STDiT3-XL/2",
|
||||||
from_pretrained="outputs/0461-STDiT3-XL-2/epoch3-global_step40000/ema.pt",
|
from_pretrained=None,
|
||||||
qk_norm=True,
|
qk_norm=True,
|
||||||
enable_flash_attn=True,
|
enable_flash_attn=True,
|
||||||
enable_layernorm_kernel=True,
|
enable_layernorm_kernel=True,
|
||||||
)
|
)
|
||||||
vae = dict(
|
vae = dict(
|
||||||
type="OpenSoraVAE_V1_3",
|
type="OpenSoraVAE_V1_3",
|
||||||
from_pretrained="/home/guoxinying/open_source_video_ocean_V1/OpenSora-VAE-v1.3",
|
from_pretrained="hpcaitech/OpenSora-VAE-v1.3",
|
||||||
z_channels=16,
|
z_channels=16,
|
||||||
micro_batch_size=1,
|
micro_batch_size=1,
|
||||||
micro_batch_size_2d=4,
|
micro_batch_size_2d=4,
|
||||||
|
|
|
||||||
|
|
@ -33,7 +33,7 @@ model = dict(
|
||||||
)
|
)
|
||||||
vae = dict(
|
vae = dict(
|
||||||
type="OpenSoraVAE_V1_3",
|
type="OpenSoraVAE_V1_3",
|
||||||
from_pretrained="/home/guoxinying/open_source_video_ocean_V1/OpenSora-VAE-v1.3",
|
from_pretrained="hpcaitech/OpenSora-VAE-v1.3",
|
||||||
z_channels=16,
|
z_channels=16,
|
||||||
micro_batch_size=1,
|
micro_batch_size=1,
|
||||||
micro_batch_size_2d=4,
|
micro_batch_size_2d=4,
|
||||||
|
|
|
||||||
|
|
@ -33,7 +33,7 @@ model = dict(
|
||||||
)
|
)
|
||||||
vae = dict(
|
vae = dict(
|
||||||
type="OpenSoraVAE_V1_3",
|
type="OpenSoraVAE_V1_3",
|
||||||
from_pretrained="/home/guoxinying/open_source_video_ocean_V1/OpenSora-VAE-v1.3",
|
from_pretrained="hpcaitech/OpenSora-VAE-v1.3",
|
||||||
z_channels=16,
|
z_channels=16,
|
||||||
micro_batch_size=1,
|
micro_batch_size=1,
|
||||||
micro_batch_size_2d=4,
|
micro_batch_size_2d=4,
|
||||||
|
|
|
||||||
Loading…
Reference in a new issue