self.learn_sigma = learn_sigma @@ -118,6 +119,7 @@ def __init__( self.no_temporal_pos_emb = no_temporal_pos_emb self.mlp_ratio = mlp_ratio self.depth = depth assert enable_sequence_parallelism is False, "Sequence parallelism is not supported in DiT" self.register_buffer("pos_embe...