Increase model size to match diffusion.

This commit is contained in:
Mahi Shafiullah 2025-02-03 23:30:47 -05:00
parent d4e7b355a9
commit e82b4c9460
1 changed files with 4 additions and 4 deletions

View File

@ -122,11 +122,11 @@ class DiTFlowConfig(PreTrainedConfig):
# Diffusion Transformer (DiT) parameters.
frequency_embedding_dim: int = 256
hidden_dim: int = 256
hidden_dim: int = 512
num_blocks: int = 6
num_heads: int = 8
dropout: float = 0.0
dim_feedforward: int = 2048
num_heads: int = 16
dropout: float = 0.1
dim_feedforward: int = 4096
activation: str = "gelu"
# Noise scheduler.