Increase model size to match diffusion.
This commit is contained in:
parent
d4e7b355a9
commit
e82b4c9460
|
@@ -122,11 +122,11 @@ class DiTFlowConfig(PreTrainedConfig):
|
||||||
|
|
||||||
# Diffusion Transformer (DiT) parameters.
|
# Diffusion Transformer (DiT) parameters.
|
||||||
frequency_embedding_dim: int = 256
|
frequency_embedding_dim: int = 256
|
||||||
hidden_dim: int = 256
|
hidden_dim: int = 512
|
||||||
num_blocks: int = 6
|
num_blocks: int = 6
|
||||||
num_heads: int = 8
|
num_heads: int = 16
|
||||||
dropout: float = 0.0
|
dropout: float = 0.1
|
||||||
dim_feedforward: int = 2048
|
dim_feedforward: int = 4096
|
||||||
activation: str = "gelu"
|
activation: str = "gelu"
|
||||||
|
|
||||||
# Noise scheduler.
|
# Noise scheduler.
|
||||||
|
|
Loading…
Reference in New Issue