# Model configuration: the `tiny` preset of the `dimamba` model type.
# NOTE(review): the `${...}` values look like Hydra/OmegaConf interpolations
# resolved from other config groups (`model`, `data`) — confirm with the loader.
name: tiny
type: dimamba

# Size and regularization settings.
hidden_size: 128
cond_dim: 128
length: ${model.length}  # Same length as diffusion model
n_blocks: 4
scale_by_sigma: true
dropout: 0.1
tie_word_embeddings: false

# Bidirectional settings.
# `bidirectional` was previously written as `True,`; the stray trailing comma
# made the value the string "True," rather than a boolean.
bidirectional: true
bidirectional_strategy: add
bidirectional_weight_tie: true

# Classification settings.
# NOTE(review): presumably `pooling` selects how features are reduced before
# a `num_classes`-way output — verify against the model code.
num_classes: ${data.num_classes}
pooling: mean