# Transformer_500M / modules.py
# yagizdevre
# Commit message: "config and model are added"
# Commit: cbda9b7
from .attn import Attention
from .attn import AttentionSDPA
from .mlp import MLP
from .stu import STU