Fix Graphormer Large Architecture (#83)
This commit is contained in:
Родитель
9578d1b2ad
Коммит
769567c787
|
@@ -331,11 +331,11 @@ def graphormer_slim_architecture(args):
|
|||
|
||||
@register_model_architecture("graphormer", "graphormer_large")
|
||||
def graphormer_large_architecture(args):
|
||||
-args.encoder_embed_dim = getattr(args, "encoder_embed_dim", 768)
|
||||
+args.encoder_embed_dim = getattr(args, "encoder_embed_dim", 1024)
|
||||
|
||||
args.encoder_layers = getattr(args, "encoder_layers", 24)
|
||||
|
||||
-args.encoder_attention_heads = getattr(args, "encoder_attention_heads", 42)
|
||||
+args.encoder_attention_heads = getattr(args, "encoder_attention_heads", 32)
|
||||
args.encoder_ffn_embed_dim = getattr(args, "encoder_ffn_embed_dim", 1024)
|
||||
|
||||
args.activation_fn = getattr(args, "activation_fn", "gelu")
|
||||
|
|
Загрузка…
Ссылка в новой задаче