From 2448e700e32cd7a6659658a6f19e52bf2a879a79 Mon Sep 17 00:00:00 2001 From: Edward Hu <41635632+edwardjhu@users.noreply.github.com> Date: Sun, 22 Jan 2023 12:28:55 -0800 Subject: [PATCH] Update main.py --- examples/Transformer/main.py | 1 - 1 file changed, 1 deletion(-) diff --git a/examples/Transformer/main.py b/examples/Transformer/main.py index 9af4383..3c6dc80 100644 --- a/examples/Transformer/main.py +++ b/examples/Transformer/main.py @@ -312,7 +312,6 @@ if __name__ == '__main__': if args.deferred_init: from torchdistx.deferred_init import deferred_init # We don't need to instantiate the base and delta models - # Note: this only works with torch nightly since unsqueeze isn't supported for fake tensors in stable base_shapes = get_shapes( deferred_init(mdl.TransformerModel, args, ntokens, ninp=args.d_model, nhead=args.nhead, nhid=args.d_model*args.ffn_ratio, nlayers=args.nlayers, dropout=args.dropout, tied=args.tied, bias=args.bias, encoder_var=args.init_var,