зеркало из https://github.com/microsoft/archai.git
fix(config_hf_gpt2): Fixes weight initialization range value.
This commit is contained in:
Родитель
cbad680dfa
Коммит
6d8d827ba5
|
@@ -33,7 +33,7 @@ class HfGPT2Config(Config, PretrainedConfig):
|
|||
d_inner: Optional[int] = 2048,
|
||||
dropout: Optional[float] = 0.1,
|
||||
dropatt: Optional[float] = 0.0,
|
||||
- weight_init_std: Optional[float] = 0.0,
|
||||
+ weight_init_std: Optional[float] = 0.02,
|
||||
n_layer: Optional[int] = 16,
|
||||
n_head: Optional[int] = 8,
|
||||
embd_pdrop: Optional[float] = 0.0,
|
||||
|
@@ -111,7 +111,7 @@ class HfGPT2FlexConfig(HfGPT2Config):
|
|||
d_inner: Optional[Union[int, List[int]]] = 2048,
|
||||
dropout: Optional[float] = 0.1,
|
||||
dropatt: Optional[float] = 0.0,
|
||||
- weight_init_std: Optional[float] = 0.0,
|
||||
+ weight_init_std: Optional[float] = 0.02,
|
||||
n_layer: Optional[int] = 16,
|
||||
n_head: Optional[Union[int, List[int]]] = 8,
|
||||
embd_pdrop: Optional[float] = 0.0,
|
||||
|
|
Загрузка…
Ссылка в новой задаче