We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 236dc78, commit 1c402d3 (Copy full SHA for 1c402d3)
1 file changed
src/fairseq2/models/opt/_config.py
@@ -28,7 +28,7 @@ class OPTConfig:
28
max_seq_len: int = 2048 + 1
29
"""The maximum sequence length."""
30
31
- vocab_size: int = 50272
+ vocab_size: int = 258
32
"""The size of the vocabulary."""
33
34
pad_idx: int | None = 1
@@ -61,3 +61,11 @@ def register_opt_configs(context: RuntimeContext) -> None:
61
@arch("opt_125m")
62
def opt_125m() -> OPTConfig:
63
return OPTConfig()
64
+
65
+ @arch("opt_350m")
66
+ def opt_350m() -> OPTConfig:
67
+ config = opt_125m()
68
69
+ config.model_dim = 1024
70
+ config.num_layers = 24
71
+ config.num_attn_heads = 16
0 commit comments