We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent ceba38f commit cc8ff45Copy full SHA for cc8ff45
nemo/collections/llm/gpt/model/hyena.py
@@ -316,6 +316,7 @@ class Hyena1bConfig(HyenaConfig):
316
317
hybrid_override_pattern: str = "SDH*SDHSDH*SDHSDH*SDHSDH*"
318
num_layers: int = 25
319
+ recompute_num_layers: int = 5 # must evenly divide num_layers (i.e. num_layers is a multiple of this value)
320
seq_length: int = 8192
321
hidden_size: int = 1920
322
num_groups_hyena: int = 1920
0 commit comments