Skip to content

Commit

Permalink
minor fix
Browse files Browse the repository at this point in the history
  • Loading branch information
Ali Taghibakhshi committed Dec 16, 2024
1 parent 30006df commit dcf81f5
Showing 1 changed file with 5 additions and 0 deletions.
5 changes: 5 additions & 0 deletions nemo/collections/llm/gpt/model/hyena.py
Original file line number Diff line number Diff line change
Expand Up @@ -99,12 +99,17 @@ class HyenaConfig(TransformerConfig, io.IOMixin):
remove_activation_post_first_layer: bool = True
cross_entropy_loss_fusion: bool = True
tp_comm_overlap: bool = True
bias_activation_fusion: bool = True
bias_dropout_add_fusion: bool = True

def __post_init__(self):
    """Finish initialization after the parent's post-init has run.

    Sets ``hyena_no_weight_decay_cond_fn`` to ``hyena_no_weight_decay_cond``
    when ``hyena_filter_no_wd`` is truthy, and to ``None`` otherwise.
    """
    super().__post_init__()
    # Only install the no-weight-decay condition when it is requested.
    if self.hyena_filter_no_wd:
        self.hyena_no_weight_decay_cond_fn = hyena_no_weight_decay_cond
    else:
        self.hyena_no_weight_decay_cond_fn = None

def configure_model(self, tokenizer) -> "MCoreHyenaModel":

self.bias_activation_fusion = False if self.remove_activation_post_first_layer else self.bias_activation_fusion

model = MCoreHyenaModel(
self,
hyena_stack_spec=hyena_stack_spec,
Expand Down

0 comments on commit dcf81f5

Please sign in to comment.