Skip to content

Commit

Permalink
reflect use_parallel_residual to mlp_after_attn
Browse files: browse the repository at this point in the history
  • Loading branch information
twaka authored Aug 24, 2023
1 parent 3e82cb6 commit 02516c3
Showing 1 changed file with 1 addition and 0 deletions.
1 change: 1 addition & 0 deletions deepspeed/module_inject/containers/gptneox.py
Original file line number Diff line number Diff line change
Expand Up @@ -22,6 +22,7 @@ def __init__(self, **kwargs):
super().__init__(**kwargs)

# All model-specific things should be defined here instead of in the base class.
self.mlp_after_attn = not getattr(self.model_config, "use_parallel_residual", not self.mlp_after_attn)

def create_module(self, config=None):
_config = config if config is not None else self.ds_model_config
Expand Down

0 comments on commit 02516c3

Please sign in to comment.