Skip to content

Commit afee1b7

Browse files
committed
nemotron-h 56b auto backend
Signed-off-by: Malay Nagda <[email protected]>
1 parent b3571fb commit afee1b7

File tree

1 file changed

+3
-0
lines changed

1 file changed

+3
-0
lines changed

src/megatron/bridge/models/nemotronh/nemotron_h_provider.py

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -18,6 +18,7 @@
18 18   from typing import Callable
19 19
20 20   from megatron.core.activations import squared_relu
   21 + from megatron.core.transformer.enums import AttnBackend
21 22
22 23   from megatron.bridge.models.mamba.mamba_provider import MambaModelProvider
23 24   from megatron.bridge.utils.common_utils import get_rank_safe
@@ -102,6 +103,8 @@ class NemotronHModelProvider56B(NemotronHModelProvider):
102 103       ffn_hidden_size: int = 32768
103 104       num_attention_heads: int = 64
104 105
    106 +     attention_backend: AttnBackend = AttnBackend.auto
    107 +
105 108
106 109   @dataclass
107 110   class NemotronNanoModelProvider9Bv2(NemotronHModelProvider):

0 commit comments

Comments
 (0)