Skip to content

Commit c26bd22

Browse files
author
Ali Taghibakhshi
committed
cleanup
1 parent 57008da commit c26bd22

File tree

1 file changed

+4
-27
lines changed

1 file changed

+4
-27
lines changed

scripts/checkpoint_converters/convert_mamba2_pyt_to_nemo.py

Lines changed: 4 additions & 27 deletions
Original file line number | Diff line number | Diff line change
@@ -16,7 +16,6 @@
1616
import re
1717
from argparse import ArgumentParser
1818
from collections import defaultdict
19-
2019
import torch
2120
import torch.distributed as dist
2221
from megatron.core.dist_checkpointing.serialization import load_plain_tensors
@@ -25,7 +24,10 @@
2524
from megatron.core.transformer.spec_utils import import_module
2625
from megatron.training.arguments import core_transformer_config_from_args
2726
from omegaconf.omegaconf import OmegaConf
28-
27+
from datetime import timedelta
28+
import megatron.core.parallel_state as ps
29+
from torch._C._distributed_c10d import PrefixStore
30+
from torch.distributed import rendezvous
2931
from nemo.collections.nlp.models.language_modeling.megatron_mamba_model import MegatronMambaModel
3032
from nemo.collections.nlp.parts.megatron_trainer_builder import MegatronLMPPTrainerBuilder
3133
from nemo.collections.nlp.parts.utils_funcs import torch_dtype_from_precision
@@ -92,31 +94,6 @@ def get_args():
9294
args = parser.parse_args()
9395
return args
9496

95-
96-
import os
97-
from datetime import timedelta
98-
99-
import megatron.core.parallel_state as ps
100-
import torch
101-
from torch._C._distributed_c10d import PrefixStore
102-
from torch.distributed import rendezvous
103-
104-
105-
class TestModel(torch.nn.Module):
106-
def __init__(
107-
self,
108-
input_dim: int,
109-
output_dim: int,
110-
num_layers: int,
111-
bias: bool,
112-
shared_embedding: bool = False,
113-
):
114-
super().__init__()
115-
self.layers = torch.nn.ModuleList([torch.nn.Linear(input_dim, output_dim, bias) for _ in range(num_layers)])
116-
if shared_embedding:
117-
self.layers[-1].weight.shared_embedding = True
118-
119-
12097
try:
12198

12299
class Utils:

0 commit comments

Comments
 (0)