EleutherAI · haileyschoelkopf · Mar 27, 2024 · Mar 27, 2024
@@ -34,29 +34,17 @@
 )
 
 
-try:
- from nemo.collections.nlp.models.language_modeling.megatron_gpt_model import (
- MegatronGPTModel,
- )
- from nemo.collections.nlp.modules.common.text_generation_utils import generate
- from nemo.collections.nlp.parts.nlp_overrides import (
- NLPDDPStrategy,
- NLPSaveRestoreConnector,
- )
- from nemo.utils.app_state import AppState
- from pytorch_lightning.trainer.trainer import Trainer
-except ModuleNotFoundError:
- raise Exception(
- "Attempted to use 'nemo_lm' model type, but package `nemo` is not installed"
- "Please install nemo following the instructions in the README: either with a NVIDIA PyTorch or NeMo container, "
- "or installing nemo following https://github.com/NVIDIA/NeMo.",
- )
-
-
 def _patch_pretrained_cfg(
  pretrained_cfg, trainer, tensor_model_parallel_size, pipeline_model_parallel_size
 ):
- import omegaconf
+ try:
+ import omegaconf
+ except ModuleNotFoundError:
+ raise Exception(
+ "Attempted to use 'nemo_lm' model type, but package `nemo` is not installed. "
+ "Please install nemo following the instructions in the README: either with a NVIDIA PyTorch or NeMo container, "
+ "or installing nemo following https://github.com/NVIDIA/NeMo.",
+ )
 
  omegaconf.OmegaConf.set_struct(pretrained_cfg, True)
  with omegaconf.open_dict(pretrained_cfg):
@@ -86,6 +74,17 @@ def load_model(
  tensor_model_parallel_size: int,
  pipeline_model_parallel_size: int,
 ) -> torch.nn.Module:
+ try:
+ from nemo.collections.nlp.models.language_modeling.megatron_gpt_model import (
+ MegatronGPTModel,
+ )
+ from nemo.collections.nlp.parts.nlp_overrides import NLPSaveRestoreConnector
+ except ModuleNotFoundError:
+ raise Exception(
+ "Attempted to use 'nemo_lm' model type, but package `nemo` is not installed. "
+ "Please install nemo following the instructions in the README: either with a NVIDIA PyTorch or NeMo container, "
+ "or installing nemo following https://github.com/NVIDIA/NeMo.",
+ )
  model_path = pathlib.Path(model_path)
 
  save_restore_connector = NLPSaveRestoreConnector()
@@ -139,6 +138,15 @@ def _synced_build_tokenizer(self):
 
 
 def setup_distributed_environment(trainer):
+ try:
+ from nemo.utils.app_state import AppState
+ except ModuleNotFoundError:
+ raise Exception(
+ "Attempted to use 'nemo_lm' model type, but package `nemo` is not installed. "
+ "Please install nemo following the instructions in the README: either with a NVIDIA PyTorch or NeMo container, "
+ "or installing nemo following https://github.com/NVIDIA/NeMo.",
+ )
+
  def dummy():
  return
 
@@ -178,6 +186,21 @@ def __init__(
  ] = "bf16",
  **kwargs,
  ):
+ try:
+ from nemo.collections.nlp.modules.common.text_generation_utils import (
+ generate,
+ )
+ from nemo.collections.nlp.parts.nlp_overrides import NLPDDPStrategy
+ from pytorch_lightning.trainer.trainer import Trainer
+
+ self.generate = generate
+ except ModuleNotFoundError:
+ raise Exception(
+ "Attempted to use 'nemo_lm' model type, but package `nemo` is not installed. "
+ "Please install nemo following the instructions in the README: either with a NVIDIA PyTorch or NeMo container, "
+ "or installing nemo following https://github.com/NVIDIA/NeMo.",
+ )
+
  super().__init__()
 
  if (
@@ -396,7 +419,7 @@ def _collate(x):
 
  inps.append(self.tok_decode(inp))
 
- output = generate(
+ output = self.generate(
  self.model,
  inputs=inps,
  tokens_to_generate=1,
@@ -490,7 +513,7 @@ def _collate(x):
  encoded_context = encoded_context[-remaining_length:]
  contexts.append(self.tok_decode(encoded_context))
 
- output = generate(
+ output = self.generate(
  self.model,
  inputs=contexts,
  tokens_to_generate=max_gen_toks,