diff --git a/nemo/export/trt_llm/nemo/convert.py b/nemo/export/trt_llm/nemo/convert.py index 5ffe7e9e0894..c87d2c7f0e21 100644 --- a/nemo/export/trt_llm/nemo/convert.py +++ b/nemo/export/trt_llm/nemo/convert.py @@ -520,9 +520,5 @@ def save_tranpose(val, key, shared=False): elif "vocab_embedding" in key or "lm_head.weight" in key: save(key, gpu_val) else: - if torch.cuda.current_device() == 0: - import pdb - pdb.set_trace() - torch.distributed.barrier() raise RuntimeError(f"{key} not handled by NeMo->TRTLLM converter!")