From f2780780903f957c9a59e44bfd70198a732a66c4 Mon Sep 17 00:00:00 2001
From: John St John
Date: Wed, 14 Aug 2024 19:01:14 +0000
Subject: [PATCH] Skip megatron training test on CPU nodes

---
 tests/collections/llm/test_mnist_model_nemo2.py | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/tests/collections/llm/test_mnist_model_nemo2.py b/tests/collections/llm/test_mnist_model_nemo2.py
index 4226c501dc452..96e4aefbf2289 100644
--- a/tests/collections/llm/test_mnist_model_nemo2.py
+++ b/tests/collections/llm/test_mnist_model_nemo2.py
@@ -19,6 +19,7 @@
 from typing import Any, Dict, Iterable, Iterator, List, Optional, Sequence, Tuple, TypedDict, TypeVar, Union

 import megatron.core.num_microbatches_calculator
+import pytest
 import pytorch_lightning as pl
 import torch
 import torch.distributed
@@ -492,6 +493,7 @@ def clean_parallel_state_context() -> Iterator[None]:
         _teardown_apex_megatron_cuda()


+@pytest.mark.skipif(not torch.cuda.is_available(), reason="No GPU available")
 def test_train_mnist_litautoencoder_with_megatron_strategy_single_gpu(tmpdir):
     with clean_parallel_state_context():
         # Configure our custom Checkpointer