diff --git a/.lightning/workflows/tests.yaml b/.lightning/workflows/tests.yaml
index 5014fccf59..7d9f35556c 100644
--- a/.lightning/workflows/tests.yaml
+++ b/.lightning/workflows/tests.yaml
@@ -43,7 +43,9 @@ run: |
   python -c "import torch ; gpus = torch.cuda.device_count() ; assert gpus >= 2, f'GPU: {gpus}'"
   python -c "from torch import __version__ as ver ; assert str(ver).split('+')[0] == '${TORCH_VERSION}', f'PyTorch: installed {ver} but expected ${TORCH_VERSION}'"
 
-  pytest -v --durations=100
+  pytest -v --durations=100 tests/ --ignore=tests/test_serve.py
+  pytest -v --durations=100 tests/test_serve.py
+
 
   wget https://raw.githubusercontent.com/Lightning-AI/utilities/main/scripts/run_standalone_tests.sh
   PL_RUN_STANDALONE_TESTS=1 bash run_standalone_tests.sh "tests"
diff --git a/tests/test_serve.py b/tests/test_serve.py
index dfe99e1839..1abf532468 100644
--- a/tests/test_serve.py
+++ b/tests/test_serve.py
@@ -209,7 +209,9 @@ def run_server():
     try:
         # Test server health
         response = requests.get("http://127.0.0.1:8000/health")
-        assert response.status_code == 200, f"Server health check failed with status code {response.status_code}"
+        assert response.status_code == 200, (
+            f"Server health check failed with status code {response.status_code}: {response.text}"
+        )
         assert response.text == "ok", "Server did not respond as expected."
 
         # Test non-streaming chat completion
@@ -221,7 +223,7 @@ def run_server():
             },
         )
         assert response.status_code == 200, (
-            f"Non-streaming chat completion failed with status code {response.status_code}"
+            f"Non-streaming chat completion failed with status code {response.status_code}: {response.text}"
         )
         response_json = response.json()
         assert "choices" in response_json, "Response JSON does not contain 'choices'."