From 60d87b7785400f9f9cb6e2ac9a7c8d6a261073fd Mon Sep 17 00:00:00 2001
From: Zvonko Kaiser
Date: Tue, 19 Aug 2025 16:15:28 +0000
Subject: [PATCH] gpu: Add more debugging to CI/CD

Capture NVRC logs via journalctl

Signed-off-by: Zvonko Kaiser
---
Review notes (this section is ignored by git am):
 * enable_nvrc_trace returns early for runtime classes other than
   kata-qemu-nvidia-gpu instead of calling sed with an empty file name.
 * config_file is now local to the function.
 * The sed expression skips a kernel_params line that already contains
   nvrc.log=trace, so repeated runs do not append it again.
 * Indentation was reconstructed with tabs; if the context does not match
   the tree, apply with "git apply --ignore-whitespace".

 tests/integration/kubernetes/k8s-nvidia-nim.bats | 20 ++++++++++++++++++++
 1 file changed, 20 insertions(+)

diff --git a/tests/integration/kubernetes/k8s-nvidia-nim.bats b/tests/integration/kubernetes/k8s-nvidia-nim.bats
index 9b9021ffa4..8bf450798a 100644
--- a/tests/integration/kubernetes/k8s-nvidia-nim.bats
+++ b/tests/integration/kubernetes/k8s-nvidia-nim.bats
@@ -58,6 +58,23 @@ create_inference_embedqa_pods() {
 	echo "# POD_IP_EMBEDQA=${POD_IP_EMBEDQA}" >&3
 }
 
+# Append nvrc.log=trace to the kernel_params line of the
+# kata-qemu-nvidia-gpu configuration file.
+# Globals: RUNTIME_CLASS_NAME (read)
+# Does nothing for any other runtime class, or when kernel_params already
+# carries nvrc.log=trace.
+enable_nvrc_trace() {
+	local config_file="/opt/kata/share/defaults/kata-containers/configuration-qemu-nvidia-gpu.toml"
+
+	# Other runtime classes have no configuration path defined here, so
+	# leave them untouched rather than running sed without a target file.
+	[[ "${RUNTIME_CLASS_NAME:-}" == "kata-qemu-nvidia-gpu" ]] || return 0
+
+	# The /.../! address skips a line that already contains the parameter,
+	# so repeated runs against the same host do not append it again.
+	sudo sed -i -e '/^kernel_params = ".*nvrc\.log=trace/!s/^kernel_params = "\(.*\)"/kernel_params = "\1 nvrc.log=trace"/g' "${config_file}"
+}
+
 setup_file() {
 	dpkg -s jq >/dev/null 2>&1 || sudo apt -y install jq
 
@@ -82,6 +99,8 @@ setup_file() {
 	export POD_INSTRUCT_YAML="${pod_instruct_yaml}"
 	export POD_EMBEDQA_YAML="${pod_embedqa_yaml}"
 
+	enable_nvrc_trace
+
 	setup_langchain_flow
 	create_inference_embedqa_pods
 }
@@ -324,4 +343,5 @@ EOF
 
 teardown_file() {
 	kubectl delete -f "${POD_INSTRUCT_YAML}"
+	kubectl delete -f "${POD_EMBEDQA_YAML}"
 }