From 679cc9d47c55dc77fc1e0a00cab370de1122eafc Mon Sep 17 00:00:00 2001 From: Zvonko Kaiser Date: Thu, 1 May 2025 15:11:42 +0000 Subject: [PATCH] gpu: Update runtimeClasses for correct podoverhead We cannot rely only on default_cpu and default_memory in the config; the defaults are 1 and 2Gi, but we need some overhead for QEMU and the other related binaries running as the pod overhead. Especially when QEMU is hot-plugging GPUs, CPUs, and memory, it can consume more memory. Signed-off-by: Zvonko Kaiser --- .../kata-deploy/runtimeclasses/kata-qemu-nvidia-gpu-snp.yaml | 4 ++-- .../kata-deploy/runtimeclasses/kata-qemu-nvidia-gpu-tdx.yaml | 4 ++-- .../kata-deploy/runtimeclasses/kata-qemu-nvidia-gpu.yaml | 4 ++-- 3 files changed, 6 insertions(+), 6 deletions(-) diff --git a/tools/packaging/kata-deploy/runtimeclasses/kata-qemu-nvidia-gpu-snp.yaml b/tools/packaging/kata-deploy/runtimeclasses/kata-qemu-nvidia-gpu-snp.yaml index 8558580630..0e22e09bf8 100644 --- a/tools/packaging/kata-deploy/runtimeclasses/kata-qemu-nvidia-gpu-snp.yaml +++ b/tools/packaging/kata-deploy/runtimeclasses/kata-qemu-nvidia-gpu-snp.yaml @@ -6,8 +6,8 @@ metadata: handler: kata-qemu-nvidia-gpu-snp overhead: podFixed: - memory: "2048Mi" - cpu: "1.0" + memory: "4096Mi" + cpu: "1" scheduling: nodeSelector: katacontainers.io/kata-runtime: "true" diff --git a/tools/packaging/kata-deploy/runtimeclasses/kata-qemu-nvidia-gpu-tdx.yaml b/tools/packaging/kata-deploy/runtimeclasses/kata-qemu-nvidia-gpu-tdx.yaml index 272924ca63..237782608d 100644 --- a/tools/packaging/kata-deploy/runtimeclasses/kata-qemu-nvidia-gpu-tdx.yaml +++ b/tools/packaging/kata-deploy/runtimeclasses/kata-qemu-nvidia-gpu-tdx.yaml @@ -6,8 +6,8 @@ metadata: handler: kata-qemu-nvidia-gpu-tdx overhead: podFixed: - memory: "2048Mi" - cpu: "1.0" + memory: "4096Mi" + cpu: "1" scheduling: nodeSelector: katacontainers.io/kata-runtime: "true" diff --git a/tools/packaging/kata-deploy/runtimeclasses/kata-qemu-nvidia-gpu.yaml 
b/tools/packaging/kata-deploy/runtimeclasses/kata-qemu-nvidia-gpu.yaml index f99d3a2808..369d2d82b1 100644 --- a/tools/packaging/kata-deploy/runtimeclasses/kata-qemu-nvidia-gpu.yaml +++ b/tools/packaging/kata-deploy/runtimeclasses/kata-qemu-nvidia-gpu.yaml @@ -6,8 +6,8 @@ metadata: handler: kata-qemu-nvidia-gpu overhead: podFixed: - memory: "160Mi" - cpu: "250m" + memory: "4096Mi" + cpu: "1" scheduling: nodeSelector: katacontainers.io/kata-runtime: "true"