Add 12.8 CUDA tests

zkoopmans · gvisor-bot · commit 60ec4e7a009d · 2025-04-25T16:16:48.000-07:00
Add 12.8 basic CUDA image and smoke tests. A later submission
will add CUDA tests similar to the current 12.2 tests.

PiperOrigin-RevId: 751593396
diff --git a/Makefile b/Makefile
@@ -291,7 +291,7 @@ simple-tests: unit-tests # Compatibility target.
 .PHONY: simple-tests
 
 # Images needed for GPU smoke tests.
-gpu-smoke-images: load-gpu_cuda-tests
+gpu-smoke-images: load-gpu_cuda-tests load-gpu_cuda-tests-12-8
 .PHONY: gpu-smoke-images
 
 gpu-smoke-tests: gpu-smoke-images $(RUNTIME_BIN)
diff --git a/images/gpu/cuda-tests-12-8/Dockerfile b/images/gpu/cuda-tests-12-8/Dockerfile
@@ -0,0 +1,49 @@
+FROM nvidia/cuda:12.8.1-devel-ubuntu22.04
+
+WORKDIR /
+ENV PATH=$PATH:/usr/local/nvidia/bin
+RUN export DEBIAN_FRONTEND=noninteractive; \
+    apt-get update && \
+    apt-get install -y \
+      build-essential \
+      cmake \
+      freeglut3 freeglut3-dev \
+      git \
+      golang \
+      imagemagick \
+      libegl-dev \
+      libfreeimage3 libfreeimage-dev \
+      libfreeimageplus3 libfreeimageplus-dev \
+      libgles2-mesa-dev \
+      libglfw3 libglfw3-dev \
+      libglu1-mesa libglu1-mesa-dev \
+      libxi-dev \
+      libxmu-dev \
+      llvm \
+      mpich \
+      pkg-config \
+      vim \
+      x11-xserver-utils \
+      xdotool \
+      xvfb \
+      zlib1g zlib1g-dev
+
+RUN git clone  \
+      https://github.com/NVIDIA/cuda-samples.git /cuda-samples && cd /cuda-samples && \
+      git checkout 7b60178984e96bc09d066077d5455df71fee2a9f && cd /
+
+# Swap the distribution's Go packages for the upstream Go 1.24.1 release.
+# apt-get is used instead of apt because apt's command-line interface is not
+# meant for scripts; the glob is quoted so the shell never expands it.
+RUN apt-get install -y wget && apt-get -y purge 'golang*'
+
+# Fetch and unpack Go under /usr/local, then delete the tarball in the same
+# layer so the archive does not remain in the final image.
+RUN wget https://go.dev/dl/go1.24.1.linux-amd64.tar.gz && \
+    tar -C /usr/local -xzf go1.24.1.linux-amd64.tar.gz && \
+    rm go1.24.1.linux-amd64.tar.gz && \
+    ln -s /usr/local/go/bin/go /usr/local/bin/go
+
+ADD *.cu *.h *.sh *.py *.cc /
+
+RUN chmod 555 /*.sh && gcc -o /unsupported_ioctl /unsupported_ioctl.cc
+
+RUN mkdir /cuda-samples/build && cd /cuda-samples/build && \
+      cmake ..
+
+# Override entrypoint to nothing, otherwise all invocations will have
+# a copyright notice printed, which breaks parsing the stdout logs.
+ENTRYPOINT []
diff --git a/images/gpu/cuda-tests-12-8/cuda_malloc.cu b/images/gpu/cuda-tests-12-8/cuda_malloc.cu
@@ -0,0 +1,205 @@
+// Copyright 2023 The gVisor Authors.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#include <cuda_runtime.h>
+#include <err.h>
+#include <errno.h>
+#include <stdlib.h>
+#include <unistd.h>
+
+#include <cstdint>
+#include <iostream>
+#include <random>
+
+#include "cuda_test_util.h"  // NOLINT(build/include)
+
+// Device kernel: each thread derives a flat index from its block index, the
+// block size and its thread index (x dimension only) and adds that index,
+// truncated to 32 bits, to its own element of `data`. There is no bounds
+// check, so the launch must not contain more threads than `data` has
+// elements.
+__global__ void addKernel(std::uint32_t* data) {
+  const size_t tid = blockIdx.x * blockDim.x + threadIdx.x;
+  std::uint32_t& slot = data[tid];
+  slot = slot + static_cast<std::uint32_t>(tid);
+}
+
+// Exercises a cudaMallocManaged allocation end to end: fills it from the
+// host, optionally prefetches it to `device`, lets addKernel update it,
+// optionally prefetches it back to the CPU, and then verifies every element
+// from the host. Aborts the process on a mismatch or on any CUDA error.
+//
+//   device:       device ordinal used as the first prefetch destination.
+//   malloc_flags: flags forwarded unchanged to cudaMallocManaged.
+//   prefetch:     whether to issue cudaMemPrefetchAsync before and after the
+//                 kernel.
+void TestMallocManagedRoundTrip(int device, unsigned int malloc_flags,
+                                bool prefetch) {
+  // One element per launched thread; addKernel performs no bounds check.
+  constexpr size_t kNumBlocks = 32;
+  constexpr size_t kNumThreads = 64;
+  constexpr size_t kNumElems = kNumBlocks * kNumThreads;
+
+  std::uint32_t* data = nullptr;
+  constexpr size_t kNumBytes = kNumElems * sizeof(*data);
+  CHECK_CUDA(cudaMallocManaged(&data, kNumBytes, malloc_flags));
+
+  // Draw a single starting value and store it in every element from the
+  // host. The engine is default-constructed, i.e. not explicitly seeded.
+  std::default_random_engine engine;
+  std::uniform_int_distribution<std::uint32_t> dist;
+  const std::uint32_t base = dist(engine);
+  for (std::uint32_t* p = data; p != data + kNumElems; ++p) {
+    *p = base;
+  }
+
+  if (prefetch) {
+    CHECK_CUDA(cudaMemPrefetchAsync(data, kNumBytes, device));
+  }
+
+  // Run the device-side update and wait for it to complete.
+  addKernel<<<kNumBlocks, kNumThreads>>>(data);
+  CHECK_CUDA(cudaGetLastError());
+  CHECK_CUDA(cudaDeviceSynchronize());
+
+  if (prefetch) {
+    CHECK_CUDA(cudaMemPrefetchAsync(data, kNumBytes, cudaCpuDeviceId));
+  }
+
+  // Every element must now hold the starting value plus its own index.
+  for (size_t idx = 0; idx != kNumElems; ++idx) {
+    const std::uint32_t expected = base + static_cast<std::uint32_t>(idx);
+    if (data[idx] == expected) {
+      continue;
+    }
+    std::cout << "data[" << idx << "]: got " << data[idx] << ", wanted "
+              << expected << " = " << base << " + " << idx << std::endl;
+    abort();
+  }
+
+  CHECK_CUDA(cudaFree(data));
+}
+
+// Checks that the write(2) and read(2) syscalls work directly on
+// cudaMallocManaged memory, interleaved with device-side updates:
+//   1. fill the buffer on the host and write() it to a temporary file;
+//   2. update it with addKernel and verify the result;
+//   3. read() the original contents back into the same buffer and verify;
+//   4. update it with addKernel again and verify once more.
+// Exits via err()/errx() on syscall failures and aborts on data mismatches
+// or CUDA errors.
+//
+//   device: not used by this function; kept so the signature matches the
+//           existing call site.
+void TestMallocManagedReadWrite(int device) {
+  // One element per launched thread; addKernel performs no bounds check.
+  constexpr size_t kNumBlocks = 32;
+  constexpr size_t kNumThreads = 64;
+  constexpr size_t kNumElems = kNumBlocks * kNumThreads;
+
+  std::uint32_t* data = nullptr;
+  constexpr size_t kNumBytes = kNumElems * sizeof(*data);
+  CHECK_CUDA(cudaMallocManaged(&data, kNumBytes, cudaMemAttachGlobal));
+
+  // Initialize all elements in the array with the same value on the host.
+  // The engine is default-constructed, i.e. not explicitly seeded.
+  std::default_random_engine rd;
+  const std::uint32_t init_val =
+      std::uniform_int_distribution<std::uint32_t>()(rd);
+  for (size_t i = 0; i < kNumElems; i++) {
+    data[i] = init_val;
+  }
+
+  // Write the array's contents to a temporary file.
+  char filename[] = "/tmp/cudaMallocManagedTest.XXXXXX";
+  int fd = mkstemp(filename);
+  if (fd < 0) {
+    err(1, "mkstemp");
+  }
+  // Remove the directory entry right away so the file cannot outlive the
+  // test, even if a later check aborts. The open descriptor stays usable.
+  // A failure here only leaves a stray file behind, so it is not fatal.
+  if (unlink(filename) != 0) {
+    warn("unlink");
+  }
+  size_t done = 0;
+  while (done < kNumBytes) {
+    ssize_t n = write(fd, reinterpret_cast<char*>(data) + done,
+                      kNumBytes - done);
+    if (n > 0) {
+      done += n;
+    } else if (n == 0) {
+      // A zero-length write would otherwise make this loop spin forever.
+      errx(1, "write: made no progress after %zu bytes", done);
+    } else if (errno != EINTR) {
+      err(1, "write");
+    }
+  }
+
+  // Mutate the array on the device.
+  addKernel<<<kNumBlocks, kNumThreads>>>(data);
+  CHECK_CUDA(cudaGetLastError());
+  CHECK_CUDA(cudaDeviceSynchronize());
+
+  // Check that the array has the expected result.
+  for (size_t i = 0; i < kNumElems; i++) {
+    std::uint32_t want = init_val + static_cast<std::uint32_t>(i);
+    if (data[i] != want) {
+      std::cout << "data[" << i << "]: got " << data[i] << ", wanted " << want
+                << " = " << init_val << " + " << i << std::endl;
+      abort();
+    }
+  }
+
+  // Read the array's original contents back from the temporary file.
+  if (lseek(fd, 0, SEEK_SET) < 0) {
+    err(1, "lseek");
+  }
+  done = 0;
+  while (done < kNumBytes) {
+    ssize_t n = read(fd, reinterpret_cast<char*>(data) + done,
+                     kNumBytes - done);
+    if (n > 0) {
+      done += n;
+    } else if (n == 0) {
+      errx(1, "read: unexpected EOF after %zu bytes", done);
+    } else if (errno != EINTR) {
+      err(1, "read");
+    }
+  }
+
+  // Check that the array matches what we originally wrote. The wanted value
+  // here is the plain initial value, so the message does not mention an
+  // index offset.
+  for (size_t i = 0; i < kNumElems; i++) {
+    if (data[i] != init_val) {
+      std::cout << "data[" << i << "]: got " << data[i] << ", wanted "
+                << init_val << std::endl;
+      abort();
+    }
+  }
+
+  // Mutate the array on the device again.
+  addKernel<<<kNumBlocks, kNumThreads>>>(data);
+  CHECK_CUDA(cudaGetLastError());
+  CHECK_CUDA(cudaDeviceSynchronize());
+
+  // Check that the array has the expected result again.
+  for (size_t i = 0; i < kNumElems; i++) {
+    std::uint32_t want = init_val + static_cast<std::uint32_t>(i);
+    if (data[i] != want) {
+      std::cout << "data[" << i << "]: got " << data[i] << ", wanted " << want
+                << " = " << init_val << " + " << i << std::endl;
+      abort();
+    }
+  }
+
+  close(fd);
+  CHECK_CUDA(cudaFree(data));
+}
+
+// Entry point. Runs the managed-memory round-trip test without prefetching;
+// then, only if the current device reports
+// cudaDevAttrConcurrentManagedAccess, the prefetching and cudaMemAttachHost
+// variants; and finally the read/write syscall test. Returns 0 when every
+// test completed (failures abort or exit inside the tests).
+int main() {
+  // Prints one progress line and flushes it immediately.
+  const auto announce = [](const char* message) {
+    std::cout << message << std::endl;
+  };
+
+  int device;
+  CHECK_CUDA(cudaGetDevice(&device));
+
+  announce("Testing cudaMallocManaged(flags=cudaMemAttachGlobal)");
+  TestMallocManagedRoundTrip(device, cudaMemAttachGlobal, false);
+
+  int cma = 0;
+  CHECK_CUDA(
+      cudaDeviceGetAttribute(&cma, cudaDevAttrConcurrentManagedAccess, device));
+  if (cma) {
+    announce(
+        "Testing cudaMallocManaged(flags=cudaMemAttachGlobal) "
+        "with prefetching");
+    TestMallocManagedRoundTrip(device, cudaMemAttachGlobal, true);
+
+    announce("Testing cudaMallocManaged(flags=cudaMemAttachHost)");
+    TestMallocManagedRoundTrip(device, cudaMemAttachHost, false);
+
+    announce(
+        "Testing cudaMallocManaged(flags=cudaMemAttachHost) "
+        "with prefetching");
+    TestMallocManagedRoundTrip(device, cudaMemAttachHost, true);
+  } else {
+    announce("cudaDevAttrConcurrentManagedAccess not available");
+  }
+
+  announce("Testing read/write syscalls on cudaMallocManaged memory");
+  TestMallocManagedReadWrite(device);
+
+  announce("All tests passed");
+  return 0;
+}
diff --git a/images/gpu/cuda-tests-12-8/cuda_test_util.h b/images/gpu/cuda-tests-12-8/cuda_test_util.h
@@ -0,0 +1,42 @@
+// Copyright 2023 The gVisor Authors.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#ifndef THIRD_PARTY_GVISOR_IMAGES_GPU_CUDA_TESTS_CUDA_TEST_UTIL_H_
+#define THIRD_PARTY_GVISOR_IMAGES_GPU_CUDA_TESTS_CUDA_TEST_UTIL_H_
+
+#include <iostream>
+
+// CHECK_CUDA(expr) evaluates `expr` exactly once and stores the result as a
+// cudaError_t, the status type returned by CUDA runtime functions. If the
+// result is not cudaSuccess, it prints the source file and line, the text of
+// `expr`, and cudaGetErrorString() for the code to std::cout, then calls
+// abort(). The do/while(0) wrapper makes the macro usable as one statement.
+// NOTE(review): this header includes only <iostream>; it appears to rely on
+// the including file for the CUDA runtime declarations and for abort() --
+// confirm before using it from a new translation unit.
+#define CHECK_CUDA(expr)                                                     \
+  do {                                                                       \
+    cudaError_t code = (expr);                                               \
+    if (code != cudaSuccess) {                                               \
+      std::cout << "Check failed at " << __FILE__ << ":" << __LINE__ << ": " \
+                << #expr << ": " << cudaGetErrorString(code) << std::endl;   \
+      abort();                                                               \
+    }                                                                        \
+  } while (0)
+
+// CHECK_CUDA_RESULT(expr) evaluates `expr` exactly once and stores the
+// result as a CUresult, the status type returned by CUDA driver functions.
+// If the result is not CUDA_SUCCESS, it prints the source file and line, the
+// text of `expr`, and the raw result code (no error-string lookup) to
+// std::cout, then calls abort().
+// NOTE(review): the including file presumably has to provide the CUDA driver
+// API declarations (CUresult, CUDA_SUCCESS) and abort() -- confirm.
+#define CHECK_CUDA_RESULT(expr)                                              \
+  do {                                                                       \
+    CUresult code = (expr);                                                  \
+    if (code != CUDA_SUCCESS) {                                              \
+      std::cout << "Check failed at " << __FILE__ << ":" << __LINE__ << ": " \
+                << #expr << ": " << code << std::endl;                       \
+      abort();                                                               \
+    }                                                                        \
+  } while (0)
+
+#endif  // THIRD_PARTY_GVISOR_IMAGES_GPU_CUDA_TESTS_CUDA_TEST_UTIL_H_
diff --git a/images/gpu/cuda-tests-12-8/run_cuda_test.py b/images/gpu/cuda-tests-12-8/run_cuda_test.py
@@ -0,0 +1,56 @@
+# Copyright 2025 The gVisor Authors.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+import argparse
+import os
+import shlex
+import subprocess
+import sys
+
+ROOT_CMAKE_DIR = '/cuda-samples/build'
+SAMPLES_DIR = ROOT_CMAKE_DIR + '/Samples'
+
+parser = argparse.ArgumentParser()
+
+parser.add_argument(
+    'test',
+    help=(
+        'Test to run. This should be some thing like'
+        ' "0_Introduction/UnifiedMemoryStreams"'
+    ),
+    type=str,
+)
+
+
+def run_test(test_dir: str = ''):
+  make_path = os.path.join(SAMPLES_DIR, test_dir)
+  cmd = shlex.split(f'make -C {make_path}')
+  subprocess.run(
+      args=cmd,
+      check=True,
+      stdout=sys.stdout,
+      stderr=sys.stderr,
+  )
+  test_path = [os.path.join(make_path, os.path.basename(test_dir))]
+  subprocess.run(
+      args=test_path,
+      check=True,
+      stdout=sys.stdout,
+      stderr=sys.stderr,
+  )
+
+
+if __name__ == '__main__':
+  args = parser.parse_args(sys.argv[1:])
+  run_test(test_dir=args.test)
diff --git a/images/gpu/cuda-tests-12-8/run_smoke.sh b/images/gpu/cuda-tests-12-8/run_smoke.sh
@@ -0,0 +1,22 @@
+#!/bin/bash
+
+# Copyright 2021 The gVisor Authors.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+set -euxo pipefail
+
+cd /
+nvcc cuda_malloc.cu -o cuda_malloc -Wno-deprecated-gpu-targets
+./cuda_malloc
+echo 'All tests passed'
diff --git a/images/gpu/cuda-tests-12-8/unsupported_ioctl.cc b/images/gpu/cuda-tests-12-8/unsupported_ioctl.cc
diff --git a/pkg/test/dockerutil/gpu.go b/pkg/test/dockerutil/gpu.go
diff --git a/test/gpu/smoke_test.go b/test/gpu/smoke_test.go