From 5cf83b5a98809c55d0dc7883cc109e154bd50b4b Mon Sep 17 00:00:00 2001 From: Shawn Zeng Date: Tue, 3 Mar 2026 12:15:15 +0800 Subject: [PATCH 1/4] Bug 3570274 and 3570274: Check Unified Memory is supported or not for executing Unified Memory samples --- .../UnifiedMemoryPerf/matrixMultiplyPerf.cu | 12 +++++++++++- 1 file changed, 11 insertions(+), 1 deletion(-) diff --git a/Samples/6_Performance/UnifiedMemoryPerf/matrixMultiplyPerf.cu b/Samples/6_Performance/UnifiedMemoryPerf/matrixMultiplyPerf.cu index 59533cfd..0a2a8149 100644 --- a/Samples/6_Performance/UnifiedMemoryPerf/matrixMultiplyPerf.cu +++ b/Samples/6_Performance/UnifiedMemoryPerf/matrixMultiplyPerf.cu @@ -664,7 +664,17 @@ int main(int argc, char **argv) verboseResults = 1; } - int device_id = findCudaDevice(argc, (const char **)argv); + // set device + cudaDeviceProp device_prop; + int device_id = findCudaDevice(argc, (const char **)argv); + checkCudaErrors(cudaGetDeviceProperties(&device_prop, device_id)); + + if (!device_prop.managedMemory) { + // This sample requires a device that supports Unified Memory + fprintf(stderr, "Unified Memory not supported on this device\n"); + + exit(EXIT_WAIVED); + } matrixMultiplyPerfRunner(reportAsBandwidth, print_launch_transfer_results, print_std_deviation, device_id); From e32d17e67e3a55f8e192edef24d1a6bfa155b2d6 Mon Sep 17 00:00:00 2001 From: Shawn Zeng Date: Tue, 10 Mar 2026 16:05:27 +0800 Subject: [PATCH 2/4] Bug 5952280: Add cuModuleUnload(Module) to release resource for 6 samples --- Samples/0_Introduction/matrixMulDrv/matrixMulDrv.cpp | 1 + .../matrixMulDynlinkJIT/matrixMulDynlinkJIT.cpp | 10 ++++++---- .../simpleTextureDrv/simpleTextureDrv.cpp | 1 + Samples/0_Introduction/vectorAddDrv/vectorAddDrv.cpp | 1 + Samples/0_Introduction/vectorAddMMAP/vectorAddMMAP.cpp | 1 + Samples/3_CUDA_Features/memMapIPCDrv/memMapIpc.cpp | 1 + 6 files changed, 11 insertions(+), 4 deletions(-) diff --git a/Samples/0_Introduction/matrixMulDrv/matrixMulDrv.cpp 
b/Samples/0_Introduction/matrixMulDrv/matrixMulDrv.cpp index 815801b8..add08ebb 100644 --- a/Samples/0_Introduction/matrixMulDrv/matrixMulDrv.cpp +++ b/Samples/0_Introduction/matrixMulDrv/matrixMulDrv.cpp @@ -255,6 +255,7 @@ void runTest(int argc, char **argv) checkCudaErrors(cuMemFree(d_A)); checkCudaErrors(cuMemFree(d_B)); checkCudaErrors(cuMemFree(d_C)); + checkCudaErrors(cuModuleUnload(cuModule)); checkCudaErrors(cuCtxDestroy(cuContext)); } diff --git a/Samples/0_Introduction/matrixMulDynlinkJIT/matrixMulDynlinkJIT.cpp b/Samples/0_Introduction/matrixMulDynlinkJIT/matrixMulDynlinkJIT.cpp index 3260a2ee..34302dfe 100644 --- a/Samples/0_Introduction/matrixMulDynlinkJIT/matrixMulDynlinkJIT.cpp +++ b/Samples/0_Introduction/matrixMulDynlinkJIT/matrixMulDynlinkJIT.cpp @@ -68,6 +68,7 @@ extern "C" void computeGold(float *, const float *, const float *, unsigned int, // Globals //////////////////////////////////////////////////////////////////////////////// CUcontext g_cuContext; +CUmodule g_cuModule; bool noprompt = false; static const char *sSDKsample = "matrixMulDynlinkJIT (CUDA dynamic linking)"; @@ -90,7 +91,6 @@ CUresult initCUDA(int argc, char **argv, CUfunction *pMatrixMul, int *block_size { CUresult status; CUdevice cuDevice; - CUmodule cuModule; CUfunction cuFunction; int major, minor, block_size, devID = 0; char deviceName[256]; @@ -185,10 +185,10 @@ CUresult initCUDA(int argc, char **argv, CUfunction *pMatrixMul, int *block_size #if defined(_WIN64) || defined(__LP64__) status = - cuModuleLoadDataEx(&cuModule, matrixMul_kernel_64_ptxdump, jitNumOptions, jitOptions, (void **)jitOptVals); + cuModuleLoadDataEx(&g_cuModule, matrixMul_kernel_64_ptxdump, jitNumOptions, jitOptions, (void **)jitOptVals); #else status = - cuModuleLoadDataEx(&cuModule, matrixMul_kernel_32_ptxdump, jitNumOptions, jitOptions, (void **)jitOptVals); + cuModuleLoadDataEx(&g_cuModule, matrixMul_kernel_32_ptxdump, jitNumOptions, jitOptions, (void **)jitOptVals); #endif printf("> PTX JIT 
log:\n%s\n", jitLogBuffer); @@ -206,9 +206,10 @@ CUresult initCUDA(int argc, char **argv, CUfunction *pMatrixMul, int *block_size // retrieve CUDA function from the compiled module status = cuModuleGetFunction( - &cuFunction, cuModule, (block_size == 16) ? "matrixMul_bs16_32bit" : "matrixMul_bs32_32bit"); + &cuFunction, g_cuModule, (block_size == 16) ? "matrixMul_bs16_32bit" : "matrixMul_bs32_32bit"); if (CUDA_SUCCESS != status) { + cuModuleUnload(g_cuModule); cuCtxDestroy(g_cuContext); exit(EXIT_FAILURE); } @@ -337,6 +338,7 @@ int main(int argc, char **argv) checkCudaErrors(cuMemFree(d_A)); checkCudaErrors(cuMemFree(d_B)); checkCudaErrors(cuMemFree(d_C)); + checkCudaErrors(cuModuleUnload(g_cuModule)); checkCudaErrors(cuCtxDestroy(g_cuContext)); printf("Test run %s\n", (1 == res) ? "success!" : "failed!"); diff --git a/Samples/0_Introduction/simpleTextureDrv/simpleTextureDrv.cpp b/Samples/0_Introduction/simpleTextureDrv/simpleTextureDrv.cpp index aa6b2627..85c29d8c 100644 --- a/Samples/0_Introduction/simpleTextureDrv/simpleTextureDrv.cpp +++ b/Samples/0_Introduction/simpleTextureDrv/simpleTextureDrv.cpp @@ -297,6 +297,7 @@ void runTest(int argc, char **argv) free(image_path); free(ref_path); + checkCudaErrors(cuModuleUnload(cuModule)); checkCudaErrors(cuCtxDestroy(cuContext)); exit(bTestResults ? 
EXIT_SUCCESS : EXIT_FAILURE); diff --git a/Samples/0_Introduction/vectorAddDrv/vectorAddDrv.cpp b/Samples/0_Introduction/vectorAddDrv/vectorAddDrv.cpp index e6a1a051..9d36f777 100644 --- a/Samples/0_Introduction/vectorAddDrv/vectorAddDrv.cpp +++ b/Samples/0_Introduction/vectorAddDrv/vectorAddDrv.cpp @@ -211,6 +211,7 @@ int CleanupNoFailure() free(h_C); } + checkCudaErrors(cuModuleUnload(cuModule)); checkCudaErrors(cuCtxDestroy(cuContext)); return EXIT_SUCCESS; diff --git a/Samples/0_Introduction/vectorAddMMAP/vectorAddMMAP.cpp b/Samples/0_Introduction/vectorAddMMAP/vectorAddMMAP.cpp index c5c28ff5..5a07ff33 100644 --- a/Samples/0_Introduction/vectorAddMMAP/vectorAddMMAP.cpp +++ b/Samples/0_Introduction/vectorAddMMAP/vectorAddMMAP.cpp @@ -247,6 +247,7 @@ int CleanupNoFailure() free(h_C); } + checkCudaErrors(cuModuleUnload(cuModule)); checkCudaErrors(cuCtxDestroy(cuContext)); return EXIT_SUCCESS; diff --git a/Samples/3_CUDA_Features/memMapIPCDrv/memMapIpc.cpp b/Samples/3_CUDA_Features/memMapIPCDrv/memMapIpc.cpp index 09937acc..d8355f2b 100644 --- a/Samples/3_CUDA_Features/memMapIPCDrv/memMapIpc.cpp +++ b/Samples/3_CUDA_Features/memMapIPCDrv/memMapIpc.cpp @@ -419,6 +419,7 @@ static void childProcess(int devId, int id, char **argv) // Clean up! checkCudaErrors(cuStreamDestroy(stream)); + checkCudaErrors(cuModuleUnload(cuModule)); checkCudaErrors(cuCtxDestroy(ctx)); // Unmap the allocations from our address space. 
Unmapping will also free the From 722c5dd06996aaf9ba456b315c3775cd9effea0e Mon Sep 17 00:00:00 2001 From: Shawn Zeng Date: Wed, 11 Mar 2026 16:22:10 +0800 Subject: [PATCH 3/4] Bug 5970525: Update a minor issue of Samples/0_Introduction/fp16ScalarProduct --- Samples/0_Introduction/fp16ScalarProduct/fp16ScalarProduct.cu | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/Samples/0_Introduction/fp16ScalarProduct/fp16ScalarProduct.cu b/Samples/0_Introduction/fp16ScalarProduct/fp16ScalarProduct.cu index 297095fd..7f1fdb7a 100644 --- a/Samples/0_Introduction/fp16ScalarProduct/fp16ScalarProduct.cu +++ b/Samples/0_Introduction/fp16ScalarProduct/fp16ScalarProduct.cu @@ -94,7 +94,7 @@ scalarProductKernel_intrinsics(half2 const *const a, half2 const *const b, float shArray[threadIdx.x] = __float2half2_rn(0.f); half2 value = __float2half2_rn(0.f); - for (int i = threadIdx.x + blockDim.x + blockIdx.x; i < size; i += stride) { + for (int i = threadIdx.x + blockDim.x * blockIdx.x; i < size; i += stride) { value = __hfma2(a[i], b[i], value); } @@ -118,7 +118,7 @@ scalarProductKernel_native(half2 const *const a, half2 const *const b, float *co half2 value(0.f, 0.f); shArray[threadIdx.x] = value; - for (int i = threadIdx.x + blockDim.x + blockIdx.x; i < size; i += stride) { + for (int i = threadIdx.x + blockDim.x * blockIdx.x; i < size; i += stride) { value = a[i] * b[i] + value; } From f69622b6b69c8d2da834ffd9394770e3e9ba90c2 Mon Sep 17 00:00:00 2001 From: Shawn Zeng Date: Thu, 12 Mar 2026 16:44:47 +0800 Subject: [PATCH 4/4] Bug 5970583: Update the incorrect links of dependencies for Samples --- README.md | 5 +++++ Samples/0_Introduction/UnifiedMemoryStreams/README.md | 2 +- Samples/0_Introduction/fp16ScalarProduct/README.md | 2 +- .../matrixMulDynlinkJIT/matrixMulDynlinkJIT.cpp | 8 ++++---- Samples/0_Introduction/simpleAWBarrier/README.md | 2 +- Samples/0_Introduction/simpleCUDA2GL/README.md | 2 +- Samples/0_Introduction/simpleIPC/README.md | 2 +- 
Samples/0_Introduction/simpleMPI/README.md | 2 +- Samples/0_Introduction/simpleTexture3D/README.md | 2 +- Samples/0_Introduction/systemWideAtomics/README.md | 2 +- .../2_Concepts_and_Techniques/FunctionPointers/README.md | 2 +- Samples/2_Concepts_and_Techniques/boxFilter/README.md | 2 +- .../2_Concepts_and_Techniques/imageDenoising/README.md | 3 +-- Samples/2_Concepts_and_Techniques/particles/README.md | 2 +- Samples/2_Concepts_and_Techniques/reduction/README.md | 2 +- .../reductionMultiBlockCG/README.md | 2 +- Samples/2_Concepts_and_Techniques/shfl_scan/README.md | 2 +- Samples/3_CUDA_Features/bf16TensorCoreGemm/README.md | 2 +- Samples/3_CUDA_Features/bindlessTexture/README.md | 2 +- Samples/3_CUDA_Features/cdpAdvancedQuicksort/README.md | 2 +- Samples/3_CUDA_Features/cdpBezierTessellation/README.md | 2 +- Samples/3_CUDA_Features/cdpQuadtree/README.md | 2 +- Samples/3_CUDA_Features/cdpSimplePrint/README.md | 2 +- Samples/3_CUDA_Features/cdpSimpleQuicksort/README.md | 2 +- Samples/3_CUDA_Features/dmmaTensorCoreGemm/README.md | 2 +- Samples/3_CUDA_Features/globalToShmemAsyncCopy/README.md | 2 +- Samples/3_CUDA_Features/memMapIPCDrv/README.md | 2 +- Samples/3_CUDA_Features/tf32TensorCoreGemm/README.md | 2 +- .../conjugateGradientMultiBlockCG/README.md | 2 +- .../conjugateGradientMultiDeviceCG/README.md | 2 +- Samples/4_CUDA_Libraries/conjugateGradientUM/README.md | 2 +- Samples/4_CUDA_Libraries/oceanFFT/README.md | 2 +- Samples/4_CUDA_Libraries/randomFog/README.md | 2 +- Samples/4_CUDA_Libraries/simpleCUFFT_callback/README.md | 2 +- Samples/5_Domain_Specific/Mandelbrot/README.md | 2 +- Samples/5_Domain_Specific/SobelFilter/README.md | 2 +- Samples/5_Domain_Specific/bicubicTexture/README.md | 2 +- Samples/5_Domain_Specific/bilateralFilter/README.md | 2 +- Samples/5_Domain_Specific/fluidsGL/README.md | 2 +- Samples/5_Domain_Specific/marchingCubes/README.md | 2 +- Samples/5_Domain_Specific/nbody/README.md | 2 +- Samples/5_Domain_Specific/postProcessGL/README.md | 2 +- 
Samples/5_Domain_Specific/recursiveGaussian/README.md | 2 +- Samples/5_Domain_Specific/simpleGL/README.md | 2 +- Samples/5_Domain_Specific/simpleVulkan/README.md | 2 +- Samples/5_Domain_Specific/simpleVulkanMMAP/README.md | 2 +- Samples/5_Domain_Specific/smokeParticles/README.md | 2 +- Samples/5_Domain_Specific/volumeFiltering/README.md | 2 +- Samples/5_Domain_Specific/volumeRender/README.md | 2 +- Samples/5_Domain_Specific/vulkanImageCUDA/README.md | 2 +- Samples/6_Performance/UnifiedMemoryPerf/README.md | 2 +- .../Tegra/EGLSync_CUDAEvent_Interop/README.md | 2 +- Samples/8_Platform_Specific/Tegra/fluidsGLES/README.md | 2 +- .../8_Platform_Specific/Tegra/nbody_opengles/README.md | 2 +- Samples/8_Platform_Specific/Tegra/simpleGLES/README.md | 2 +- .../Tegra/simpleGLES_EGLOutput/README.md | 2 +- 56 files changed, 63 insertions(+), 59 deletions(-) diff --git a/README.md b/README.md index 50602ce7..056e7d5c 100644 --- a/README.md +++ b/README.md @@ -604,6 +604,11 @@ NVJPEG library provides high-performance, GPU accelerated JPEG decoding function NVRTC (CUDA RunTime Compilation) is a runtime compilation library for CUDA C++. +#### NVJITLINK + +NVJITLINK is a CUDA runtime library that links multiple GPU device code objects at runtime and enables just-in-time link-time optimization (JIT LTO). +It can take device code from tools such as NVCC and NVRTC, link and optimize it on the fly, and produce the final GPU binary. For more details, see: https://docs.nvidia.com/cuda/nvjitlink/index.html + #### Stream Priorities Stream Priorities allows the creation of streams with specified priorities. Stream Priorities is only available on GPUs with SM architecture of 3.5 or above. 
diff --git a/Samples/0_Introduction/UnifiedMemoryStreams/README.md b/Samples/0_Introduction/UnifiedMemoryStreams/README.md index 3805cb21..ac22e5c4 100644 --- a/Samples/0_Introduction/UnifiedMemoryStreams/README.md +++ b/Samples/0_Introduction/UnifiedMemoryStreams/README.md @@ -24,7 +24,7 @@ x86_64, armv7l cudaStreamDestroy, cudaFree, cudaMallocManaged, cudaStreamAttachMemAsync, cudaSetDevice, cudaDeviceSynchronize, cudaStreamSynchronize, cudaStreamCreate, cudaGetDeviceProperties ## Dependencies needed to build/run -[OpenMP](../../../README.md#openmp), [UVM](../../../README.md#uvm), [CUBLAS](../../../README.md#cublas) +[OpenMP](../../../README.md#openmp), [UVM](../../../README.md#unified-virtual-memory), [CUBLAS](../../../README.md#cublas) ## Prerequisites diff --git a/Samples/0_Introduction/fp16ScalarProduct/README.md b/Samples/0_Introduction/fp16ScalarProduct/README.md index c86a605b..c2feb10e 100644 --- a/Samples/0_Introduction/fp16ScalarProduct/README.md +++ b/Samples/0_Introduction/fp16ScalarProduct/README.md @@ -26,7 +26,7 @@ x86_64, armv7l cudaMemcpy, cudaFree, cudaMallocHost, cudaFreeHost, cudaMalloc, cudaGetDeviceProperties ## Dependencies needed to build/run -[FP16](../../../README.md#fp16) +[FP16](../../../README.md#16-bit-floating-point) ## Prerequisites diff --git a/Samples/0_Introduction/matrixMulDynlinkJIT/matrixMulDynlinkJIT.cpp b/Samples/0_Introduction/matrixMulDynlinkJIT/matrixMulDynlinkJIT.cpp index 34302dfe..fb555eca 100644 --- a/Samples/0_Introduction/matrixMulDynlinkJIT/matrixMulDynlinkJIT.cpp +++ b/Samples/0_Introduction/matrixMulDynlinkJIT/matrixMulDynlinkJIT.cpp @@ -184,11 +184,11 @@ CUresult initCUDA(int argc, char **argv, CUfunction *pMatrixMul, int *block_size printf("> Compiling CUDA module\n"); #if defined(_WIN64) || defined(__LP64__) - status = - cuModuleLoadDataEx(&g_cuModule, matrixMul_kernel_64_ptxdump, jitNumOptions, jitOptions, (void **)jitOptVals); + status = cuModuleLoadDataEx( + &g_cuModule, matrixMul_kernel_64_ptxdump, 
jitNumOptions, jitOptions, (void **)jitOptVals); #else - status = - cuModuleLoadDataEx(&g_cuModule, matrixMul_kernel_32_ptxdump, jitNumOptions, jitOptions, (void **)jitOptVals); + status = cuModuleLoadDataEx( + &g_cuModule, matrixMul_kernel_32_ptxdump, jitNumOptions, jitOptions, (void **)jitOptVals); #endif printf("> PTX JIT log:\n%s\n", jitLogBuffer); diff --git a/Samples/0_Introduction/simpleAWBarrier/README.md b/Samples/0_Introduction/simpleAWBarrier/README.md index b196c8c6..b479b2d2 100644 --- a/Samples/0_Introduction/simpleAWBarrier/README.md +++ b/Samples/0_Introduction/simpleAWBarrier/README.md @@ -26,7 +26,7 @@ x86_64, armv7l, aarch64 cudaStreamCreateWithFlags, cudaFree, cudaDeviceGetAttribute, cudaMallocHost, cudaFreeHost, cudaStreamSynchronize, cudaLaunchCooperativeKernel, cudaMalloc, cudaOccupancyMaxActiveBlocksPerMultiprocessor, cudaMemcpyAsync, cudaOccupancyMaxPotentialBlockSize ## Dependencies needed to build/run -[CPP11](../../../README.md#cpp11), [MBCG](../../../README.md#mbcg) +[C++11 CUDA](../../../README.md#c11-cuda), [MBCG](../../../README.md#multi-block-cooperative-groups) ## Prerequisites diff --git a/Samples/0_Introduction/simpleCUDA2GL/README.md b/Samples/0_Introduction/simpleCUDA2GL/README.md index 45b68b70..cc6e807f 100644 --- a/Samples/0_Introduction/simpleCUDA2GL/README.md +++ b/Samples/0_Introduction/simpleCUDA2GL/README.md @@ -26,7 +26,7 @@ x86_64 cudaHostAlloc, cudaGraphicsUnmapResources, cudaMalloc, cudaFree, cudaGraphicsResourceGetMappedPointer, cudaGraphicsMapResources, cudaMemcpyToArray, cudaDeviceSynchronize, cudaProcess, cudaGraphicsUnregisterResource, cudaGraphicsSubResourceGetMappedArray, cudaGraphicsGLRegisterBuffer, cudaGraphicsGLRegisterImage ## Dependencies needed to build/run -[X11](../../../README.md#x11), [GL](../../../README.md#gl) +[X11](../../../README.md#x11), [OpenGL](../../../README.md#opengl), [Freeglut](../../../README.md#freeglut), [GLEW](../../../README.md#glew) ## Prerequisites diff --git 
a/Samples/0_Introduction/simpleIPC/README.md b/Samples/0_Introduction/simpleIPC/README.md index 09c8f49b..4e4c647e 100644 --- a/Samples/0_Introduction/simpleIPC/README.md +++ b/Samples/0_Introduction/simpleIPC/README.md @@ -26,7 +26,7 @@ x86_64, ppc64le cudaSetDevice, cudaIpcCloseMemHandle, cudaEventDestroy, cudaGetDeviceCount, cudaMemcpyAsync, cudaDeviceCanAccessPeer, cudaStreamCreateWithFlags, cudaStreamDestroy, cudaGetLastError, cudaIpcOpenEventHandle, cudaIpcOpenMemHandle, cudaIpcGetEventHandle, cudaStreamWaitEvent, cudaEventCreate, cudaFree, cudaEventSynchronize, cudaEventRecord, cudaIpcGetMemHandle, cudaStreamSynchronize, cudaDeviceEnablePeerAccess, cudaMalloc, cudaOccupancyMaxActiveBlocksPerMultiprocessor, cudaGetDeviceProperties ## Dependencies needed to build/run -[IPC](../../../README.md#ipc) +[IPC](../../../README.md#cuda-interprocess-communication) ## Prerequisites diff --git a/Samples/0_Introduction/simpleMPI/README.md b/Samples/0_Introduction/simpleMPI/README.md index 55897069..ae1d08b9 100644 --- a/Samples/0_Introduction/simpleMPI/README.md +++ b/Samples/0_Introduction/simpleMPI/README.md @@ -26,7 +26,7 @@ x86_64, aarch64 cudaMalloc, cudaGetLastError, cudaMemcpy, cudaFree ## Dependencies needed to build/run -[MPI](../../../README.md#mpi) +[MPI](../../../README.md#message-passing-interface) ## Prerequisites diff --git a/Samples/0_Introduction/simpleTexture3D/README.md b/Samples/0_Introduction/simpleTexture3D/README.md index 80848544..60b0ce78 100644 --- a/Samples/0_Introduction/simpleTexture3D/README.md +++ b/Samples/0_Introduction/simpleTexture3D/README.md @@ -26,7 +26,7 @@ x86_64, armv7l cudaGraphicsUnmapResources, cudaMemcpy, cudaFreeArray, cudaFree, cudaPitchedPtr, cudaGraphicsResourceGetMappedPointer, cudaGraphicsMapResources, cudaDestroyTextureObject, cudaExtent, cudaDeviceSynchronize, cudaCreateTextureObject, cudaGraphicsUnregisterResource, cudaMalloc, cudaGraphicsGLRegisterBuffer ## Dependencies needed to build/run 
-[X11](../../../README.md#x11), [GL](../../../README.md#gl) +[X11](../../../README.md#x11), [OpenGL](../../../README.md#opengl), [Freeglut](../../../README.md#freeglut), [GLEW](../../../README.md#glew) ## Prerequisites diff --git a/Samples/0_Introduction/systemWideAtomics/README.md b/Samples/0_Introduction/systemWideAtomics/README.md index 66609bb3..7a1ca4c6 100644 --- a/Samples/0_Introduction/systemWideAtomics/README.md +++ b/Samples/0_Introduction/systemWideAtomics/README.md @@ -26,7 +26,7 @@ x86_64, ppc64le cudaDeviceSynchronize, cudaMallocManaged, cudaGetDeviceProperties, cudaFree ## Dependencies needed to build/run -[UVM](../../../README.md#uvm) +[UVM](../../../README.md#unified-virtual-memory) ## Prerequisites diff --git a/Samples/2_Concepts_and_Techniques/FunctionPointers/README.md b/Samples/2_Concepts_and_Techniques/FunctionPointers/README.md index f7d0cb71..57ef1296 100644 --- a/Samples/2_Concepts_and_Techniques/FunctionPointers/README.md +++ b/Samples/2_Concepts_and_Techniques/FunctionPointers/README.md @@ -26,7 +26,7 @@ x86_64, armv7l cudaGraphicsUnmapResources, cudaMemcpy, cudaMallocArray, cudaFreeArray, cudaFree, cudaMemcpyFromSymbol, cudaGraphicsResourceGetMappedPointer, cudaGraphicsMapResources, cudaDestroyTextureObject, cudaDeviceSynchronize, cudaCreateTextureObject, cudaMemcpyToSymbol, cudaGraphicsUnregisterResource, cudaMalloc, cudaGraphicsGLRegisterBuffer ## Dependencies needed to build/run -[X11](../../../README.md#x11), [GL](../../../README.md#gl) +[X11](../../../README.md#x11), [OpenGL](../../../README.md#opengl), [Freeglut](../../../README.md#freeglut), [GLEW](../../../README.md#glew) ## Prerequisites diff --git a/Samples/2_Concepts_and_Techniques/boxFilter/README.md b/Samples/2_Concepts_and_Techniques/boxFilter/README.md index 6e9c0a76..528e1b60 100644 --- a/Samples/2_Concepts_and_Techniques/boxFilter/README.md +++ b/Samples/2_Concepts_and_Techniques/boxFilter/README.md @@ -26,7 +26,7 @@ x86_64, armv7l cudaGraphicsUnmapResources, 
cudaCreateChannelDesc, cudaMallocArray, cudaFreeArray, cudaFree, cudaGetErrorString, cudaMemcpy, cudaGraphicsResourceGetMappedPointer, cudaGraphicsMapResources, cudaDestroyTextureObject, cudaDeviceSynchronize, cudaCreateTextureObject, cudaGraphicsUnregisterResource, cudaMalloc, cudaGraphicsGLRegisterBuffer ## Dependencies needed to build/run -[X11](../../../README.md#x11), [GL](../../../README.md#gl) +[X11](../../../README.md#x11), [OpenGL](../../../README.md#opengl), [Freeglut](../../../README.md#freeglut), [GLEW](../../../README.md#glew) ## Prerequisites diff --git a/Samples/2_Concepts_and_Techniques/imageDenoising/README.md b/Samples/2_Concepts_and_Techniques/imageDenoising/README.md index 3824c8cc..d66d6e77 100644 --- a/Samples/2_Concepts_and_Techniques/imageDenoising/README.md +++ b/Samples/2_Concepts_and_Techniques/imageDenoising/README.md @@ -26,8 +26,7 @@ x86_64, armv7l cudaGraphicsUnmapResources, cudaMemcpy, cudaMallocArray, cudaFreeArray, cudaFree, cudaGraphicsResourceGetMappedPointer, cudaGraphicsMapResources, cudaDeviceSynchronize, cudaCreateTextureObject, cudaGLRegisterBufferObject, cudaGraphicsUnregisterResource, cudaMalloc, cudaGraphicsGLRegisterBuffer ## Dependencies needed to build/run -[X11](../../../README.md#x11), [GL](../../../README.md#gl) - +[X11](../../../README.md#x11), [OpenGL](../../../README.md#opengl), [Freeglut](../../../README.md#freeglut), [GLEW](../../../README.md#glew) ## Prerequisites Download and install the [CUDA Toolkit](https://developer.nvidia.com/cuda-downloads) for your corresponding platform. 
diff --git a/Samples/2_Concepts_and_Techniques/particles/README.md b/Samples/2_Concepts_and_Techniques/particles/README.md index 279de7d1..9e48fbb1 100644 --- a/Samples/2_Concepts_and_Techniques/particles/README.md +++ b/Samples/2_Concepts_and_Techniques/particles/README.md @@ -26,7 +26,7 @@ x86_64, armv7l cudaGraphicsUnmapResources, cudaMemcpy, cudaFree, cudaGraphicsResourceGetMappedPointer, cudaGraphicsMapResources, cudaDeviceSynchronize, cudaMemset, cudaMemcpyToSymbol, cudaGraphicsGLRegisterBuffer, cudaGraphicsUnregisterResource, cudaMalloc, cudaInit, cudaGLInit ## Dependencies needed to build/run -[X11](../../../README.md#x11), [GL](../../../README.md#gl) +[X11](../../../README.md#x11), [OpenGL](../../../README.md#opengl), [Freeglut](../../../README.md#freeglut), [GLEW](../../../README.md#glew) ## Prerequisites diff --git a/Samples/2_Concepts_and_Techniques/reduction/README.md b/Samples/2_Concepts_and_Techniques/reduction/README.md index b89a1f38..48e74c21 100644 --- a/Samples/2_Concepts_and_Techniques/reduction/README.md +++ b/Samples/2_Concepts_and_Techniques/reduction/README.md @@ -26,7 +26,7 @@ x86_64, armv7l cudaMemcpy, cudaFree, cudaSetDevice, cudaDeviceSynchronize, cudaGetDevice, cudaMalloc, cudaGetDeviceProperties ## Dependencies needed to build/run -[CPP11](../../../README.md#cpp11) +[C++11 CUDA](../../../README.md#c11-cuda) ## Prerequisites diff --git a/Samples/2_Concepts_and_Techniques/reductionMultiBlockCG/README.md b/Samples/2_Concepts_and_Techniques/reductionMultiBlockCG/README.md index f4bbf8ff..978200d7 100644 --- a/Samples/2_Concepts_and_Techniques/reductionMultiBlockCG/README.md +++ b/Samples/2_Concepts_and_Techniques/reductionMultiBlockCG/README.md @@ -26,7 +26,7 @@ x86_64, aarch64 cudaMemcpy, cudaFree, cudaSetDevice, cudaDeviceSynchronize, cudaLaunchCooperativeKernel, cudaMalloc, cudaOccupancyMaxActiveBlocksPerMultiprocessor, cudaGetDeviceProperties, cudaOccupancyMaxPotentialBlockSize ## Dependencies needed to build/run 
-[MBCG](../../../README.md#mbcg), [CPP11](../../../README.md#cpp11) +[MBCG](../../../README.md#multi-block-cooperative-groups), [C++11 CUDA](../../../README.md#c11-cuda) ## Prerequisites diff --git a/Samples/2_Concepts_and_Techniques/shfl_scan/README.md b/Samples/2_Concepts_and_Techniques/shfl_scan/README.md index a685b67e..586962c6 100644 --- a/Samples/2_Concepts_and_Techniques/shfl_scan/README.md +++ b/Samples/2_Concepts_and_Techniques/shfl_scan/README.md @@ -24,7 +24,7 @@ x86_64, armv7l, aarch64 cudaMemcpy, cudaFree, cudaMallocHost, cudaEventSynchronize, cudaEventRecord, cudaFreeHost, cudaGetDevice, cudaMemset, cudaMalloc, cudaEventElapsedTime, cudaGetDeviceProperties, cudaEventCreate ## Dependencies needed to build/run -[CPP11](../../../README.md#cpp11) +[C++11 CUDA](../../../README.md#c11-cuda) ## Prerequisites diff --git a/Samples/3_CUDA_Features/bf16TensorCoreGemm/README.md b/Samples/3_CUDA_Features/bf16TensorCoreGemm/README.md index a0c7cc36..bc36fa91 100644 --- a/Samples/3_CUDA_Features/bf16TensorCoreGemm/README.md +++ b/Samples/3_CUDA_Features/bf16TensorCoreGemm/README.md @@ -26,7 +26,7 @@ x86_64, aarch64 cudaMemcpy, cudaFree, cudaGetErrorString, cudaGetLastError, cudaEventSynchronize, cudaFuncSetAttribute, cudaEventRecord, cudaMemset, cudaMalloc, cudaEventElapsedTime, cudaGetDeviceProperties, cudaEventCreate ## Dependencies needed to build/run -[CPP11](../../../README.md#cpp11) +[C++11 CUDA](../../../README.md#c11-cuda) ## Prerequisites diff --git a/Samples/3_CUDA_Features/bindlessTexture/README.md b/Samples/3_CUDA_Features/bindlessTexture/README.md index d9fff21b..386f3eca 100644 --- a/Samples/3_CUDA_Features/bindlessTexture/README.md +++ b/Samples/3_CUDA_Features/bindlessTexture/README.md @@ -24,7 +24,7 @@ x86_64, armv7l cudaMemcpy, cudaGetMipmappedArrayLevel, cudaGraphicsMapResources, cudaDestroySurfaceObject, cudaExtent, cudaDeviceSynchronize, cudaCreateSurfaceObject, cudaMallocMipmappedArray, cudaPitchedPtr, cudaGraphicsResourceGetMappedPointer, 
cudaCreateTextureObject, cudaGraphicsUnmapResources, cudaMallocArray, cudaFreeArray, cudaArrayGetInfo, cudaGetLastError, cudaDestroyTextureObject, cudaGraphicsGLRegisterBuffer, cudaFreeMipmappedArray, cudaFree, cudaGraphicsUnregisterResource, cudaMalloc ## Dependencies needed to build/run -[X11](../../../README.md#x11), [GL](../../../README.md#gl) +[X11](../../../README.md#x11), [OpenGL](../../../README.md#opengl), [Freeglut](../../../README.md#freeglut), [GLEW](../../../README.md#glew) ## Prerequisites diff --git a/Samples/3_CUDA_Features/cdpAdvancedQuicksort/README.md b/Samples/3_CUDA_Features/cdpAdvancedQuicksort/README.md index 5486a3bb..5e717c70 100644 --- a/Samples/3_CUDA_Features/cdpAdvancedQuicksort/README.md +++ b/Samples/3_CUDA_Features/cdpAdvancedQuicksort/README.md @@ -24,7 +24,7 @@ x86_64, armv7l cudaStreamCreateWithFlags, cudaMemcpy, cudaMemcpyAsync, cudaFree, cudaGetErrorString, cudaGetLastError, cudaPeekAtLastError, cudaDeviceSynchronize, cudaEventRecord, cudaMemset, cudaMalloc, cudaEventElapsedTime, cudaGetDeviceProperties, cudaEventCreate ## Dependencies needed to build/run -[CDP](../../../README.md#cdp) +[CDP](../../../README.md#cuda-dynamic-parallellism) ## Prerequisites diff --git a/Samples/3_CUDA_Features/cdpBezierTessellation/README.md b/Samples/3_CUDA_Features/cdpBezierTessellation/README.md index 4924a839..1b6643b9 100644 --- a/Samples/3_CUDA_Features/cdpBezierTessellation/README.md +++ b/Samples/3_CUDA_Features/cdpBezierTessellation/README.md @@ -24,7 +24,7 @@ x86_64, armv7l cudaMemcpy, cudaFree, cudaGetDeviceCount, cudaMalloc, cudaGetDeviceProperties ## Dependencies needed to build/run -[CDP](../../../README.md#cdp) +[CDP](../../../README.md#cuda-dynamic-parallellism) ## Prerequisites diff --git a/Samples/3_CUDA_Features/cdpQuadtree/README.md b/Samples/3_CUDA_Features/cdpQuadtree/README.md index 13df2faa..624340f4 100644 --- a/Samples/3_CUDA_Features/cdpQuadtree/README.md +++ b/Samples/3_CUDA_Features/cdpQuadtree/README.md @@ -24,7 +24,7 
@@ x86_64, armv7l cudaMemcpy, cudaFree, cudaGetLastError, cudaDeviceSetLimit, cudaMalloc, cudaGetDeviceProperties ## Dependencies needed to build/run -[CDP](../../../README.md#cdp) +[CDP](../../../README.md#cuda-dynamic-parallellism) ## Prerequisites diff --git a/Samples/3_CUDA_Features/cdpSimplePrint/README.md b/Samples/3_CUDA_Features/cdpSimplePrint/README.md index 623dd2ac..20fe63fe 100644 --- a/Samples/3_CUDA_Features/cdpSimplePrint/README.md +++ b/Samples/3_CUDA_Features/cdpSimplePrint/README.md @@ -24,7 +24,7 @@ x86_64, armv7l cudaDeviceSynchronize, cudaGetLastError, cudaGetDeviceProperties, cudaDeviceSetLimit ## Dependencies needed to build/run -[CDP](../../../README.md#cdp) +[CDP](../../../README.md#cuda-dynamic-parallellism) ## Prerequisites diff --git a/Samples/3_CUDA_Features/cdpSimpleQuicksort/README.md b/Samples/3_CUDA_Features/cdpSimpleQuicksort/README.md index e5ddf02b..950ca0e5 100644 --- a/Samples/3_CUDA_Features/cdpSimpleQuicksort/README.md +++ b/Samples/3_CUDA_Features/cdpSimpleQuicksort/README.md @@ -24,7 +24,7 @@ x86_64, armv7l cudaStreamCreateWithFlags, cudaMemcpy, cudaStreamDestroy, cudaFree, cudaDeviceSynchronize, cudaDeviceSetLimit, cudaMalloc, cudaGetDeviceProperties ## Dependencies needed to build/run -[CDP](../../../README.md#cdp) +[CDP](../../../README.md#cuda-dynamic-parallellism) ## Prerequisites diff --git a/Samples/3_CUDA_Features/dmmaTensorCoreGemm/README.md b/Samples/3_CUDA_Features/dmmaTensorCoreGemm/README.md index e9498e5d..536cf265 100644 --- a/Samples/3_CUDA_Features/dmmaTensorCoreGemm/README.md +++ b/Samples/3_CUDA_Features/dmmaTensorCoreGemm/README.md @@ -26,7 +26,7 @@ x86_64, aarch64 cudaMemcpy, cudaFree, cudaGetErrorString, cudaGetLastError, cudaEventSynchronize, cudaFuncSetAttribute, cudaEventRecord, cudaMemset, cudaMalloc, cudaEventElapsedTime, cudaGetDeviceProperties, cudaEventCreate ## Dependencies needed to build/run -[CPP11](../../../README.md#cpp11) +[C++11 CUDA](../../../README.md#c11-cuda) ## Prerequisites diff 
--git a/Samples/3_CUDA_Features/globalToShmemAsyncCopy/README.md b/Samples/3_CUDA_Features/globalToShmemAsyncCopy/README.md index 46c198b3..43b79358 100644 --- a/Samples/3_CUDA_Features/globalToShmemAsyncCopy/README.md +++ b/Samples/3_CUDA_Features/globalToShmemAsyncCopy/README.md @@ -26,7 +26,7 @@ x86_64, armv7l, aarch64 cudaStreamCreateWithFlags, cudaMalloc, cudaDeviceGetAttribute, cudaFree, cudaMallocHost, cudaEventSynchronize, cudaEventRecord, cudaFreeHost, cudaStreamSynchronize, cudaEventDestroy, cudaEventElapsedTime, cudaMemsetAsync, cudaMemcpyAsync, cudaEventCreate ## Dependencies needed to build/run -[CPP11](../../../README.md#cpp11) +[C++11 CUDA](../../../README.md#c11-cuda) ## Prerequisites diff --git a/Samples/3_CUDA_Features/memMapIPCDrv/README.md b/Samples/3_CUDA_Features/memMapIPCDrv/README.md index ae717fec..ba2ba26a 100644 --- a/Samples/3_CUDA_Features/memMapIPCDrv/README.md +++ b/Samples/3_CUDA_Features/memMapIPCDrv/README.md @@ -26,7 +26,7 @@ x86_64, armv7l, aarch64 cuDeviceCanAccessPeer, cuMemImportFromShareableHandle, cuModuleLoadDataEx, cuModuleGetFunction, cuMemSetAccess, cuModuleLoad, cuStreamCreate, cuMemRelease, cuInit, cuLaunchKernel, cuMemcpyDtoHAsync, cuMemCreate, cuDeviceGet, cuCtxDestroy, cuDeviceGetCount, cuMemMap, cuMemExportToShareableHandle, cuStreamSynchronize, cuCtxEnablePeerAccess, cuDeviceGetAttribute, cuOccupancyMaxActiveBlocksPerMultiprocessor, cuCtxSetCurrent, cuMemGetAllocationGranularity, cuMemAddressFree, cuMemUnmap, cuCtxCreate, cuStreamDestroy, cuMemAddressReserve ## Dependencies needed to build/run -[IPC](../../../README.md#ipc) +[IPC](../../../README.md#cuda-interprocess-communication) ## Prerequisites diff --git a/Samples/3_CUDA_Features/tf32TensorCoreGemm/README.md b/Samples/3_CUDA_Features/tf32TensorCoreGemm/README.md index 7c75298b..2cd78da8 100644 --- a/Samples/3_CUDA_Features/tf32TensorCoreGemm/README.md +++ b/Samples/3_CUDA_Features/tf32TensorCoreGemm/README.md @@ -26,7 +26,7 @@ x86_64, aarch64 cudaMemcpy, 
cudaFree, cudaGetErrorString, cudaGetLastError, cudaEventSynchronize, cudaFuncSetAttribute, cudaEventRecord, cudaMemset, cudaMalloc, cudaEventElapsedTime, cudaGetDeviceProperties, cudaEventCreate ## Dependencies needed to build/run -[CPP11](../../../README.md#cpp11) +[C++11 CUDA](../../../README.md#c11-cuda) ## Prerequisites diff --git a/Samples/4_CUDA_Libraries/conjugateGradientMultiBlockCG/README.md b/Samples/4_CUDA_Libraries/conjugateGradientMultiBlockCG/README.md index 0d18d5b5..b23dc941 100644 --- a/Samples/4_CUDA_Libraries/conjugateGradientMultiBlockCG/README.md +++ b/Samples/4_CUDA_Libraries/conjugateGradientMultiBlockCG/README.md @@ -26,7 +26,7 @@ x86_64, aarch64 cudaFree, cudaMallocManaged, cudaDeviceSynchronize, cudaEventRecord, cudaLaunchCooperativeKernel, cudaEventDestroy, cudaEventElapsedTime, cudaOccupancyMaxActiveBlocksPerMultiprocessor, cudaGetDeviceProperties, cudaEventCreate ## Dependencies needed to build/run -[UVM](../../../README.md#uvm), [MBCG](../../../README.md#mbcg) +[UVM](../../../README.md#unified-virtual-memory), [MBCG](../../../README.md#multi-block-cooperative-groups) ## Prerequisites diff --git a/Samples/4_CUDA_Libraries/conjugateGradientMultiDeviceCG/README.md b/Samples/4_CUDA_Libraries/conjugateGradientMultiDeviceCG/README.md index f219d7a6..3f9f0794 100644 --- a/Samples/4_CUDA_Libraries/conjugateGradientMultiDeviceCG/README.md +++ b/Samples/4_CUDA_Libraries/conjugateGradientMultiDeviceCG/README.md @@ -26,7 +26,7 @@ x86_64, aarch64 cudaHostAlloc, cudaMemPrefetchAsync, cudaFree, cudaLaunchCooperativeKernel, cudaMallocManaged, cudaSetDevice, cudaGetDeviceCount, cudaGetDeviceProperties, cudaFreeHost, cudaMemset, cudaStreamCreate, cudaStreamSynchronize, cudaDeviceEnablePeerAccess, cudaMemAdvise, cudaOccupancyMaxActiveBlocksPerMultiprocessor, cudaDeviceCanAccessPeer ## Dependencies needed to build/run -[UVM](../../../README.md#uvm), [MDCG](../../../README.md#mdcg), [CPP11](../../../README.md#cpp11) 
+[UVM](../../../README.md#unified-virtual-memory), [MDCG](../../../README.md#multi-device-cooperative-groups), [C++11 CUDA](../../../README.md#c11-cuda) ## Prerequisites diff --git a/Samples/4_CUDA_Libraries/conjugateGradientUM/README.md b/Samples/4_CUDA_Libraries/conjugateGradientUM/README.md index 4d3ca843..36038190 100644 --- a/Samples/4_CUDA_Libraries/conjugateGradientUM/README.md +++ b/Samples/4_CUDA_Libraries/conjugateGradientUM/README.md @@ -24,7 +24,7 @@ x86_64, armv7l cudaFree, cudaMallocManaged, cudaDeviceSynchronize, cudaMalloc, cudaGetDeviceProperties ## Dependencies needed to build/run -[UVM](../../../README.md#uvm), [CUBLAS](../../../README.md#cublas), [CUSPARSE](../../../README.md#cusparse) +[UVM](../../../README.md#unified-virtual-memory), [CUBLAS](../../../README.md#cublas), [CUSPARSE](../../../README.md#cusparse) ## Prerequisites diff --git a/Samples/4_CUDA_Libraries/oceanFFT/README.md b/Samples/4_CUDA_Libraries/oceanFFT/README.md index adf634b7..0df0f36c 100644 --- a/Samples/4_CUDA_Libraries/oceanFFT/README.md +++ b/Samples/4_CUDA_Libraries/oceanFFT/README.md @@ -26,7 +26,7 @@ x86_64, armv7l cudaGraphicsUnmapResources, cudaMemcpy, cudaMalloc, cudaFree, cudaGraphicsResourceGetMappedPointer, cudaCalculateSlopeKernel, cudaGraphicsMapResources, cudaUpdateHeightmapKernel, cudaGraphicsUnregisterResource, cudaGenerateSpectrumKernel, cudaGraphicsGLRegisterBuffer, cudaGetDeviceProperties ## Dependencies needed to build/run -[X11](../../../README.md#x11), [GL](../../../README.md#gl), [CUFFT](../../../README.md#cufft) +[X11](../../../README.md#x11), [OpenGL](../../../README.md#opengl), [Freeglut](../../../README.md#freeglut), [GLEW](../../../README.md#glew), [CUFFT](../../../README.md#cufft) ## Prerequisites diff --git a/Samples/4_CUDA_Libraries/randomFog/README.md b/Samples/4_CUDA_Libraries/randomFog/README.md index 895f6c44..fda52268 100644 --- a/Samples/4_CUDA_Libraries/randomFog/README.md +++ b/Samples/4_CUDA_Libraries/randomFog/README.md @@ -26,7 +26,7 
@@ x86_64, armv7l cudaMalloc, cudaGetErrorString, cudaMemcpy, cudaFree ## Dependencies needed to build/run -[X11](../../../README.md#x11), [GL](../../../README.md#gl), [CURAND](../../../README.md#curand) +[X11](../../../README.md#x11), [OpenGL](../../../README.md#opengl), [Freeglut](../../../README.md#freeglut), [GLEW](../../../README.md#glew), [CURAND](../../../README.md#curand) ## Prerequisites diff --git a/Samples/4_CUDA_Libraries/simpleCUFFT_callback/README.md b/Samples/4_CUDA_Libraries/simpleCUFFT_callback/README.md index faf20779..0ac3eafc 100644 --- a/Samples/4_CUDA_Libraries/simpleCUFFT_callback/README.md +++ b/Samples/4_CUDA_Libraries/simpleCUFFT_callback/README.md @@ -26,7 +26,7 @@ x86_64, aarch64 cudaMemcpy, cudaFree, cudaMemcpyFromSymbol, cudaGetDevice, cudaMalloc, cudaGetDeviceProperties ## Dependencies needed to build/run -[callback](../../../README.md#callback), [CUFFT](../../../README.md#cufft) +[CUFFT Callback Routines](../../../README.md#cufft-callback-routines), [CUFFT](../../../README.md#cufft) ## Prerequisites diff --git a/Samples/5_Domain_Specific/Mandelbrot/README.md b/Samples/5_Domain_Specific/Mandelbrot/README.md index d3bf1cf0..82f79d3d 100644 --- a/Samples/5_Domain_Specific/Mandelbrot/README.md +++ b/Samples/5_Domain_Specific/Mandelbrot/README.md @@ -26,7 +26,7 @@ x86_64, armv7l cudaGLUnmapBufferObject, cudaGraphicsUnmapResources, cudaMemcpy, cudaFree, cudaGLMapBufferObject, cudaGraphicsResourceGetMappedPointer, cudaGraphicsMapResources, cudaGLUnregisterBufferObject, cudaDeviceSynchronize, cudaGLRegisterBufferObject, cudaGraphicsUnregisterResource, cudaMalloc, cudaGraphicsGLRegisterBuffer, cudaGetDeviceProperties ## Dependencies needed to build/run -[X11](../../../README.md#x11), [GL](../../../README.md#gl) +[X11](../../../README.md#x11), [OpenGL](../../../README.md#opengl), [Freeglut](../../../README.md#freeglut), [GLEW](../../../README.md#glew) ## Prerequisites diff --git a/Samples/5_Domain_Specific/SobelFilter/README.md 
b/Samples/5_Domain_Specific/SobelFilter/README.md index 3693a773..9fd1cf16 100644 --- a/Samples/5_Domain_Specific/SobelFilter/README.md +++ b/Samples/5_Domain_Specific/SobelFilter/README.md @@ -26,7 +26,7 @@ x86_64, armv7l cudaGraphicsUnmapResources, cudaMemcpy, cudaMallocArray, cudaFreeArray, cudaFree, cudaGetErrorString, cudaGraphicsResourceGetMappedPointer, cudaGraphicsMapResources, cudaDestroyTextureObject, cudaDeviceSynchronize, cudaCreateTextureObject, cudaGraphicsUnregisterResource, cudaMalloc, cudaGraphicsGLRegisterBuffer ## Dependencies needed to build/run -[X11](../../../README.md#x11), [GL](../../../README.md#gl) +[X11](../../../README.md#x11), [OpenGL](../../../README.md#opengl), [Freeglut](../../../README.md#freeglut), [GLEW](../../../README.md#glew) ## Prerequisites diff --git a/Samples/5_Domain_Specific/bicubicTexture/README.md b/Samples/5_Domain_Specific/bicubicTexture/README.md index 21c45a38..2294da0a 100644 --- a/Samples/5_Domain_Specific/bicubicTexture/README.md +++ b/Samples/5_Domain_Specific/bicubicTexture/README.md @@ -26,7 +26,7 @@ x86_64, armv7l cudaGraphicsUnmapResources, cudaCreateChannelDesc, cudaMallocArray, cudaFreeArray, cudaFree, cudaMemcpy, cudaGraphicsResourceGetMappedPointer, cudaGraphicsMapResources, cudaDestroyTextureObject, cudaDeviceSynchronize, cudaCreateTextureObject, cudaGraphicsUnregisterResource, cudaMalloc, cudaGraphicsGLRegisterBuffer, cudaGetDeviceProperties ## Dependencies needed to build/run -[X11](../../../README.md#x11), [GL](../../../README.md#gl) +[X11](../../../README.md#x11), [OpenGL](../../../README.md#opengl), [Freeglut](../../../README.md#freeglut), [GLEW](../../../README.md#glew) ## Prerequisites diff --git a/Samples/5_Domain_Specific/bilateralFilter/README.md b/Samples/5_Domain_Specific/bilateralFilter/README.md index 2673923b..0eb3ce78 100644 --- a/Samples/5_Domain_Specific/bilateralFilter/README.md +++ b/Samples/5_Domain_Specific/bilateralFilter/README.md @@ -26,7 +26,7 @@ x86_64, armv7l 
cudaRuntimeGetVersion, cudaGraphicsUnmapResources, cudaMallocPitch, cudaFree, cudaGraphicsResourceGetMappedPointer, cudaGraphicsMapResources, cudaDestroyTextureObject, cudaDeviceSynchronize, cudaCreateTextureObject, cudaMemcpyToSymbol, cudaGraphicsUnregisterResource, cudaGraphicsGLRegisterBuffer, cudaGetDeviceProperties ## Dependencies needed to build/run -[X11](../../../README.md#x11), [GL](../../../README.md#gl) +[X11](../../../README.md#x11), [OpenGL](../../../README.md#opengl), [Freeglut](../../../README.md#freeglut), [GLEW](../../../README.md#glew) ## Prerequisites diff --git a/Samples/5_Domain_Specific/fluidsGL/README.md b/Samples/5_Domain_Specific/fluidsGL/README.md index ad43bfec..aabe7d65 100644 --- a/Samples/5_Domain_Specific/fluidsGL/README.md +++ b/Samples/5_Domain_Specific/fluidsGL/README.md @@ -26,7 +26,7 @@ x86_64, armv7l cudaGraphicsUnmapResources, cudaMemcpy, cudaMallocArray, cudaFreeArray, cudaFree, cudaMallocPitch, cudaGraphicsResourceGetMappedPointer, cudaGraphicsMapResources, cudaDestroyTextureObject, cudaCreateTextureObject, cudaGraphicsUnregisterResource, cudaMalloc, cudaGraphicsGLRegisterBuffer, cudaGetDeviceProperties ## Dependencies needed to build/run -[X11](../../../README.md#x11), [GL](../../../README.md#gl), [CUFFT](../../../README.md#cufft) +[X11](../../../README.md#x11), [OpenGL](../../../README.md#opengl), [Freeglut](../../../README.md#freeglut), [GLEW](../../../README.md#glew), [CUFFT](../../../README.md#cufft) ## Prerequisites diff --git a/Samples/5_Domain_Specific/marchingCubes/README.md b/Samples/5_Domain_Specific/marchingCubes/README.md index b23e9d25..fb6a7460 100644 --- a/Samples/5_Domain_Specific/marchingCubes/README.md +++ b/Samples/5_Domain_Specific/marchingCubes/README.md @@ -26,7 +26,7 @@ x86_64, armv7l cudaGLUnmapBufferObject, cudaGraphicsUnmapResources, cudaCreateChannelDesc, cudaMemcpy, cudaFree, cudaGLMapBufferObject, cudaGraphicsResourceGetMappedPointer, cudaGraphicsMapResources, cudaDestroyTextureObject, 
cudaGLUnregisterBufferObject, cudaCreateTextureObject, cudaGLRegisterBufferObject, cudaGraphicsUnregisterResource, cudaMalloc, cudaGraphicsGLRegisterBuffer ## Dependencies needed to build/run -[X11](../../../README.md#x11), [GL](../../../README.md#gl) +[X11](../../../README.md#x11), [OpenGL](../../../README.md#opengl), [Freeglut](../../../README.md#freeglut), [GLEW](../../../README.md#glew) ## Prerequisites diff --git a/Samples/5_Domain_Specific/nbody/README.md b/Samples/5_Domain_Specific/nbody/README.md index cc8befbe..7b65fcfb 100644 --- a/Samples/5_Domain_Specific/nbody/README.md +++ b/Samples/5_Domain_Specific/nbody/README.md @@ -26,7 +26,7 @@ x86_64, armv7l cudaGraphicsUnmapResources, cudaSetDeviceFlags, cudaGraphicsResourceSetMapFlags, cudaGraphicsResourceGetMappedPointer, cudaGraphicsMapResources, cudaSetDevice, cudaEventSynchronize, cudaGetDeviceCount, cudaGetDeviceProperties, cudaDeviceSynchronize, cudaEventRecord, cudaGetDevice, cudaMemcpyToSymbol, cudaStreamQuery, cudaEventDestroy, cudaEventElapsedTime, cudaDeviceCanAccessPeer, cudaEventCreate ## Dependencies needed to build/run -[X11](../../../README.md#x11), [GL](../../../README.md#gl) +[X11](../../../README.md#x11), [OpenGL](../../../README.md#opengl), [Freeglut](../../../README.md#freeglut), [GLEW](../../../README.md#glew) ## Prerequisites diff --git a/Samples/5_Domain_Specific/postProcessGL/README.md b/Samples/5_Domain_Specific/postProcessGL/README.md index 20f48423..bdabbf6f 100644 --- a/Samples/5_Domain_Specific/postProcessGL/README.md +++ b/Samples/5_Domain_Specific/postProcessGL/README.md @@ -26,7 +26,7 @@ x86_64, armv7l cudaHostAlloc, cudaGraphicsUnmapResources, cudaMalloc, cudaFree, cudaGetChannelDesc, cudaGraphicsResourceGetMappedPointer, cudaGraphicsMapResources, cudaDestroyTextureObject, cudaMemcpyToArray, cudaDeviceSynchronize, cudaCreateTextureObject, cudaProcess, cudaGraphicsUnregisterResource, cudaGraphicsSubResourceGetMappedArray, cudaGraphicsGLRegisterBuffer, 
cudaGraphicsGLRegisterImage ## Dependencies needed to build/run -[X11](../../../README.md#x11), [GL](../../../README.md#gl) +[X11](../../../README.md#x11), [OpenGL](../../../README.md#opengl), [Freeglut](../../../README.md#freeglut), [GLEW](../../../README.md#glew) ## Prerequisites diff --git a/Samples/5_Domain_Specific/recursiveGaussian/README.md b/Samples/5_Domain_Specific/recursiveGaussian/README.md index 710027f5..522274a8 100644 --- a/Samples/5_Domain_Specific/recursiveGaussian/README.md +++ b/Samples/5_Domain_Specific/recursiveGaussian/README.md @@ -26,7 +26,7 @@ x86_64, armv7l cudaGraphicsUnmapResources, cudaMemcpy, cudaFree, cudaGraphicsResourceGetMappedPointer, cudaGraphicsMapResources, cudaDeviceSynchronize, cudaGetDevice, cudaGraphicsUnregisterResource, cudaMalloc, cudaGraphicsGLRegisterBuffer, cudaGetDeviceProperties ## Dependencies needed to build/run -[X11](../../../README.md#x11), [GL](../../../README.md#gl) +[X11](../../../README.md#x11), [OpenGL](../../../README.md#opengl), [Freeglut](../../../README.md#freeglut), [GLEW](../../../README.md#glew) ## Prerequisites diff --git a/Samples/5_Domain_Specific/simpleGL/README.md b/Samples/5_Domain_Specific/simpleGL/README.md index 1731d5a2..3280e144 100644 --- a/Samples/5_Domain_Specific/simpleGL/README.md +++ b/Samples/5_Domain_Specific/simpleGL/README.md @@ -26,7 +26,7 @@ x86_64, armv7l cudaGraphicsUnmapResources, cudaMemcpy, cudaFree, cudaGraphicsResourceGetMappedPointer, cudaGraphicsMapResources, cudaDeviceSynchronize, cudaGraphicsUnregisterResource, cudaMalloc, cudaGraphicsGLRegisterBuffer ## Dependencies needed to build/run -[X11](../../../README.md#x11), [GL](../../../README.md#gl) +[X11](../../../README.md#x11), [OpenGL](../../../README.md#opengl), [Freeglut](../../../README.md#freeglut), [GLEW](../../../README.md#glew) ## Prerequisites diff --git a/Samples/5_Domain_Specific/simpleVulkan/README.md b/Samples/5_Domain_Specific/simpleVulkan/README.md index d202019a..a3d755d4 100644 --- 
a/Samples/5_Domain_Specific/simpleVulkan/README.md +++ b/Samples/5_Domain_Specific/simpleVulkan/README.md @@ -26,7 +26,7 @@ x86_64, aarch64 cudaStreamCreateWithFlags, cudaExternalMemoryGetMappedBuffer, cudaSignalSemaphore, cudaWaitExternalSemaphoresAsync, cudaVertMem, cudaImportExternalSemaphore, cudaWaitSemaphore, cudaHeightMap, cudaSetDevice, cudaGetDeviceCount, cudaSignalExternalSemaphoresAsync, cudaTimelineSemaphore, cudaStreamSynchronize, cudaDestroyExternalMemory, cudaOccupancyMaxActiveBlocksPerMultiprocessor, cudaImportExternalMemory, cudaGetDeviceProperties, cudaDestroyExternalSemaphore ## Dependencies needed to build/run -[X11](../../../README.md#x11), [VULKAN](../../../README.md#vulkan) +[X11](../../../README.md#x11), [VULKAN](../../../README.md#vulkan), [GLFW](../../../README.md#glfw) ## Prerequisites diff --git a/Samples/5_Domain_Specific/simpleVulkanMMAP/README.md b/Samples/5_Domain_Specific/simpleVulkanMMAP/README.md index a38c667a..3880d2fe 100644 --- a/Samples/5_Domain_Specific/simpleVulkanMMAP/README.md +++ b/Samples/5_Domain_Specific/simpleVulkanMMAP/README.md @@ -29,7 +29,7 @@ cuMemCreate, cuMemAddressReserve, cuMemGetAllocationGranularity, cuMemAddressFre cudaWaitExternalSemaphoresAsync, cudaImportExternalSemaphore, cudaDeviceGetAttribute, cudaSetDevice, cudaLaunchHostFunc, cudaMallocHost, cudaSignalExternalSemaphoresAsync, cudaFreeHost, cudaMemsetAsync, cudaMemcpyAsync, cudaGetDeviceCount, cudaStreamCreateWithFlags, cudaStreamDestroy, cudaDestroyExternalSemaphore, cudaSignalSemaphore, cudaWaitSemaphore, cudaFree, cudaStreamSynchronize, cudaMalloc, cudaOccupancyMaxActiveBlocksPerMultiprocessor, cudaGetDeviceProperties ## Dependencies needed to build/run -[X11](../../../README.md#x11), [VULKAN](../../../README.md#vulkan) +[X11](../../../README.md#x11), [VULKAN](../../../README.md#vulkan), [GLFW](../../../README.md#glfw) ## Prerequisites diff --git a/Samples/5_Domain_Specific/smokeParticles/README.md 
b/Samples/5_Domain_Specific/smokeParticles/README.md index e5de93ed..9f040a5c 100644 --- a/Samples/5_Domain_Specific/smokeParticles/README.md +++ b/Samples/5_Domain_Specific/smokeParticles/README.md @@ -26,7 +26,7 @@ x86_64, armv7l cudaExtent, cudaPitchedPtr, cudaCreateTextureObject, cudaMemcpyToSymbol ## Dependencies needed to build/run -[X11](../../../README.md#x11), [GL](../../../README.md#gl) +[X11](../../../README.md#x11), [OpenGL](../../../README.md#opengl), [Freeglut](../../../README.md#freeglut), [GLEW](../../../README.md#glew) ## Prerequisites diff --git a/Samples/5_Domain_Specific/volumeFiltering/README.md b/Samples/5_Domain_Specific/volumeFiltering/README.md index 3e64d058..123b2f47 100644 --- a/Samples/5_Domain_Specific/volumeFiltering/README.md +++ b/Samples/5_Domain_Specific/volumeFiltering/README.md @@ -26,7 +26,7 @@ x86_64, armv7l cudaMemcpy, cudaGraphicsMapResources, cudaDestroySurfaceObject, cudaExtent, cudaDeviceSynchronize, cudaCreateSurfaceObject, cudaMemcpyToSymbol, cudaPitchedPtr, cudaGraphicsResourceGetMappedPointer, cudaCreateTextureObject, cudaGraphicsUnmapResources, cudaMallocArray, cudaFreeArray, cudaDestroyTextureObject, cudaMemset, cudaGraphicsGLRegisterBuffer, cudaFree, cudaGraphicsUnregisterResource, cudaMalloc ## Dependencies needed to build/run -[X11](../../../README.md#x11), [GL](../../../README.md#gl) +[X11](../../../README.md#x11), [OpenGL](../../../README.md#opengl), [Freeglut](../../../README.md#freeglut), [GLEW](../../../README.md#glew) ## Prerequisites diff --git a/Samples/5_Domain_Specific/volumeRender/README.md b/Samples/5_Domain_Specific/volumeRender/README.md index ae424442..3efb1b15 100644 --- a/Samples/5_Domain_Specific/volumeRender/README.md +++ b/Samples/5_Domain_Specific/volumeRender/README.md @@ -26,7 +26,7 @@ x86_64, armv7l cudaProfilerStop, cudaGraphicsUnmapResources, cudaMemcpy, cudaMallocArray, cudaFreeArray, cudaFree, cudaPitchedPtr, cudaGraphicsResourceGetMappedPointer, cudaGraphicsMapResources, 
cudaDestroyTextureObject, cudaExtent, cudaDeviceSynchronize, cudaCreateTextureObject, cudaMemset, cudaMemcpyToSymbol, cudaGraphicsUnregisterResource, cudaMalloc, cudaGraphicsGLRegisterBuffer ## Dependencies needed to build/run -[X11](../../../README.md#x11), [GL](../../../README.md#gl) +[X11](../../../README.md#x11), [OpenGL](../../../README.md#opengl), [Freeglut](../../../README.md#freeglut), [GLEW](../../../README.md#glew) ## Prerequisites diff --git a/Samples/5_Domain_Specific/vulkanImageCUDA/README.md b/Samples/5_Domain_Specific/vulkanImageCUDA/README.md index 2cb33f51..752bd881 100644 --- a/Samples/5_Domain_Specific/vulkanImageCUDA/README.md +++ b/Samples/5_Domain_Specific/vulkanImageCUDA/README.md @@ -26,7 +26,7 @@ x86_64, aarch64 cudaVkSemaphoreSignal, cudaWaitExternalSemaphoresAsync, cudaMemcpy, cudaVkImportSemaphore, cudaImportExternalSemaphore, cudaGetMipmappedArrayLevel, cudaSetDevice, cudaDestroySurfaceObject, cudaExtent, cudaMallocMipmappedArray, cudaCreateSurfaceObject, cudaStreamCreate, cudaSignalExternalSemaphoresAsync, cudaUpdateVkImage, cudaCreateTextureObject, cudaGetDeviceCount, cudaExternalMemoryGetMappedMipmappedArray, cudaDestroyTextureObject, cudaVkImportImageMem, cudaDestroyExternalMemory, cudaVkSemaphoreWait, cudaImportExternalMemory, cudaDestroyExternalSemaphore, cudaFreeMipmappedArray, cudaFree, cudaMalloc, cudaGetDeviceProperties ## Dependencies needed to build/run -[X11](../../../README.md#x11), [VULKAN](../../../README.md#vulkan) +[X11](../../../README.md#x11), [VULKAN](../../../README.md#vulkan), [GLFW](../../../README.md#glfw) ## Prerequisites diff --git a/Samples/6_Performance/UnifiedMemoryPerf/README.md b/Samples/6_Performance/UnifiedMemoryPerf/README.md index a9e6d637..3692b9e5 100644 --- a/Samples/6_Performance/UnifiedMemoryPerf/README.md +++ b/Samples/6_Performance/UnifiedMemoryPerf/README.md @@ -24,7 +24,7 @@ x86_64, armv7l, aarch64 cudaMemcpy, cudaStreamDestroy, cudaMemPrefetchAsync, cudaFree, cudaMallocHost, 
cudaMallocManaged, cudaStreamAttachMemAsync, cudaHostGetDevicePointer, cudaFreeHost, cudaStreamSynchronize, cudaMalloc, cudaMemcpyAsync, cudaStreamCreate, cudaGetDeviceProperties ## Dependencies needed to build/run -[UVM](../../../README.md#uvm) +[UVM](../../../README.md#unified-virtual-memory) ## Prerequisites diff --git a/Samples/8_Platform_Specific/Tegra/EGLSync_CUDAEvent_Interop/README.md b/Samples/8_Platform_Specific/Tegra/EGLSync_CUDAEvent_Interop/README.md index a2163c3e..f5e36508 100644 --- a/Samples/8_Platform_Specific/Tegra/EGLSync_CUDAEvent_Interop/README.md +++ b/Samples/8_Platform_Specific/Tegra/EGLSync_CUDAEvent_Interop/README.md @@ -29,7 +29,7 @@ cuEventRecord, cuDeviceGetAttribute, cuEventCreate, cuCtxSynchronize, cuEventDes cudaMemcpy, cudaGetErrorString, cudaFree, cudaDeviceSynchronize, cudaGetValueMismatch, cudaMalloc ## Dependencies needed to build/run -[EGL](../../../README.md#egl), [EGLSync](../../../README.md#eglsync), [X11](../../../README.md#x11), [GLES](../../../README.md#gles) +[EGL](../../../../README.md#egl), [EGLSync](../../../../README.md#eglsync), [X11](../../../../README.md#x11), [OpenGL ES](../../../../README.md#opengl-es) ## Prerequisites diff --git a/Samples/8_Platform_Specific/Tegra/fluidsGLES/README.md b/Samples/8_Platform_Specific/Tegra/fluidsGLES/README.md index d8b90b0a..48e0721a 100644 --- a/Samples/8_Platform_Specific/Tegra/fluidsGLES/README.md +++ b/Samples/8_Platform_Specific/Tegra/fluidsGLES/README.md @@ -26,7 +26,7 @@ armv7l cudaGraphicsUnmapResources, cudaMemcpy, cudaMallocArray, cudaFreeArray, cudaFree, cudaMallocPitch, cudaGraphicsResourceGetMappedPointer, cudaGraphicsMapResources, cudaDestroyTextureObject, cudaCreateTextureObject, cudaGraphicsUnregisterResource, cudaMalloc, cudaGraphicsGLRegisterBuffer, cudaGetDeviceProperties ## Dependencies needed to build/run -[X11](../../../README.md#x11), [GLES](../../../README.md#gles), [CUFFT](../../../README.md#cufft) +[X11](../../../../README.md#x11), [OpenGL
ES](../../../../README.md#opengl-es), [CUFFT](../../../../README.md#cufft) ## Prerequisites diff --git a/Samples/8_Platform_Specific/Tegra/nbody_opengles/README.md b/Samples/8_Platform_Specific/Tegra/nbody_opengles/README.md index 35a8283e..596199e2 100644 --- a/Samples/8_Platform_Specific/Tegra/nbody_opengles/README.md +++ b/Samples/8_Platform_Specific/Tegra/nbody_opengles/README.md @@ -26,7 +26,7 @@ armv7l cudaGraphicsUnmapResources, cudaSetDeviceFlags, cudaGraphicsResourceSetMapFlags, cudaGraphicsResourceGetMappedPointer, cudaGraphicsMapResources, cudaSetDevice, cudaEventSynchronize, cudaGetDeviceProperties, cudaDeviceSynchronize, cudaEventRecord, cudaGetDevice, cudaMemcpyToSymbol, cudaStreamQuery, cudaEventDestroy, cudaEventElapsedTime, cudaGetDeviceCount, cudaEventCreate ## Dependencies needed to build/run -[X11](../../../README.md#x11), [GLES](../../../README.md#gles) +[X11](../../../../README.md#x11), [OpenGL ES](../../../../README.md#opengl-es) ## Prerequisites diff --git a/Samples/8_Platform_Specific/Tegra/simpleGLES/README.md b/Samples/8_Platform_Specific/Tegra/simpleGLES/README.md index b7cf1d8e..1769bfc9 100644 --- a/Samples/8_Platform_Specific/Tegra/simpleGLES/README.md +++ b/Samples/8_Platform_Specific/Tegra/simpleGLES/README.md @@ -26,7 +26,7 @@ armv7l cudaGraphicsUnmapResources, cudaMemcpy, cudaFree, cudaGraphicsResourceGetMappedPointer, cudaGraphicsMapResources, cudaDeviceSynchronize, cudaGraphicsUnregisterResource, cudaMalloc, cudaGraphicsGLRegisterBuffer ## Dependencies needed to build/run -[X11](../../../README.md#x11), [GLES](../../../README.md#gles) +[X11](../../../../README.md#x11), [OpenGL ES](../../../../README.md#opengl-es) ## Prerequisites diff --git a/Samples/8_Platform_Specific/Tegra/simpleGLES_EGLOutput/README.md b/Samples/8_Platform_Specific/Tegra/simpleGLES_EGLOutput/README.md index e36e5870..25f4706b 100644 --- a/Samples/8_Platform_Specific/Tegra/simpleGLES_EGLOutput/README.md +++ b/Samples/8_Platform_Specific/Tegra/simpleGLES_EGLOutput/README.md @@
-31,7 +31,7 @@ armv7l cudaGraphicsUnmapResources, cudaMemcpy, cudaFree, cudaGraphicsResourceGetMappedPointer, cudaGraphicsMapResources, cudaDeviceSynchronize, cudaGraphicsUnregisterResource, cudaMalloc, cudaGraphicsGLRegisterBuffer ## Dependencies needed to build/run -[EGLOutput](../../../README.md#egloutput), [GLES](../../../README.md#gles) +[EGLOutput](../../../../README.md#egloutput), [OpenGL ES](../../../../README.md#opengl-es) ## Prerequisites