streamOrderedAllocationIPC --std=c++11 cuDeviceGetAttribute cuDeviceGet cudaDeviceGetAttribute cudaMemPoolImportFromShareableHandle cudaSetDevice cudaMemPoolExportPointer cudaMemPoolGetAccess cudaMemPoolDestroy cudaMemPoolSetAccess cudaMallocAsync cudaMemPoolImportPointer cudaGetDeviceCount cudaMemcpyAsync cudaDeviceCanAccessPeer cudaFreeAsync cudaStreamCreateWithFlags cudaStreamDestroy cudaGetLastError cudaMemPoolCreate cudaMemPoolExportToShareableHandle cudaStreamSynchronize cudaDeviceEnablePeerAccess cudaOccupancyMaxActiveBlocksPerMultiprocessor cudaGetDeviceProperties whole ./ ../ ../../../Common Performance Strategies cuda CUDA true streamOrderedAllocationIPC.cu 1:CUDA Basic Topics 1:Performance Strategies sm60 sm61 sm70 sm72 sm75 sm80 sm86 sm87 sm90 ../../../Common/helper_multiprocess.cpp ../../../Common/helper_multiprocess.h x86_64 linux 6.0 stream Ordered Allocation IPC Pools exe