<?xml version="1.0" encoding="UTF-8"?>
<!-- The XML declaration above must stay the very first content of the file; nothing may be placed before it. -->
<!DOCTYPE entry SYSTEM "SamplesInfo.dtd">
<entry >
<name > UnifiedMemoryPerf</name>
<!-- API function names listed for this sample, one <toolkit> element per name.
     Only <toolkit> children belong here; no bare text between them. -->
<cuda_api_list >
<toolkit > cudaMemcpy</toolkit>
<toolkit > cudaStreamDestroy</toolkit>
<toolkit > cudaMemPrefetchAsync</toolkit>
<toolkit > cudaFree</toolkit>
<toolkit > cudaMallocHost</toolkit>
<toolkit > cudaMallocManaged</toolkit>
<toolkit > cudaStreamAttachMemAsync</toolkit>
<toolkit > cudaHostGetDevicePointer</toolkit>
<toolkit > cudaFreeHost</toolkit>
<toolkit > cudaStreamSynchronize</toolkit>
<toolkit > cudaMalloc</toolkit>
<toolkit > cudaMemcpyAsync</toolkit>
<toolkit > cudaStreamCreate</toolkit>
<toolkit > cudaGetDeviceProperties</toolkit>
</cuda_api_list>
<description > <![CDATA[This sample demonstrates the performance comparison using matrix multiplication kernel of Unified Memory with/without hints and other types of memory like zero copy buffers, pageable, pagelocked memory performing synchronous and Asynchronous transfers on a single GPU.]]> </description>
<devicecompilation > whole</devicecompilation>
<!-- Include search paths for the sample, one <path> per entry. All three are relative paths
     (presumably relative to the sample directory; confirm with the build tooling). -->
<includepaths >
<path > ./</path>
<path > ../</path>
<path > ../../../Common</path>
</includepaths>
<!-- Key concepts listed for this sample; every <concept> here carries level="basic". -->
<keyconcepts >
<concept level= "basic" > CUDA Systems Integration</concept>
<concept level= "basic" > Unified Memory</concept>
<concept level= "basic" > CUDA Streams and Events</concept>
<concept level= "basic" > Pinned System Paged Memory</concept>
</keyconcepts>
<!-- Free-text keywords attached to this entry, one <keyword> per term
     (presumably used for search or indexing; confirm with the consumer of this file). -->
<keywords >
<keyword > CUDA</keyword>
<keyword > Unified Memory</keyword>
<keyword > Pinned Memory</keyword>
<keyword > Zero copy buffer</keyword>
<keyword > UVM</keyword>
<keyword > Streams</keyword>
</keywords>
<!-- <libraries> and <librarypaths> have no child entries: no extra libraries or library paths are listed. -->
<libraries >
</libraries>
<librarypaths >
</librarypaths>
<nsight_eclipse > true</nsight_eclipse>
<!-- Source file named as the primary file of the sample. -->
<primary_file > matrixMultiplyPerf.cu</primary_file>
<!-- Required dependencies: a single entry, UVM. -->
<required_dependencies >
<dependency > UVM</dependency>
</required_dependencies>
<!-- Scope entries are written as "N:Label"; all three here use the prefix 1.
     The meaning of the numeric prefix is not defined in this file. -->
<scopes >
<scope > 1:CUDA Basic Topics</scope>
<scope > 1:CUDA Systems Integration</scope>
<scope > 1:Unified Memory</scope>
</scopes>
<!-- Supported environments, one <env> per entry. An <env> gives an <arch>, a <platform>, or both;
     what an omitted child means is not defined in this file. Only <env> children belong here. -->
<supported_envs >
<env >
<arch > x86_64</arch>
<platform > linux</platform>
</env>
<env >
<arch > x86_64</arch>
<platform > macosx</platform>
</env>
<env >
<platform > windows7</platform>
</env>
<env >
<arch > arm</arch>
</env>
<env >
<arch > sbsa</arch>
</env>
<env >
<arch > aarch64</arch>
</env>
<env >
<arch > ppc64le</arch>
<platform > linux</platform>
</env>
</supported_envs>
<!-- Supported SM architectures: a single <from> child with value 3.5
     (presumably the minimum supported version; no upper bound element is present). -->
<supported_sm_architectures >
<from > 3.5</from>
</supported_sm_architectures>
<title > Unified and other CUDA Memories Performance</title>
<type > exe</type>
</entry>