mirror of
https://github.com/NVIDIA/cuda-samples.git
synced 2025-01-19 22:15:55 +08:00
120 lines
4.6 KiB
XML
120 lines
4.6 KiB
XML
<?xml version="1.0" encoding="UTF-8"?>
|
|
<!DOCTYPE entry SYSTEM "SamplesInfo.dtd">
|
|
<entry>
|
|
<name>nbody</name>
|
|
<cflags>
|
|
<flag>-ftz=true</flag>
|
|
</cflags>
|
|
<cuda_api_list>
|
|
<toolkit>cudaGraphicsUnmapResources</toolkit>
|
|
<toolkit>cudaSetDeviceFlags</toolkit>
|
|
<toolkit>cudaGraphicsResourceSetMapFlags</toolkit>
|
|
<toolkit>cudaGraphicsResourceGetMappedPointer</toolkit>
|
|
<toolkit>cudaGraphicsMapResources</toolkit>
|
|
<toolkit>cudaSetDevice</toolkit>
|
|
<toolkit>cudaEventSynchronize</toolkit>
|
|
<toolkit>cudaGetDeviceCount</toolkit>
|
|
<toolkit>cudaGetDeviceProperties</toolkit>
|
|
<toolkit>cudaDeviceSynchronize</toolkit>
|
|
<toolkit>cudaEventRecord</toolkit>
|
|
<toolkit>cudaGetDevice</toolkit>
|
|
<toolkit>cudaMemcpyToSymbol</toolkit>
|
|
<toolkit>cudaStreamQuery</toolkit>
|
|
<toolkit>cudaEventDestroy</toolkit>
|
|
<toolkit>cudaEventElapsedTime</toolkit>
|
|
<toolkit>cudaDeviceCanAccessPeer</toolkit>
|
|
<toolkit>cudaEventCreate</toolkit>
|
|
</cuda_api_list>
|
|
<description><![CDATA[This sample demonstrates efficient all-pairs simulation of a gravitational n-body simulation in CUDA. This sample accompanies the GPU Gems 3 chapter "Fast N-Body Simulation with CUDA". With CUDA 5.5, performance on Tesla K20c has increased to over 1.8TFLOP/s single precision. Double Performance has also improved on all Kepler and Fermi GPU architectures as well. Starting in CUDA 4.0, the nBody sample has been updated to take advantage of new features to easily scale the n-body simulation across multiple GPUs in a single PC. Adding "-numbodies=<bodies>" to the command line will allow users to set # of bodies for simulation. Adding “-numdevices=<N>” to the command line option will cause the sample to use N devices (if available) for simulation. In this mode, the position and velocity data for all bodies are read from system memory using “zero copy” rather than from device memory. For a small number of devices (4 or fewer) and a large enough number of bodies, bandwidth is not a bottleneck so we can achieve strong scaling across these devices.]]></description>
|
|
<devicecompilation>whole</devicecompilation>
|
|
<files>
|
|
<file>./galaxy_20K.bin</file>
|
|
<file>./CMakeLists.txt</file>
|
|
</files>
|
|
<includepaths>
|
|
<path>./</path>
|
|
<path>../</path>
|
|
<path>../../../Common</path>
|
|
</includepaths>
|
|
<keyconcepts>
|
|
<concept level="advanced">Graphics Interop</concept>
|
|
<concept level="advanced">Data Parallel Algorithms</concept>
|
|
<concept level="advanced">Physically-Based Simulation</concept>
|
|
</keyconcepts>
|
|
<keywords>
|
|
<keyword>CUDA</keyword>
|
|
<keyword>GPGPU</keyword>
|
|
<keyword>n-body</keyword>
|
|
<keyword>simulation</keyword>
|
|
<keyword>astrophysics</keyword>
|
|
<keyword>opengl</keyword>
|
|
<keyword>openGL</keyword>
|
|
</keywords>
|
|
<libraries>
|
|
<library>GLU</library>
|
|
<library>GL</library>
|
|
<library framework="true" os="macosx">GLUT</library>
|
|
<library os="linux">GLEW</library>
|
|
<library os="linux">glut</library>
|
|
<library os="linux">X11</library>
|
|
</libraries>
|
|
<librarypaths>
|
|
<path arch="x86_64" os="linux">../../../common/lib/linux/x86_64</path>
|
|
<path arch="armv7l" os="linux">../../../common/lib/linux/armv7l</path>
|
|
<path os="macosx">../../../common/lib/darwin</path>
|
|
</librarypaths>
|
|
<nsight_eclipse>true</nsight_eclipse>
|
|
<primary_file>nbody.cpp</primary_file>
|
|
<qatests>
|
|
<qatest>-benchmark -compare -cpu</qatest>
|
|
</qatests>
|
|
<required_dependencies>
|
|
<dependency>X11</dependency>
|
|
<dependency>GL</dependency>
|
|
</required_dependencies>
|
|
<scopes>
|
|
<scope>2:Graphics Interop</scope>
|
|
<scope>1:CUDA Advanced Topics</scope>
|
|
<scope>1:Data-Parallel Algorithms</scope>
|
|
<scope>3:Physically-Based Simulation</scope>
|
|
</scopes>
|
|
<sm-arch>sm50</sm-arch>
|
|
<sm-arch>sm52</sm-arch>
|
|
<sm-arch>sm53</sm-arch>
|
|
<sm-arch>sm60</sm-arch>
|
|
<sm-arch>sm61</sm-arch>
|
|
<sm-arch>sm70</sm-arch>
|
|
<sm-arch>sm72</sm-arch>
|
|
<sm-arch>sm75</sm-arch>
|
|
<sm-arch>sm80</sm-arch>
|
|
<sm-arch>sm86</sm-arch>
|
|
<sm-arch>sm87</sm-arch>
|
|
<sm-arch>sm89</sm-arch>
|
|
<sm-arch>sm90</sm-arch>
|
|
<supported_envs>
|
|
<env>
|
|
<arch>x86_64</arch>
|
|
<platform>linux</platform>
|
|
</env>
|
|
<env>
|
|
<platform>windows7</platform>
|
|
</env>
|
|
<env>
|
|
<arch>x86_64</arch>
|
|
<platform>macosx</platform>
|
|
</env>
|
|
<env>
|
|
<arch>arm</arch>
|
|
</env>
|
|
<env>
|
|
<arch>sbsa</arch>
|
|
</env>
|
|
</supported_envs>
|
|
<supported_sm_architectures>
|
|
<include>all</include>
|
|
</supported_sm_architectures>
|
|
<title>CUDA N-Body Simulation</title>
|
|
<type>exe</type>
|
|
<whitepaper>doc/nbody_gems3_ch31.pdf</whitepaper>
|
|
</entry>
|