forked from NVIDIA/cuda-samples
-
Notifications
You must be signed in to change notification settings - Fork 0
/
NsightEclipse.xml
100 lines (100 loc) · 3.11 KB
/
NsightEclipse.xml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE entry SYSTEM "SamplesInfo.dtd">
<entry>
  <!-- Metadata record for the conjugateGradientMultiDeviceCG sample. The
       element vocabulary comes from the external SamplesInfo.dtd named in the
       DOCTYPE; that DTD is not visible from this file, so the notes below
       describe only what the record itself states. -->
  <name>conjugateGradientMultiDeviceCG</name>
  <!-- Compiler flags recorded for the sample, one flag element per option. -->
  <cflags>
    <flag>-ewp</flag>
    <flag>-maxrregcount=64</flag>
    <flag>--std=c++11</flag>
  </cflags>
  <!-- CUDA API names associated with the sample, one toolkit element each. -->
  <cuda_api_list>
    <toolkit>cudaHostAlloc</toolkit>
    <toolkit>cudaMemPrefetchAsync</toolkit>
    <toolkit>cudaFree</toolkit>
    <toolkit>cudaLaunchCooperativeKernel</toolkit>
    <toolkit>cudaMallocManaged</toolkit>
    <toolkit>cudaSetDevice</toolkit>
    <toolkit>cudaGetDeviceCount</toolkit>
    <toolkit>cudaGetDeviceProperties</toolkit>
    <toolkit>cudaFreeHost</toolkit>
    <toolkit>cudaMemset</toolkit>
    <toolkit>cudaStreamCreate</toolkit>
    <toolkit>cudaStreamSynchronize</toolkit>
    <toolkit>cudaDeviceEnablePeerAccess</toolkit>
    <toolkit>cudaMemAdvise</toolkit>
    <toolkit>cudaOccupancyMaxActiveBlocksPerMultiprocessor</toolkit>
    <toolkit>cudaDeviceCanAccessPeer</toolkit>
  </cuda_api_list>
  <!-- Human-readable summary. Kept on a single line because whitespace inside
       the CDATA section is part of the text value. -->
  <description><![CDATA[This sample implements a conjugate gradient solver on multiple GPUs using Multi Device Cooperative Groups, also uses Unified Memory optimized using prefetching and usage hints.]]></description>
  <!-- NOTE(review): "whole" presumably selects whole-program device
       compilation, in line with the -ewp flag above; confirm against the
       tool that consumes this file. -->
  <devicecompilation>whole</devicecompilation>
  <!-- Include search paths as written; what they are relative to is not
       stated in this file. -->
  <includepaths>
    <path>./</path>
    <path>../</path>
    <path>../../../Common</path>
  </includepaths>
  <!-- Concepts the sample is tagged with; the level attribute takes the
       values "basic" and "advanced" in this record.
       NOTE(review): CUBLAS Library and CUSPARSE Library are listed here,
       while the libraries element below names only cudadevrt. Confirm
       whether these two concepts are still intended. -->
  <keyconcepts>
    <concept level="basic">Unified Memory</concept>
    <concept level="advanced">Linear Algebra</concept>
    <concept level="basic">Cooperative Groups</concept>
    <concept level="advanced">MultiDevice Cooperative Groups</concept>
    <concept level="advanced">CUBLAS Library</concept>
    <concept level="advanced">CUSPARSE Library</concept>
  </keyconcepts>
  <!-- Free-form keywords attached to the sample. -->
  <keywords>
    <keyword>CUDA</keyword>
    <keyword>Sparse Matrix</keyword>
    <keyword>Unified Memory</keyword>
    <keyword>Multi-GPU</keyword>
    <keyword>CPP11</keyword>
  </keywords>
  <!-- Libraries listed for the sample. -->
  <libraries>
    <library>cudadevrt</library>
  </libraries>
  <!-- No library paths are listed; the element is present but has no
       child elements. -->
  <librarypaths>
  </librarypaths>
  <nsight_eclipse>true</nsight_eclipse>
  <primary_file>conjugateGradientMultiDeviceCG.cu</primary_file>
  <!-- Dependency tags required by the sample.
       NOTE(review): the tags are opaque identifiers here; UVM and MDCG
       presumably correspond to the Unified Memory and MultiDevice
       Cooperative Groups concepts above. Verify against the consumer. -->
  <required_dependencies>
    <dependency>UVM</dependency>
    <dependency>MDCG</dependency>
    <dependency>CPP11</dependency>
  </required_dependencies>
  <!-- Catalogue scopes; each value is a number, a colon, then a label. -->
  <scopes>
    <scope>1:CUDA Advanced Topics</scope>
    <scope>3:Linear Algebra</scope>
  </scopes>
  <!-- SM architecture identifiers, repeated directly under entry with no
       wrapper element. The lowest one, sm60, agrees with the 6.0 lower
       bound in supported_sm_architectures further down. -->
  <sm-arch>sm60</sm-arch>
  <sm-arch>sm61</sm-arch>
  <sm-arch>sm70</sm-arch>
  <sm-arch>sm72</sm-arch>
  <sm-arch>sm75</sm-arch>
  <sm-arch>sm80</sm-arch>
  <sm-arch>sm86</sm-arch>
  <sm-arch>sm87</sm-arch>
  <sm-arch>sm89</sm-arch>
  <sm-arch>sm90</sm-arch>
  <!-- Supported environments, one env element per combination.
       NOTE(review): x86_64 and ppc64le are given in arch elements, but
       aarch64 and sbsa are given in platform elements. Confirm that the
       consumer expects those two values under platform rather than arch. -->
  <supported_envs>
    <env>
      <arch>x86_64</arch>
      <platform>linux</platform>
    </env>
    <env>
      <arch>ppc64le</arch>
      <platform>linux</platform>
    </env>
    <env>
      <platform>windows</platform>
    </env>
    <env>
      <platform>aarch64</platform>
    </env>
    <env>
      <platform>sbsa</platform>
    </env>
  </supported_envs>
  <!-- Lower bound only: a from value of 6.0 with no upper bound element. -->
  <supported_sm_architectures>
    <from>6.0</from>
  </supported_sm_architectures>
  <title>conjugateGradient using MultiDevice Cooperative Groups</title>
  <type>exe</type>
</entry>