HIP: Heterogeneous-computing Interface for Portability
hip_runtime_api.h
1 /*
2 Copyright (c) 2015 - present Advanced Micro Devices, Inc. All rights reserved.
3 
4 Permission is hereby granted, free of charge, to any person obtaining a copy
5 of this software and associated documentation files (the "Software"), to deal
6 in the Software without restriction, including without limitation the rights
7 to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
8 copies of the Software, and to permit persons to whom the Software is
9 furnished to do so, subject to the following conditions:
10 
11 The above copyright notice and this permission notice shall be included in
12 all copies or substantial portions of the Software.
13 
14 THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15 IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16 FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
17 AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
18 LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
19 OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
20 THE SOFTWARE.
21 */
22 
30 #ifndef HIP_INCLUDE_HIP_HIP_RUNTIME_API_H
31 #define HIP_INCLUDE_HIP_HIP_RUNTIME_API_H
32 
33 
34 #include <string.h> // for getDeviceProp
35 #include <hip/hip_version.h>
36 #include <hip/hip_common.h>
37 
/*
 * Anonymous enumeration of HIP_* status constants.
 *
 * The values are spelled out explicitly; they are the same values the
 * enumerators previously received implicitly (0, 1, 2, 3).
 *
 * NOTE(review): only HIP_SUCCESS and HIP_ERROR_INVALID_VALUE share a value
 * with the similarly named hipError_t enumerators declared later in this
 * header (hipErrorNotInitialized is 3 and hipErrorLaunchOutOfResources is
 * 701), so these constants must not be compared against hipError_t values.
 */
enum {
    HIP_SUCCESS = 0,
    HIP_ERROR_INVALID_VALUE = 1,
    HIP_ERROR_NOT_INITIALIZED = 2,
    HIP_ERROR_LAUNCH_OUT_OF_RESOURCES = 3
};
44 
45 typedef struct {
46  // 32-bit Atomics
47  unsigned hasGlobalInt32Atomics : 1;
48  unsigned hasGlobalFloatAtomicExch : 1;
49  unsigned hasSharedInt32Atomics : 1;
50  unsigned hasSharedFloatAtomicExch : 1;
51  unsigned hasFloatAtomicAdd : 1;
52 
53  // 64-bit Atomics
54  unsigned hasGlobalInt64Atomics : 1;
55  unsigned hasSharedInt64Atomics : 1;
56 
57  // Doubles
58  unsigned hasDoubles : 1;
59 
60  // Warp cross-lane operations
61  unsigned hasWarpVote : 1;
62  unsigned hasWarpBallot : 1;
63  unsigned hasWarpShuffle : 1;
64  unsigned hasFunnelShift : 1;
65 
66  // Sync
67  unsigned hasThreadFenceSystem : 1;
68  unsigned hasSyncThreadsExt : 1;
69 
70  // Misc
71  unsigned hasSurfaceFuncs : 1;
72  unsigned has3dGrid : 1;
73  unsigned hasDynamicParallelism : 1;
75 
76 
77 //---
78 // Common headers for both NVCC and HCC paths:
79 
84 typedef struct hipDeviceProp_t {
85  char name[256];
86  size_t totalGlobalMem;
89  int warpSize;
91  int maxThreadsDim[3];
92  int maxGridSize[3];
93  int clockRate;
96  size_t totalConstMem;
97  int major;
98  int minor;
101  int multiProcessorCount;
108  hipDeviceArch_t arch;
112  int pciBusID;
117  int gcnArch;
118  char gcnArchName[256];
123  int maxTexture2D[2];
124  int maxTexture3D[3];
125  unsigned int* hdpMemFlushCntl;
126  unsigned int* hdpRegFlushCntl;
127  size_t memPitch;
132  int tccDriver;
134  int cooperativeMultiDeviceUnmatchedGridDim;
136  int cooperativeMultiDeviceUnmatchedBlockDim;
138  int cooperativeMultiDeviceUnmatchedSharedMem;
140  int isLargeBar;
144 
145 
/*
 * Memory-type tag. Within this header it is the type of the memoryType
 * member of hipPointerAttribute_t.
 *
 * The numeric values are written out explicitly; they are the values the
 * enumerators received implicitly from their declaration order.
 */
typedef enum hipMemoryType {
    hipMemoryTypeHost = 0,
    hipMemoryTypeDevice = 1,
    hipMemoryTypeArray = 2,
    hipMemoryTypeUnified = 3
} hipMemoryType;
157 
158 
162 typedef struct hipPointerAttribute_t {
163  enum hipMemoryType memoryType;
164  int device;
165  void* devicePointer;
166  void* hostPointer;
167  int isManaged;
168  unsigned allocationFlags; /* flags specified when memory was allocated*/
169  /* peers? */
171 
172 
173 // hack to get these to show up in Doxygen:
// Ignoring error-code return values from HIP APIs is discouraged. When
// compiling as C++17 or newer, hipError_t is marked [[nodiscard]] so that a
// discarded result yields a compiler warning. In C, and in older C++
// dialects, the macro expands to nothing.
#if defined(__cplusplus) && __cplusplus >= 201703L
#define __HIP_NODISCARD [[nodiscard]]
#else
#define __HIP_NODISCARD
#endif

/*
 * @brief hipError_t
 * @enum
 * @ingroup Enumerations
 */
// Developer note - when updating these, also update the hipErrorName and
// hipErrorString functions in the NVCC and HCC paths, and the
// hipCUDAErrorTohipError function in the NVCC path.
//
// Enumerators preceded by a "Deprecated" comment are aliases: each one has
// the same numeric value as the enumerator declared directly above it.

typedef enum __HIP_NODISCARD hipError_t {
    hipSuccess = 0,
    hipErrorInvalidValue = 1,
    hipErrorOutOfMemory = 2,
    // Deprecated
    hipErrorMemoryAllocation = 2,
    hipErrorNotInitialized = 3,
    // Deprecated
    hipErrorInitializationError = 3,
    hipErrorDeinitialized = 4,
    hipErrorProfilerDisabled = 5,
    hipErrorProfilerNotInitialized = 6,
    hipErrorProfilerAlreadyStarted = 7,
    hipErrorProfilerAlreadyStopped = 8,
    hipErrorInvalidConfiguration = 9,
    hipErrorInvalidSymbol = 13,
    hipErrorInvalidDevicePointer = 17,
    hipErrorInvalidMemcpyDirection = 21,
    hipErrorInsufficientDriver = 35,
    hipErrorMissingConfiguration = 52,
    hipErrorPriorLaunchFailure = 53,
    hipErrorInvalidDeviceFunction = 98,
    hipErrorNoDevice = 100,
    hipErrorInvalidDevice = 101,
    hipErrorInvalidImage = 200,
    hipErrorInvalidContext = 201,
    hipErrorContextAlreadyCurrent = 202,
    hipErrorMapFailed = 205,
    // Deprecated
    hipErrorMapBufferObjectFailed = 205,
    hipErrorUnmapFailed = 206,
    hipErrorArrayIsMapped = 207,
    hipErrorAlreadyMapped = 208,
    hipErrorNoBinaryForGpu = 209,
    hipErrorAlreadyAcquired = 210,
    hipErrorNotMapped = 211,
    hipErrorNotMappedAsArray = 212,
    hipErrorNotMappedAsPointer = 213,
    hipErrorECCNotCorrectable = 214,
    hipErrorUnsupportedLimit = 215,
    hipErrorContextAlreadyInUse = 216,
    hipErrorPeerAccessUnsupported = 217,
    hipErrorInvalidKernelFile = 218,
    hipErrorInvalidGraphicsContext = 219,
    hipErrorInvalidSource = 300,
    hipErrorFileNotFound = 301,
    hipErrorSharedObjectSymbolNotFound = 302,
    hipErrorSharedObjectInitFailed = 303,
    hipErrorOperatingSystem = 304,
    hipErrorInvalidHandle = 400,
    // Deprecated
    hipErrorInvalidResourceHandle = 400,
    hipErrorNotFound = 500,
    hipErrorNotReady = 600,
    hipErrorIllegalAddress = 700,
    hipErrorLaunchOutOfResources = 701,
    hipErrorLaunchTimeOut = 702,
    hipErrorPeerAccessAlreadyEnabled = 704,
    hipErrorPeerAccessNotEnabled = 705,
    hipErrorSetOnActiveProcess = 708,
    hipErrorAssert = 710,
    hipErrorHostMemoryAlreadyRegistered = 712,
    hipErrorHostMemoryNotRegistered = 713,
    hipErrorLaunchFailure = 719,
    hipErrorCooperativeLaunchTooLarge = 720,
    hipErrorNotSupported = 801,
    hipErrorUnknown = 999,  ///< Unknown error.
    // HSA Runtime Error Codes start here.
    hipErrorRuntimeMemory = 1052,
    hipErrorRuntimeOther = 1053,
    // No explicit value: takes the next value after hipErrorRuntimeOther (1054).
    hipErrorTbd
} hipError_t;

// The helper macro is only needed for the declaration above.
#undef __HIP_NODISCARD
284 
285 /*
286  * @brief hipDeviceAttribute_t
287  * @enum
288  * @ingroup Enumerations
289  */
290 typedef enum hipDeviceAttribute_t {
333 
336 
343 
354 
/*
 * Compute-mode values (0 through 3).
 *
 * No typedef accompanies this enumeration, so C code must refer to the type
 * as `enum hipComputeMode`.
 */
enum hipComputeMode {
    hipComputeModeDefault = 0,
    hipComputeModeExclusive = 1,
    hipComputeModeProhibited = 2,
    hipComputeModeExclusiveProcess = 3
};
361 
366 #if defined(__HIP_PLATFORM_HCC__) && !defined(__HIP_PLATFORM_NVCC__)
368 #elif defined(__HIP_PLATFORM_NVCC__) && !defined(__HIP_PLATFORM_HCC__)
369 #include "hip/nvcc_detail/hip_runtime_api.h"
370 #else
371 #error("Must define exactly one of __HIP_PLATFORM_HCC__ or __HIP_PLATFORM_NVCC__");
372 #endif
373 
374 
386 #if defined(__cplusplus) && !defined(__HIP_DISABLE_CPP_FUNCTIONS__)
387 template <class T>
388 static inline hipError_t hipMalloc(T** devPtr, size_t size) {
389  return hipMalloc((void**)devPtr, size);
390 }
391 
392 // Provide an override to automatically typecast the pointer type from void**, and also provide a
393 // default for the flags.
394 template <class T>
395 static inline hipError_t hipHostMalloc(T** ptr, size_t size,
396  unsigned int flags = hipHostMallocDefault) {
397  return hipHostMalloc((void**)ptr, size, flags);
398 }
399 
400 template <class T>
401 static inline hipError_t hipMallocManaged(T** devPtr, size_t size,
402  unsigned int flags = hipMemAttachGlobal) {
403  return hipMallocManaged((void**)devPtr, size, flags);
404 }
405 #endif
406 
407 #endif
size_t totalConstMem
Size of constant memory region (in bytes).
Definition: hip_runtime_api.h:96
int asicRevision
Revision of the GPU in this device.
Definition: hip_runtime_api.h:142
Maximum x-dimension of a block.
Definition: hip_runtime_api.h:292
Maximum x-dimension of a grid.
Definition: hip_runtime_api.h:295
Maximum pitch in bytes allowed by memory copies.
Definition: hip_runtime_api.h:337
Global memory bus width in bits.
Definition: hip_runtime_api.h:308
unsigned int * hdpRegFlushCntl
Address of HDP_REG_COHERENCY_FLUSH_CNTL register.
Definition: hip_runtime_api.h:126
size_t texturePitchAlignment
Pitch alignment requirement for texture references bound to pitched memory.
Definition: hip_runtime_api.h:129
int canMapHostMemory
Check whether HIP can map host memory.
Definition: hip_runtime_api.h:116
Definition: hip_runtime_api.h:302
#define hipMemAttachGlobal
Memory can be accessed by any stream on any device.
Definition: hip_runtime_api.h:191
Revision of the GPU in this device.
Definition: hip_runtime_api.h:352
int regsPerBlock
Registers per block.
Definition: hip_runtime_api.h:88
Definition: hip_runtime_api.h:311
Run time limit for kernels executed on the device.
Definition: hip_runtime_api.h:340
#define hipHostMallocDefault
Flags that can be used with hipHostMalloc.
Definition: hip_runtime_api.h:175
Maximum dimension width of 3D images in image elements.
Definition: hip_runtime_api.h:330
iGPU
Definition: hip_runtime_api.h:324
int isMultiGpuBoard
1 if device is on a multi-GPU board, 0 if not.
Definition: hip_runtime_api.h:115
Peak clock frequency in kilohertz.
Definition: hip_runtime_api.h:306
int maxTexture1D
Maximum number of elements in 1D images.
Definition: hip_runtime_api.h:122
Definition: hip_runtime_api.h:162
int clockRate
Max clock frequency of the multiprocessors in kHz.
Definition: hip_runtime_api.h:93
Maximum z-dimension of a grid.
Definition: hip_runtime_api.h:297
Minor compute capability version number.
Definition: hip_runtime_api.h:316
Definition: hip_runtime_api.h:298
int pciBusID
PCI Bus ID.
Definition: hip_runtime_api.h:112
Maximum y-dimension of a grid.
Definition: hip_runtime_api.h:296
Multiple GPU devices.
Definition: hip_runtime_api.h:323
int tccDriver
1 if the device is a Tesla device using the TCC driver, 0 otherwise.
Definition: hip_runtime_api.h:132
int maxThreadsPerBlock
Max work items per work group or workgroup max size.
Definition: hip_runtime_api.h:90
Maximum y-dimension of a block.
Definition: hip_runtime_api.h:293
hipError_t hipHostMalloc(void **ptr, size_t size, unsigned int flags)
Allocate device accessible page locked host memory.
Definition: hip_memory.cpp:762
size_t sharedMemPerBlock
Size of shared memory region (in bytes).
Definition: hip_runtime_api.h:87
Support cooperative launch on multiple devices.
Definition: hip_runtime_api.h:326
int maxThreadsPerMultiProcessor
Maximum resident threads per multi-processor.
Definition: hip_runtime_api.h:105
size_t memPitch
Maximum pitch in bytes allowed by memory copies.
Definition: hip_runtime_api.h:127
int l2CacheSize
L2 cache size.
Definition: hip_runtime_api.h:104
hipDeviceAttribute_t
Definition: hip_runtime_api.h:290
size_t textureAlignment
Alignment requirement for textures.
Definition: hip_runtime_api.h:128
Major compute capability version number.
Definition: hip_runtime_api.h:315
Maximum number of threads per block.
Definition: hip_runtime_api.h:291
int gcnArch
AMD GCN Arch Value. Eg: 803, 701.
Definition: hip_runtime_api.h:117
Maximum dimensions depth of 3D images in image elements.
Definition: hip_runtime_api.h:332
int kernelExecTimeoutEnabled
Run time limit for kernels executed on the device.
Definition: hip_runtime_api.h:130
int computeMode
Compute mode.
Definition: hip_runtime_api.h:106
Maximum z-dimension of a block.
Definition: hip_runtime_api.h:294
PCI Bus ID.
Definition: hip_runtime_api.h:319
unsigned int * hdpMemFlushCntl
Address of HDP_MEM_COHERENCY_FLUSH_CNTL register.
Definition: hip_runtime_api.h:125
Maximum dimension height of 2D images in image elements.
Definition: hip_runtime_api.h:329
Warp size in threads.
Definition: hip_runtime_api.h:301
int major
Definition: hip_runtime_api.h:97
Maximum dimensions height of 3D images in image elements.
Definition: hip_runtime_api.h:331
Peak memory clock frequency in kilohertz.
Definition: hip_runtime_api.h:307
Definition: hip_runtime_api.h:313
Address of the HDP_REG_COHERENCY_FLUSH_CNTL register.
Definition: hip_runtime_api.h:335
int clockInstructionRate
Definition: hip_runtime_api.h:107
int cooperativeMultiDeviceLaunch
HIP device supports cooperative launch on multiple devices.
Definition: hip_runtime_api.h:121
Constant memory size in bytes.
Definition: hip_runtime_api.h:300
Pitch alignment requirement for 2D texture references bound to pitched memory.
Definition: hip_runtime_api.h:339
int warpSize
Warp size.
Definition: hip_runtime_api.h:89
int concurrentKernels
Device can possibly execute multiple kernels concurrently.
Definition: hip_runtime_api.h:110
Alignment requirement for textures.
Definition: hip_runtime_api.h:338
size_t totalGlobalMem
Size of global memory region (in bytes).
Definition: hip_runtime_api.h:86
hipError_t hipMalloc(void **ptr, size_t size)
Allocate memory on the default accelerator.
Definition: hip_memory.cpp:695
Compute mode that device is currently in.
Definition: hip_runtime_api.h:310
PCI Device ID.
Definition: hip_runtime_api.h:320
Device can map host memory into device address space.
Definition: hip_runtime_api.h:341
Number of multiprocessors on the device.
Definition: hip_runtime_api.h:309
int integrated
APU vs dGPU.
Definition: hip_runtime_api.h:119
int memoryBusWidth
Global memory bus width in bits.
Definition: hip_runtime_api.h:95
Definition: hip_runtime_api.h:84
size_t maxSharedMemoryPerMultiProcessor
Maximum Shared Memory Per Multiprocessor.
Definition: hip_runtime_api.h:114
int cooperativeLaunch
HIP device supports cooperative launch.
Definition: hip_runtime_api.h:120
Support cooperative launch.
Definition: hip_runtime_api.h:325
Maximum number of elements in 1D images.
Definition: hip_runtime_api.h:327
int pciDeviceID
PCI Device ID.
Definition: hip_runtime_api.h:113
int pciDomainID
PCI Domain ID.
Definition: hip_runtime_api.h:111
int ECCEnabled
Device has ECC support enabled.
Definition: hip_runtime_api.h:131
Definition: hip_runtime_api.h:45
Contains C function APIs for HIP runtime. This file does not use any HCC builtin or special language ...
int memoryClockRate
Max global memory clock frequency in kHz.
Definition: hip_runtime_api.h:94
Maximum dimension width of 2D images in image elements.
Definition: hip_runtime_api.h:328
hipError_t hipMallocManaged(void **dev_ptr, size_t size, unsigned int flags __dparm(hipMemAttachGlobal))
Allocates memory that will be automatically managed by AMD HMM.
Address of the HDP_MEM_COHERENCY_FLUSH_CNTL register.
Definition: hip_runtime_api.h:334
Device has ECC support enabled.
Definition: hip_runtime_api.h:342
int cooperativeMultiDeviceUnmatchedFunc
Definition: hip_runtime_api.h:133
Definition: hip_runtime_api.h:317