30 #ifndef HIP_INCLUDE_HIP_HIP_RUNTIME_API_H 31 #define HIP_INCLUDE_HIP_HIP_RUNTIME_API_H 35 #include <hip/hip_version.h> 36 #include <hip/hip_common.h> 40 HIP_ERROR_INVALID_VALUE,
41 HIP_ERROR_NOT_INITIALIZED,
42 HIP_ERROR_LAUNCH_OUT_OF_RESOURCES
47 unsigned hasGlobalInt32Atomics : 1;
48 unsigned hasGlobalFloatAtomicExch : 1;
49 unsigned hasSharedInt32Atomics : 1;
50 unsigned hasSharedFloatAtomicExch : 1;
51 unsigned hasFloatAtomicAdd : 1;
54 unsigned hasGlobalInt64Atomics : 1;
55 unsigned hasSharedInt64Atomics : 1;
58 unsigned hasDoubles : 1;
61 unsigned hasWarpVote : 1;
62 unsigned hasWarpBallot : 1;
63 unsigned hasWarpShuffle : 1;
64 unsigned hasFunnelShift : 1;
67 unsigned hasThreadFenceSystem : 1;
68 unsigned hasSyncThreadsExt : 1;
71 unsigned hasSurfaceFuncs : 1;
72 unsigned has3dGrid : 1;
73 unsigned hasDynamicParallelism : 1;
101 int multiProcessorCount;
118 char gcnArchName[256];
134 int cooperativeMultiDeviceUnmatchedGridDim;
136 int cooperativeMultiDeviceUnmatchedBlockDim;
138 int cooperativeMultiDeviceUnmatchedSharedMem;
149 typedef enum hipMemoryType {
163 enum hipMemoryType memoryType;
168 unsigned allocationFlags;
182 #if __cplusplus >= 201703L 183 #define __HIP_NODISCARD [[nodiscard]] 185 #define __HIP_NODISCARD 196 typedef enum __HIP_NODISCARD hipError_t {
198 hipErrorInvalidValue = 1,
199 hipErrorOutOfMemory = 2,
202 hipErrorMemoryAllocation = 2,
203 hipErrorNotInitialized = 3,
205 hipErrorInitializationError = 3,
206 hipErrorDeinitialized = 4,
207 hipErrorProfilerDisabled = 5,
208 hipErrorProfilerNotInitialized = 6,
209 hipErrorProfilerAlreadyStarted = 7,
210 hipErrorProfilerAlreadyStopped = 8,
211 hipErrorInvalidConfiguration = 9,
212 hipErrorInvalidSymbol = 13,
213 hipErrorInvalidDevicePointer = 17,
214 hipErrorInvalidMemcpyDirection = 21,
215 hipErrorInsufficientDriver = 35,
216 hipErrorMissingConfiguration = 52,
217 hipErrorPriorLaunchFailure = 53,
218 hipErrorInvalidDeviceFunction = 98,
219 hipErrorNoDevice = 100,
220 hipErrorInvalidDevice = 101,
221 hipErrorInvalidImage = 200,
222 hipErrorInvalidContext = 201,
223 hipErrorContextAlreadyCurrent = 202,
224 hipErrorMapFailed = 205,
226 hipErrorMapBufferObjectFailed = 205,
227 hipErrorUnmapFailed = 206,
228 hipErrorArrayIsMapped = 207,
229 hipErrorAlreadyMapped = 208,
230 hipErrorNoBinaryForGpu = 209,
231 hipErrorAlreadyAcquired = 210,
232 hipErrorNotMapped = 211,
233 hipErrorNotMappedAsArray = 212,
234 hipErrorNotMappedAsPointer = 213,
235 hipErrorECCNotCorrectable = 214,
236 hipErrorUnsupportedLimit = 215,
237 hipErrorContextAlreadyInUse = 216,
238 hipErrorPeerAccessUnsupported = 217,
239 hipErrorInvalidKernelFile = 218,
240 hipErrorInvalidGraphicsContext = 219,
241 hipErrorInvalidSource = 300,
242 hipErrorFileNotFound = 301,
243 hipErrorSharedObjectSymbolNotFound = 302,
244 hipErrorSharedObjectInitFailed = 303,
245 hipErrorOperatingSystem = 304,
246 hipErrorInvalidHandle = 400,
248 hipErrorInvalidResourceHandle = 400,
249 hipErrorNotFound = 500,
250 hipErrorNotReady = 600,
251 hipErrorIllegalAddress = 700,
255 hipErrorLaunchOutOfResources = 701,
256 hipErrorLaunchTimeOut = 702,
257 hipErrorPeerAccessAlreadyEnabled =
259 hipErrorPeerAccessNotEnabled =
261 hipErrorSetOnActiveProcess = 708,
262 hipErrorAssert = 710,
263 hipErrorHostMemoryAlreadyRegistered =
265 hipErrorHostMemoryNotRegistered =
267 hipErrorLaunchFailure =
269 hipErrorCooperativeLaunchTooLarge =
271 hipErrorNotSupported = 801,
274 hipErrorUnknown = 999,
276 hipErrorRuntimeMemory = 1052,
277 hipErrorRuntimeOther = 1053,
283 #undef __HIP_NODISCARD 355 enum hipComputeMode {
356 hipComputeModeDefault = 0,
357 hipComputeModeExclusive = 1,
358 hipComputeModeProhibited = 2,
359 hipComputeModeExclusiveProcess = 3
366 #if defined(__HIP_PLATFORM_HCC__) && !defined(__HIP_PLATFORM_NVCC__) 368 #elif defined(__HIP_PLATFORM_NVCC__) && !defined(__HIP_PLATFORM_HCC__) 369 #include "hip/nvcc_detail/hip_runtime_api.h" 371 #error("Must define exactly one of __HIP_PLATFORM_HCC__ or __HIP_PLATFORM_NVCC__"); 386 #if defined(__cplusplus) && !defined(__HIP_DISABLE_CPP_FUNCTIONS__) 388 static inline hipError_t
hipMalloc(T** devPtr,
size_t size) {
Definition: hip_runtime_api.h:344
size_t totalConstMem
Size of constant memory region (in bytes).
Definition: hip_runtime_api.h:96
Definition: hip_runtime_api.h:321
int asicRevision
Revision of the GPU in this device.
Definition: hip_runtime_api.h:142
Maximum x-dimension of a block.
Definition: hip_runtime_api.h:292
Maximum x-dimension of a grid.
Definition: hip_runtime_api.h:295
Maximum pitch in bytes allowed by memory copies.
Definition: hip_runtime_api.h:337
Global memory bus width in bits.
Definition: hip_runtime_api.h:308
unsigned int * hdpRegFlushCntl
Address of the HDP_REG_COHERENCY_FLUSH_CNTL register.
Definition: hip_runtime_api.h:126
size_t texturePitchAlignment
Pitch alignment requirement for texture references bound to pitched memory.
Definition: hip_runtime_api.h:129
int canMapHostMemory
Check whether HIP can map host memory.
Definition: hip_runtime_api.h:116
Definition: hip_runtime_api.h:302
#define hipMemAttachGlobal
Memory can be accessed by any stream on any device.
Definition: hip_runtime_api.h:191
Revision of the GPU in this device.
Definition: hip_runtime_api.h:352
int regsPerBlock
Registers per block.
Definition: hip_runtime_api.h:88
Definition: hip_runtime_api.h:311
Run time limit for kernels executed on the device.
Definition: hip_runtime_api.h:340
#define hipHostMallocDefault
Flags that can be used with hipHostMalloc.
Definition: hip_runtime_api.h:175
Maximum dimension width of 3D images in image elements.
Definition: hip_runtime_api.h:330
iGPU
Definition: hip_runtime_api.h:324
int isMultiGpuBoard
1 if device is on a multi-GPU board, 0 if not.
Definition: hip_runtime_api.h:115
Peak clock frequency in kilohertz.
Definition: hip_runtime_api.h:306
int maxTexture1D
Maximum number of elements in 1D images.
Definition: hip_runtime_api.h:122
Definition: hip_runtime_api.h:162
int clockRate
Max clock frequency of the multiprocessors in kHz.
Definition: hip_runtime_api.h:93
Maximum z-dimension of a grid.
Definition: hip_runtime_api.h:297
Minor compute capability version number.
Definition: hip_runtime_api.h:316
Definition: hip_runtime_api.h:298
int pciBusID
PCI Bus ID.
Definition: hip_runtime_api.h:112
Definition: hip_runtime_api.h:346
Maximum y-dimension of a grid.
Definition: hip_runtime_api.h:296
Multiple GPU devices.
Definition: hip_runtime_api.h:323
int tccDriver
1 if the device is a Tesla device using the TCC driver, 0 if not.
Definition: hip_runtime_api.h:132
int maxThreadsPerBlock
Max work items per work group or workgroup max size.
Definition: hip_runtime_api.h:90
Maximum y-dimension of a block.
Definition: hip_runtime_api.h:293
hipError_t hipHostMalloc(void **ptr, size_t size, unsigned int flags)
Allocate device accessible page locked host memory.
Definition: hip_memory.cpp:762
Definition: hip_runtime_api.h:348
size_t sharedMemPerBlock
Size of shared memory region (in bytes).
Definition: hip_runtime_api.h:87
Support cooperative launch on multiple devices.
Definition: hip_runtime_api.h:326
int maxThreadsPerMultiProcessor
Maximum resident threads per multi-processor.
Definition: hip_runtime_api.h:105
size_t memPitch
Maximum pitch in bytes allowed by memory copies.
Definition: hip_runtime_api.h:127
int l2CacheSize
L2 cache size.
Definition: hip_runtime_api.h:104
hipDeviceAttribute_t
Definition: hip_runtime_api.h:290
size_t textureAlignment
Alignment requirement for textures.
Definition: hip_runtime_api.h:128
Major compute capability version number.
Definition: hip_runtime_api.h:315
Maximum number of threads per block.
Definition: hip_runtime_api.h:291
int gcnArch
AMD GCN Arch Value, e.g. 803, 701.
Definition: hip_runtime_api.h:117
Maximum dimensions depth of 3D images in image elements.
Definition: hip_runtime_api.h:332
int kernelExecTimeoutEnabled
Run time limit for kernels executed on the device.
Definition: hip_runtime_api.h:130
int computeMode
Compute mode.
Definition: hip_runtime_api.h:106
Maximum z-dimension of a block.
Definition: hip_runtime_api.h:294
PCI Bus ID.
Definition: hip_runtime_api.h:319
unsigned int * hdpMemFlushCntl
Address of the HDP_MEM_COHERENCY_FLUSH_CNTL register.
Definition: hip_runtime_api.h:125
Maximum dimension height of 2D images in image elements.
Definition: hip_runtime_api.h:329
Warp size in threads.
Definition: hip_runtime_api.h:301
int major
Definition: hip_runtime_api.h:97
Maximum dimensions height of 3D images in image elements.
Definition: hip_runtime_api.h:331
Peak memory clock frequency in kilohertz.
Definition: hip_runtime_api.h:307
Definition: hip_runtime_api.h:313
Address of the HDP_REG_COHERENCY_FLUSH_CNTL register.
Definition: hip_runtime_api.h:335
int clockInstructionRate
Definition: hip_runtime_api.h:107
int cooperativeMultiDeviceLaunch
HIP device supports cooperative launch on multiple devices.
Definition: hip_runtime_api.h:121
Constant memory size in bytes.
Definition: hip_runtime_api.h:300
Pitch alignment requirement for 2D texture references bound to pitched memory.
Definition: hip_runtime_api.h:339
int warpSize
Warp size.
Definition: hip_runtime_api.h:89
int concurrentKernels
Device can possibly execute multiple kernels concurrently.
Definition: hip_runtime_api.h:110
Alignment requirement for textures.
Definition: hip_runtime_api.h:338
size_t totalGlobalMem
Size of global memory region (in bytes).
Definition: hip_runtime_api.h:86
hipError_t hipMalloc(void **ptr, size_t size)
Allocate memory on the default accelerator.
Definition: hip_memory.cpp:695
Compute mode that device is currently in.
Definition: hip_runtime_api.h:310
PCI Device ID.
Definition: hip_runtime_api.h:320
Device can map host memory into device address space.
Definition: hip_runtime_api.h:341
Number of multiprocessors on the device.
Definition: hip_runtime_api.h:309
int integrated
APU vs dGPU.
Definition: hip_runtime_api.h:119
int memoryBusWidth
Global memory bus width in bits.
Definition: hip_runtime_api.h:95
Definition: hip_runtime_api.h:84
size_t maxSharedMemoryPerMultiProcessor
Maximum Shared Memory Per Multiprocessor.
Definition: hip_runtime_api.h:114
int cooperativeLaunch
HIP device supports cooperative launch.
Definition: hip_runtime_api.h:120
Support cooperative launch.
Definition: hip_runtime_api.h:325
Maximum number of elements in 1D images.
Definition: hip_runtime_api.h:327
int pciDeviceID
PCI Device ID.
Definition: hip_runtime_api.h:113
int pciDomainID
PCI Domain ID.
Definition: hip_runtime_api.h:111
int ECCEnabled
Device has ECC support enabled.
Definition: hip_runtime_api.h:131
Definition: hip_runtime_api.h:45
Contains C function APIs for HIP runtime. This file does not use any HCC builtin or special language ...
Definition: hip_runtime_api.h:350
int memoryClockRate
Max global memory clock frequency in kHz.
Definition: hip_runtime_api.h:94
Maximum dimension width of 2D images in image elements.
Definition: hip_runtime_api.h:328
hipError_t hipMallocManaged(void **dev_ptr, size_t size, unsigned int flags __dparm(hipMemAttachGlobal))
Allocates memory that will be automatically managed by AMD HMM.
Address of the HDP_MEM_COHERENCY_FLUSH_CNTL register.
Definition: hip_runtime_api.h:334
Device has ECC support enabled.
Definition: hip_runtime_api.h:342
int cooperativeMultiDeviceUnmatchedFunc
Definition: hip_runtime_api.h:133
Definition: hip_runtime_api.h:317