HIP: Heterogeneous-computing Interface for Portability
|
Go to the documentation of this file.
30 #ifndef HIP_INCLUDE_HIP_HIP_RUNTIME_API_H
31 #define HIP_INCLUDE_HIP_HIP_RUNTIME_API_H
35 #include <hip/hip_common.h>
39 HIP_ERROR_INVALID_VALUE,
40 HIP_ERROR_NOT_INITIALIZED,
41 HIP_ERROR_LAUNCH_OUT_OF_RESOURCES
167 unsigned allocationFlags;
181 #if __cplusplus >= 201703L
182 #define __HIP_NODISCARD [[nodiscard]]
184 #define __HIP_NODISCARD
195 typedef enum __HIP_NODISCARD hipError_t {
198 hipErrorOutOfMemory = 2,
202 hipErrorNotInitialized = 3,
204 hipErrorInitializationError = 3,
205 hipErrorDeinitialized = 4,
206 hipErrorProfilerDisabled = 5,
207 hipErrorProfilerNotInitialized = 6,
208 hipErrorProfilerAlreadyStarted = 7,
209 hipErrorProfilerAlreadyStopped = 8,
210 hipErrorInvalidConfiguration = 9,
211 hipErrorInvalidSymbol = 13,
214 hipErrorInsufficientDriver = 35,
215 hipErrorMissingConfiguration = 52,
216 hipErrorPriorLaunchFailure = 53,
217 hipErrorInvalidDeviceFunction = 98,
220 hipErrorInvalidImage = 200,
222 hipErrorContextAlreadyCurrent = 202,
223 hipErrorMapFailed = 205,
226 hipErrorUnmapFailed = 206,
227 hipErrorArrayIsMapped = 207,
228 hipErrorAlreadyMapped = 208,
229 hipErrorNoBinaryForGpu = 209,
230 hipErrorAlreadyAcquired = 210,
231 hipErrorNotMapped = 211,
232 hipErrorNotMappedAsArray = 212,
233 hipErrorNotMappedAsPointer = 213,
234 hipErrorECCNotCorrectable = 214,
235 hipErrorUnsupportedLimit = 215,
236 hipErrorContextAlreadyInUse = 216,
237 hipErrorPeerAccessUnsupported = 217,
239 hipErrorInvalidGraphicsContext = 219,
240 hipErrorInvalidSource = 300,
241 hipErrorFileNotFound = 301,
242 hipErrorSharedObjectSymbolNotFound = 302,
243 hipErrorSharedObjectInitFailed = 303,
244 hipErrorOperatingSystem = 304,
245 hipErrorInvalidHandle = 400,
248 hipErrorNotFound = 500,
250 hipErrorIllegalAddress = 700,
255 hipErrorLaunchTimeOut = 702,
260 hipErrorSetOnActiveProcess = 708,
273 hipErrorUnknown = 999,
282 #undef __HIP_NODISCARD
354 enum hipComputeMode {
355 hipComputeModeDefault = 0,
356 hipComputeModeExclusive = 1,
357 hipComputeModeProhibited = 2,
358 hipComputeModeExclusiveProcess = 3
365 #if defined(__HIP_PLATFORM_HCC__) && !defined(__HIP_PLATFORM_NVCC__)
367 #elif defined(__HIP_PLATFORM_NVCC__) && !defined(__HIP_PLATFORM_HCC__)
368 #include "hip/nvcc_detail/hip_runtime_api.h"
370 #error("Must define exactly one of __HIP_PLATFORM_HCC__ or __HIP_PLATFORM_NVCC__");
385 #if defined(__cplusplus) && !defined(__HIP_DISABLE_CPP_FUNCTIONS__)
387 static inline hipError_t
hipMalloc(T** devPtr,
size_t size) {
@ hipDeviceAttributeMaxPitch
Maximum pitch in bytes allowed by memory copies.
Definition: hip_runtime_api.h:336
int regsPerBlock
Registers per block.
Definition: hip_runtime_api.h:87
@ hipDeviceAttributeMemoryBusWidth
Global memory bus width in bits.
Definition: hip_runtime_api.h:307
hipErrorInvalidMemcpyDirection
Invalid memory copy direction.
Definition: hip_runtime_api.h:213
unsigned hasGlobalInt64Atomics
64-bit integer atomics for global memory.
Definition: hip_runtime_api.h:53
int minor
Definition: hip_runtime_api.h:99
@ hipDeviceAttributeMaxBlockDimX
Maximum x-dimension of a block.
Definition: hip_runtime_api.h:291
hipErrorInvalidDevicePointer
Invalid Device Pointer.
Definition: hip_runtime_api.h:212
hipErrorMapBufferObjectFailed
Produced when the IPC memory attach failed from ROCr.
Definition: hip_runtime_api.h:225
size_t texturePitchAlignment
Pitch alignment requirement for texture references bound to pitched memory.
Definition: hip_runtime_api.h:128
@ hipDeviceAttributeMaxGridDimX
Maximum x-dimension of a grid.
Definition: hip_runtime_api.h:294
unsigned hasThreadFenceSystem
__threadfence_system.
Definition: hip_runtime_api.h:66
int maxTexture3D[3]
Maximum dimensions (width, height, depth) of 3D images, in image elements.
Definition: hip_runtime_api.h:123
int cooperativeMultiDeviceUnmatchedBlockDim
Definition: hip_runtime_api.h:136
hipErrorHostMemoryNotRegistered
Produced when trying to unlock a non-page-locked memory.
Definition: hip_runtime_api.h:264
hipErrorRuntimeOther
Definition: hip_runtime_api.h:277
@ hipDeviceAttributeClockRate
Peak clock frequency in kilohertz.
Definition: hip_runtime_api.h:305
int asicRevision
Revision of the GPU in this device.
Definition: hip_runtime_api.h:141
@ hipDeviceAttributeMaxGridDimZ
Maximum z-dimension of a grid.
Definition: hip_runtime_api.h:296
@ hipMemoryTypeDevice
Definition: hip_runtime_api.h:150
@ hipDeviceAttributeMaxRegistersPerBlock
Definition: hip_runtime_api.h:301
hipErrorNoDevice
Call to hipGetDeviceCount returned 0 devices.
Definition: hip_runtime_api.h:218
int isLargeBar
1 if it is a large PCI BAR device, else 0.
Definition: hip_runtime_api.h:140
@ hipDeviceAttributeComputeCapabilityMinor
Minor compute capability version number.
Definition: hip_runtime_api.h:315
@ hipDeviceAttributeAsicRevision
Revision of the GPU in this device.
Definition: hip_runtime_api.h:351
int l2CacheSize
L2 cache size.
Definition: hip_runtime_api.h:103
size_t textureAlignment
Alignment requirement for textures.
Definition: hip_runtime_api.h:127
hipError_t hipHostMalloc(void **ptr, size_t size, unsigned int flags)
Allocate device accessible page locked host memory.
Definition: hip_memory.cpp:762
@ hipDeviceAttributeKernelExecTimeout
Run time limit for kernels executed on the device.
Definition: hip_runtime_api.h:339
@ hipDeviceAttributeL2CacheSize
Definition: hip_runtime_api.h:310
@ hipDeviceAttributeCooperativeMultiDeviceUnmatchedGridDim
Definition: hip_runtime_api.h:345
@ hipDeviceAttributeMaxTexture3DWidth
Maximum dimension width of 3D images in image elements.
Definition: hip_runtime_api.h:329
unsigned hasSurfaceFuncs
Surface functions.
Definition: hip_runtime_api.h:70
@ hipDeviceAttributeIntegrated
iGPU
Definition: hip_runtime_api.h:323
int isMultiGpuBoard
1 if device is on a multi-GPU board, 0 if not.
Definition: hip_runtime_api.h:114
@ hipDeviceAttributeMaxGridDimY
Maximum y-dimension of a grid.
Definition: hip_runtime_api.h:295
@ hipMemoryTypeHost
Memory is physically located on host.
Definition: hip_runtime_api.h:149
hipErrorInvalidContext
Produced when input context is invalid.
Definition: hip_runtime_api.h:221
unsigned hasSharedInt64Atomics
64-bit integer atomics for shared memory.
Definition: hip_runtime_api.h:54
int computeMode
Compute mode.
Definition: hip_runtime_api.h:105
@ hipDeviceAttributeIsMultiGpuBoard
Multiple GPU devices.
Definition: hip_runtime_api.h:322
int clockRate
Max clock frequency of the multiprocessors in kHz.
Definition: hip_runtime_api.h:92
unsigned int * hdpRegFlushCntl
Address of the HDP_REG_COHERENCY_FLUSH_CNTL register.
Definition: hip_runtime_api.h:125
hipErrorPeerAccessNotEnabled
Peer access was never enabled from the current device.
Definition: hip_runtime_api.h:258
unsigned hasDynamicParallelism
Dynamic parallelism.
Definition: hip_runtime_api.h:72
int canMapHostMemory
Check whether HIP can map host memory.
Definition: hip_runtime_api.h:115
size_t sharedMemPerBlock
Size of shared memory region (in bytes).
Definition: hip_runtime_api.h:86
@ hipDeviceAttributeCooperativeMultiDeviceLaunch
Support cooperative launch on multiple devices.
Definition: hip_runtime_api.h:325
int maxThreadsPerMultiProcessor
Maximum resident threads per multi-processor.
Definition: hip_runtime_api.h:104
int major
Definition: hip_runtime_api.h:96
@ hipDeviceAttributeMaxSharedMemoryPerBlock
Definition: hip_runtime_api.h:297
hipSuccess
Successful completion.
Definition: hip_runtime_api.h:196
@ hipDeviceAttributeMaxThreadsPerBlock
Maximum number of threads per block.
Definition: hip_runtime_api.h:290
int gcnArch
AMD GCN Arch Value, e.g. 803, 701.
Definition: hip_runtime_api.h:116
Definition: hip_runtime_api.h:44
int kernelExecTimeoutEnabled
Run time limit for kernels executed on the device.
Definition: hip_runtime_api.h:129
int maxTexture1D
Maximum number of elements in 1D images.
Definition: hip_runtime_api.h:121
@ hipDeviceAttributeMaxBlockDimZ
Maximum z-dimension of a block.
Definition: hip_runtime_api.h:293
hipError_t hipMallocManaged(void **dev_ptr, size_t size, unsigned int flags __dparm(hipMemAttachGlobal))
Allocates memory that will be automatically managed by AMD HMM.
unsigned hasDoubles
Double-precision floating point.
Definition: hip_runtime_api.h:57
hipErrorInvalidKernelFile
In CUDA DRV, it is CUDA_ERROR_INVALID_PTX.
Definition: hip_runtime_api.h:238
int maxThreadsPerBlock
Max work items per work group or workgroup max size.
Definition: hip_runtime_api.h:89
@ hipDeviceAttributeMaxBlockDimY
Maximum y-dimension of a block.
Definition: hip_runtime_api.h:292
Definition: hip_runtime_api.h:83
@ hipDeviceAttributeCooperativeMultiDeviceUnmatchedBlockDim
Definition: hip_runtime_api.h:347
@ hipDeviceAttributeMaxTexture2DHeight
Maximum dimension height of 2D images in image elements.
Definition: hip_runtime_api.h:328
unsigned hasSharedInt32Atomics
32-bit integer atomics for shared memory.
Definition: hip_runtime_api.h:48
hipErrorInvalidValue
Definition: hip_runtime_api.h:197
size_t memPitch
Maximum pitch in bytes allowed by memory copies.
Definition: hip_runtime_api.h:126
int pciBusID
PCI Bus ID.
Definition: hip_runtime_api.h:111
@ hipDeviceAttributeComputeCapabilityMajor
Major compute capability version number.
Definition: hip_runtime_api.h:314
@ hipDeviceAttributeMaxTexture3DDepth
Maximum dimension depth of 3D images in image elements.
Definition: hip_runtime_api.h:331
hipErrorRuntimeMemory
Definition: hip_runtime_api.h:275
@ hipDeviceAttributeMaxThreadsPerMultiProcessor
Definition: hip_runtime_api.h:312
hipDeviceArch_t arch
Architectural feature flags. New for HIP.
Definition: hip_runtime_api.h:108
Contains C function APIs for HIP runtime. This file does not use any HCC builtin or special language ...
@ hipDeviceAttributeHdpRegFlushCntl
Address of the HDP_REG_COHERENCY_FLUSH_CNTL register.
Definition: hip_runtime_api.h:334
@ hipDeviceAttributePciBusId
PCI Bus ID.
Definition: hip_runtime_api.h:318
int tccDriver
1 if the device is a Tesla device using the TCC driver, else 0.
Definition: hip_runtime_api.h:131
hipError_t hipMalloc(void **ptr, size_t size)
Allocate memory on the default accelerator.
Definition: hip_memory.cpp:695
@ hipMemoryTypeUnified
Not used currently.
Definition: hip_runtime_api.h:154
@ hipDeviceAttributeTexturePitchAlignment
Pitch alignment requirement for 2D texture references bound to pitched memory.
Definition: hip_runtime_api.h:338
@ hipDeviceAttributeWarpSize
Warp size in threads.
Definition: hip_runtime_api.h:300
unsigned hasGlobalInt32Atomics
32-bit integer atomics for global memory.
Definition: hip_runtime_api.h:46
unsigned hasSyncThreadsExt
__syncthreads_count, __syncthreads_and, __syncthreads_or.
Definition: hip_runtime_api.h:67
@ hipMemoryTypeArray
Definition: hip_runtime_api.h:152
hipErrorInvalidDevice
DeviceID must be in range 0...#compute-devices.
Definition: hip_runtime_api.h:219
unsigned hasFunnelShift
Funnel two words into one with shift&mask caps.
Definition: hip_runtime_api.h:63
@ hipDeviceAttributeMaxTexture3DHeight
Maximum dimension height of 3D images in image elements.
Definition: hip_runtime_api.h:330
@ hipDeviceAttributeMemoryClockRate
Peak memory clock frequency in kilohertz.
Definition: hip_runtime_api.h:306
hipErrorNotReady
Definition: hip_runtime_api.h:249
struct hipPointerAttribute_t hipPointerAttribute_t
int maxGridSize[3]
Max grid dimensions (XYZ).
Definition: hip_runtime_api.h:91
@ hipDeviceAttributeComputeMode
Compute mode that device is currently in.
Definition: hip_runtime_api.h:309
@ hipDeviceAttributePciDeviceId
PCI Device ID.
Definition: hip_runtime_api.h:319
size_t maxSharedMemoryPerMultiProcessor
Maximum Shared Memory Per Multiprocessor.
Definition: hip_runtime_api.h:113
int clockInstructionRate
Definition: hip_runtime_api.h:106
unsigned int * hdpMemFlushCntl
Address of the HDP_MEM_COHERENCY_FLUSH_CNTL register.
Definition: hip_runtime_api.h:124
Definition: hip_runtime_api.h:161
@ hipDeviceAttributeTotalConstantMemory
Constant memory size in bytes.
Definition: hip_runtime_api.h:299
unsigned hasWarpShuffle
Warp shuffle operations. (__shfl_*).
Definition: hip_runtime_api.h:62
int memoryBusWidth
Global memory bus width in bits.
Definition: hip_runtime_api.h:94
unsigned hasWarpVote
Warp vote instructions (__any, __all).
Definition: hip_runtime_api.h:60
char name[256]
Device name.
Definition: hip_runtime_api.h:84
unsigned hasGlobalFloatAtomicExch
32-bit float atomic exch for global memory.
Definition: hip_runtime_api.h:47
int concurrentKernels
Device can possibly execute multiple kernels concurrently.
Definition: hip_runtime_api.h:109
unsigned hasWarpBallot
Warp ballot instructions (__ballot).
Definition: hip_runtime_api.h:61
size_t totalGlobalMem
Size of global memory region (in bytes).
Definition: hip_runtime_api.h:85
@ hipDeviceAttributeTextureAlignment
Alignment requirement for textures.
Definition: hip_runtime_api.h:337
#define hipHostMallocDefault
Flags that can be used with hipHostMalloc.
Definition: hip_runtime_api.h:175
char gcnArchName[256]
AMD GCN Arch Name.
Definition: hip_runtime_api.h:117
@ hipDeviceAttributeCanMapHostMemory
Device can map host memory into device address space.
Definition: hip_runtime_api.h:340
int maxThreadsDim[3]
Max number of threads in each dimension (XYZ) of a block.
Definition: hip_runtime_api.h:90
int cooperativeMultiDeviceLaunch
HIP device supports cooperative launch on multiple devices.
Definition: hip_runtime_api.h:120
unsigned has3dGrid
Grid and group dims are 3D (rather than 2D).
Definition: hip_runtime_api.h:71
@ hipDeviceAttributeMaxTexture1DWidth
Maximum number of elements in 1D images.
Definition: hip_runtime_api.h:326
@ hipDeviceAttributeCooperativeLaunch
Support cooperative launch.
Definition: hip_runtime_api.h:324
@ hipDeviceAttributeMultiprocessorCount
Number of multiprocessors on the device.
Definition: hip_runtime_api.h:308
int pciDeviceID
PCI Device ID.
Definition: hip_runtime_api.h:112
int memoryClockRate
Max global memory clock frequency in kHz.
Definition: hip_runtime_api.h:93
hipErrorCooperativeLaunchTooLarge
Definition: hip_runtime_api.h:268
int warpSize
Warp size.
Definition: hip_runtime_api.h:88
hipErrorAssert
Produced when the kernel calls assert.
Definition: hip_runtime_api.h:261
int cooperativeMultiDeviceUnmatchedFunc
Definition: hip_runtime_api.h:132
int cooperativeMultiDeviceUnmatchedGridDim
Definition: hip_runtime_api.h:134
unsigned hasFloatAtomicAdd
32-bit float atomic add in global and shared memory.
Definition: hip_runtime_api.h:50
int cooperativeLaunch
HIP device supports cooperative launch.
Definition: hip_runtime_api.h:119
unsigned hasSharedFloatAtomicExch
32-bit float atomic exch for shared memory.
Definition: hip_runtime_api.h:49
@ hipDeviceAttributeCooperativeMultiDeviceUnmatchedSharedMem
Definition: hip_runtime_api.h:349
int multiProcessorCount
Number of multi-processors (compute units).
Definition: hip_runtime_api.h:102
int integrated
APU vs dGPU.
Definition: hip_runtime_api.h:118
int ECCEnabled
Device has ECC support enabled.
Definition: hip_runtime_api.h:130
size_t totalConstMem
Size of constant memory region (in bytes).
Definition: hip_runtime_api.h:95
int maxTexture2D[2]
Maximum dimensions (width, height) of 2D images, in image elements.
Definition: hip_runtime_api.h:122
#define hipMemAttachGlobal
Memory can be accessed by any stream on any device.
Definition: hip_runtime_api.h:191
hipErrorHostMemoryAlreadyRegistered
Produced when trying to lock a page-locked memory.
Definition: hip_runtime_api.h:262
hipDeviceAttribute_t
Definition: hip_runtime_api.h:289
hipErrorMemoryAllocation
Memory allocation error.
Definition: hip_runtime_api.h:201
hipErrorLaunchFailure
An exception occurred on the device while executing a kernel.
Definition: hip_runtime_api.h:266
@ hipDeviceAttributeConcurrentKernels
Definition: hip_runtime_api.h:316
int cooperativeMultiDeviceUnmatchedSharedMem
Definition: hip_runtime_api.h:138
hipErrorNotSupported
Produced when the hip API is not supported/implemented.
Definition: hip_runtime_api.h:272
hipErrorLaunchOutOfResources
Out of resources error.
Definition: hip_runtime_api.h:254
hipErrorInvalidResourceHandle
Resource handle (hipEvent_t or hipStream_t) invalid.
Definition: hip_runtime_api.h:247
hipMemoryType
Definition: hip_runtime_api.h:148
@ hipDeviceAttributeMaxTexture2DWidth
Maximum dimension width of 2D images in image elements.
Definition: hip_runtime_api.h:327
int pciDomainID
PCI Domain ID.
Definition: hip_runtime_api.h:110
@ hipDeviceAttributeCooperativeMultiDeviceUnmatchedFunc
Definition: hip_runtime_api.h:343
@ hipDeviceAttributeHdpMemFlushCntl
Address of the HDP_MEM_COHERENCY_FLUSH_CNTL register.
Definition: hip_runtime_api.h:333
@ hipDeviceAttributeEccEnabled
Device has ECC support enabled.
Definition: hip_runtime_api.h:341
struct hipDeviceProp_t hipDeviceProp_t
@ hipDeviceAttributeMaxSharedMemoryPerMultiprocessor
Definition: hip_runtime_api.h:320
hipErrorPeerAccessAlreadyEnabled
Peer access was already enabled from the current device.
Definition: hip_runtime_api.h:256