24 #ifndef HIP_INCLUDE_HIP_HCC_DETAIL_HIP_RUNTIME_API_H 25 #define HIP_INCLUDE_HIP_HCC_DETAIL_HIP_RUNTIME_API_H 34 #ifndef GENERIC_GRID_LAUNCH 35 #define GENERIC_GRID_LAUNCH 1 43 #include <hip/hcc_detail/driver_types.h> 47 #if !__HIP_VDI__ && defined(__cplusplus) 49 #include <hip/hcc_detail/program_state.hpp> 53 #define DEPRECATED(msg) __declspec(deprecated(msg)) 54 #else // !defined(_MSC_VER) 55 #define DEPRECATED(msg) __attribute__ ((deprecated(msg))) 56 #endif // !defined(_MSC_VER) 58 #define DEPRECATED_MSG "This API is marked as deprecated and may not be supported in future releases.For more details please refer https://github.com/ROCm-Developer-Tools/HIP/tree/master/docs/markdown/hip_deprecated_api_list" 60 #if defined(__HCC__) && (__hcc_workweek__ < 16155) 61 #error("This version of HIP requires a newer version of HCC."); 64 #define HIP_LAUNCH_PARAM_BUFFER_POINTER ((void*)0x01) 65 #define HIP_LAUNCH_PARAM_BUFFER_SIZE ((void*)0x02) 66 #define HIP_LAUNCH_PARAM_END ((void*)0x03) 76 #pragma GCC visibility push (default) 82 hipError_t hip_init();
96 typedef int hipDevice_t;
102 #define hipIpcMemLazyEnablePeerAccess 0 104 #define HIP_IPC_HANDLE_SIZE 64 107 char reserved[HIP_IPC_HANDLE_SIZE];
111 struct ihipIpcEventHandle_t;
112 typedef struct ihipIpcEventHandle_t* hipIpcEventHandle_t;
124 size_t constSizeBytes;
125 size_t localSizeBytes;
126 int maxDynamicSharedSizeBytes;
127 int maxThreadsPerBlock;
129 int preferredShmemCarveout;
131 size_t sharedSizeBytes;
137 hipLimitMallocHeapSize = 0x02,
144 #define hipStreamDefault \ 147 #define hipStreamNonBlocking 0x01 151 #define hipEventDefault 0x0 152 #define hipEventBlockingSync \ 154 #define hipEventDisableTiming \ 156 #define hipEventInterprocess 0x4 157 #define hipEventReleaseToDevice \ 159 #define hipEventReleaseToSystem \ 168 #define hipHostMallocDefault 0x0 169 #define hipHostMallocPortable 0x1 170 #define hipHostMallocMapped \ 172 #define hipHostMallocWriteCombined 0x4 174 #define hipHostMallocCoherent \ 176 #define hipHostMallocNonCoherent \ 181 #define hipMemAttachGlobal 0x0 182 #define hipMemAttachHost 0x1 184 #define hipDeviceMallocDefault 0x0 185 #define hipDeviceMallocFinegrained 0x1 187 #define hipHostRegisterDefault 0x0 189 #define hipHostRegisterPortable 0x1 190 #define hipHostRegisterMapped \ 192 #define hipHostRegisterIoMemory 0x4 194 #define hipExtHostRegisterCoarseGrained 0x8 196 #define hipDeviceScheduleAuto 0x0 197 #define hipDeviceScheduleSpin \ 199 #define hipDeviceScheduleYield \ 202 #define hipDeviceScheduleBlockingSync 0x4 204 #define hipDeviceScheduleMask 0x7 206 #define hipDeviceMapHost 0x8 207 #define hipDeviceLmemResizeToMax 0x16 209 #define hipArrayDefault 0x00 210 #define hipArrayLayered 0x01 211 #define hipArraySurfaceLoadStore 0x02 212 #define hipArrayCubemap 0x04 213 #define hipArrayTextureGather 0x08 220 typedef enum hipJitOption {
221 hipJitOptionMaxRegisters = 0,
222 hipJitOptionThreadsPerBlock,
223 hipJitOptionWallTime,
224 hipJitOptionInfoLogBuffer,
225 hipJitOptionInfoLogBufferSizeBytes,
226 hipJitOptionErrorLogBuffer,
227 hipJitOptionErrorLogBufferSizeBytes,
228 hipJitOptionOptimizationLevel,
229 hipJitOptionTargetFromContext,
231 hipJitOptionFallbackStrategy,
232 hipJitOptionGenerateDebugInfo,
233 hipJitOptionLogVerbose,
234 hipJitOptionGenerateLineInfo,
235 hipJitOptionCacheMode,
237 hipJitOptionFastCompile,
238 hipJitOptionNumOptions
/**
 * Constructor: initializes the members x, y and z from the three arguments.
 * Every argument that is omitted defaults to 1.
 * Declared with the __host__ and __device__ qualifiers.
 * The ';' after the empty body is a redundant empty declaration.
 */
274 __host__ __device__
dim3(uint32_t _x = 1, uint32_t _y = 1, uint32_t _z = 1) : x(_x), y(_y), z(_z){};
805 hipError_t
hipStreamWaitEvent(hipStream_t stream, hipEvent_t event,
unsigned int flags);
946 hipError_t
hipEventRecord(hipEvent_t event, hipStream_t stream = NULL);
1085 hipError_t
hipMalloc(
void** ptr,
size_t size);
1115 DEPRECATED(
"use hipHostMalloc instead")
/**
 * Allocate device-accessible, page-locked host memory.
 *
 * ptr   - pointer-to-pointer argument; presumably receives the allocation (TODO confirm).
 * size  - requested size; presumably in bytes (TODO confirm).
 * flags - presumably a combination of the hipHostMalloc* flag macros (TODO confirm).
 *
 * Returns a hipError_t status code.
 */
1146 hipError_t
hipHostMalloc(
void** ptr,
size_t size,
unsigned int flags);
1157 hipError_t
hipMallocManaged(
void** devPtr,
size_t size,
unsigned int flags __dparm(0));
/**
 * Allocate device-accessible, page-locked host memory [Deprecated].
 *
 * Takes the same parameter list as hipHostMalloc (ptr, size, flags).
 * NOTE(review): this prototype carries no DEPRECATED(...) marker in the
 * visible text even though the API is described as deprecated - confirm.
 *
 * Returns a hipError_t status code.
 */
1173 hipError_t
hipHostAlloc(
void** ptr,
size_t size,
unsigned int flags);
1235 hipError_t
hipHostRegister(
void* hostPtr,
size_t sizeBytes,
unsigned int flags);
1266 hipError_t
hipMallocPitch(
void** ptr,
size_t* pitch,
size_t width,
size_t height);
1290 hipError_t
hipMemAllocPitch(hipDeviceptr_t* dptr,
size_t* pitch,
size_t widthInBytes,
size_t height,
unsigned int elementSizeBytes);
1305 hipError_t
hipFree(
void* ptr);
1362 hipError_t
hipMemcpy(
void* dst, const
void* src,
size_t sizeBytes, hipMemcpyKind kind);
/**
 * Copy data from host to device.
 *
 * dst       - destination, typed hipDeviceptr_t.
 * src       - source pointer; note it is declared void*, not const void*.
 * sizeBytes - presumably the number of bytes to copy (TODO confirm).
 *
 * Returns a hipError_t status code.
 */
1381 hipError_t
hipMemcpyHtoD(hipDeviceptr_t dst,
void* src,
size_t sizeBytes);
1400 hipError_t
hipMemcpyDtoH(
void* dst, hipDeviceptr_t src,
size_t sizeBytes);
1419 hipError_t
hipMemcpyDtoD(hipDeviceptr_t dst, hipDeviceptr_t src,
size_t sizeBytes);
1438 hipError_t
hipMemcpyHtoDAsync(hipDeviceptr_t dst,
void* src,
size_t sizeBytes, hipStream_t stream);
1457 hipError_t
hipMemcpyDtoHAsync(
void* dst, hipDeviceptr_t src,
size_t sizeBytes, hipStream_t stream);
1476 hipError_t
hipMemcpyDtoDAsync(hipDeviceptr_t dst, hipDeviceptr_t src,
size_t sizeBytes,
1477 hipStream_t stream);
1481 hipModule_t hmod,
const char* name);
1483 hipError_t hipGetSymbolAddress(
void** devPtr,
const void* symbolName);
1484 hipError_t hipGetSymbolSize(
size_t* size,
const void* symbolName);
1485 hipError_t hipMemcpyToSymbol(
const void* symbolName,
const void* src,
1486 size_t sizeBytes,
size_t offset __dparm(0),
1487 hipMemcpyKind kind __dparm(hipMemcpyHostToDevice));
1488 hipError_t hipMemcpyToSymbolAsync(
const void* symbolName,
const void* src,
1489 size_t sizeBytes,
size_t offset,
1490 hipMemcpyKind kind, hipStream_t stream __dparm(0));
1491 hipError_t hipMemcpyFromSymbol(
void* dst,
const void* symbolName,
1492 size_t sizeBytes,
size_t offset __dparm(0),
1493 hipMemcpyKind kind __dparm(hipMemcpyDeviceToHost));
1494 hipError_t hipMemcpyFromSymbolAsync(
void* dst,
const void* symbolName,
1495 size_t sizeBytes,
size_t offset,
1497 hipStream_t stream __dparm(0));
1501 #ifdef __cplusplus //Start : Not supported in gcc 1504 __attribute__((visibility(
"hidden")))
1505 hipError_t read_agent_global_from_process(hipDeviceptr_t* dptr,
size_t* bytes,
1521 __attribute__((visibility("hidden")))
1522 hipError_t hipGetSymbolAddress(
void** devPtr, const
void* symbolName) {
1524 hip_impl::hip_init();
1526 return hip_impl::read_agent_global_from_process(devPtr, &size, (
const char*)symbolName);
1541 __attribute__((visibility(
"hidden")))
1542 hipError_t hipGetSymbolSize(
size_t* size, const
void* symbolName) {
1544 hip_impl::hip_init();
1545 void* devPtr =
nullptr;
1546 return hip_impl::read_agent_global_from_process(&devPtr, size, (
const char*)symbolName);
1548 #endif // End : Not supported in gcc 1550 #if defined(__cplusplus) 1556 hipError_t hipMemcpyToSymbol(
void*,
const void*,
size_t,
size_t, hipMemcpyKind,
1561 #if defined(__cplusplus) 1590 __attribute__((visibility(
"hidden")))
1591 hipError_t hipMemcpyToSymbol(const
void* symbolName, const
void* src,
1592 size_t sizeBytes,
size_t offset __dparm(0),
1593 hipMemcpyKind kind __dparm(hipMemcpyHostToDevice)) {
1594 if (!symbolName)
return hipErrorInvalidSymbol;
1596 hipDeviceptr_t dst = NULL;
1597 hipGetSymbolAddress(&dst, (
const char*)symbolName);
1599 return hip_impl::hipMemcpyToSymbol(dst, src, sizeBytes, offset, kind,
1600 (
const char*)symbolName);
1604 #if defined(__cplusplus) 1610 hipError_t hipMemcpyToSymbolAsync(
void*,
const void*,
size_t,
size_t,
1611 hipMemcpyKind, hipStream_t,
const char*);
1612 hipError_t hipMemcpyFromSymbol(
void*,
const void*,
size_t,
size_t,
1613 hipMemcpyKind,
const char*);
1614 hipError_t hipMemcpyFromSymbolAsync(
void*,
const void*,
size_t,
size_t,
1615 hipMemcpyKind, hipStream_t,
const char*);
1619 #if defined(__cplusplus) 1649 #ifdef __cplusplus //Start : Not supported in gcc 1651 __attribute__((visibility(
"hidden")))
1652 hipError_t hipMemcpyToSymbolAsync(const
void* symbolName, const
void* src,
1653 size_t sizeBytes,
size_t offset,
1654 hipMemcpyKind kind, hipStream_t stream __dparm(0)) {
1655 if (!symbolName)
return hipErrorInvalidSymbol;
1657 hipDeviceptr_t dst = NULL;
1658 hipGetSymbolAddress(&dst, symbolName);
1660 return hip_impl::hipMemcpyToSymbolAsync(dst, src, sizeBytes, offset, kind,
1662 (
const char*)symbolName);
1666 __attribute__((visibility(
"hidden")))
1667 hipError_t hipMemcpyFromSymbol(
void* dst, const
void* symbolName,
1668 size_t sizeBytes,
size_t offset __dparm(0),
1669 hipMemcpyKind kind __dparm(hipMemcpyDeviceToHost)) {
1670 if (!symbolName)
return hipErrorInvalidSymbol;
1672 hipDeviceptr_t src = NULL;
1673 hipGetSymbolAddress(&src, symbolName);
1675 return hip_impl::hipMemcpyFromSymbol(dst, src, sizeBytes, offset, kind,
1676 (
const char*)symbolName);
1680 __attribute__((visibility(
"hidden")))
1681 hipError_t hipMemcpyFromSymbolAsync(
void* dst, const
void* symbolName,
1682 size_t sizeBytes,
size_t offset,
1684 hipStream_t stream __dparm(0)) {
1685 if (!symbolName)
return hipErrorInvalidSymbol;
1687 hipDeviceptr_t src = NULL;
1688 hipGetSymbolAddress(&src, symbolName);
1690 return hip_impl::hipMemcpyFromSymbolAsync(dst, src, sizeBytes, offset, kind,
1692 (
const char*)symbolName);
1694 #endif // End : Not supported in gcc 1696 #endif // __HIP_VDI__ 1725 hipError_t
hipMemcpyAsync(
void* dst,
const void* src,
size_t sizeBytes, hipMemcpyKind kind,
1726 hipStream_t stream __dparm(0));
/**
 * Fills the first sizeBytes bytes of the memory area pointed to by dst
 * with a constant byte value.
 *
 * value is declared int; presumably only its low byte is used (TODO confirm).
 *
 * Returns a hipError_t status code.
 */
1737 hipError_t
hipMemset(
void* dst,
int value,
size_t sizeBytes);
1748 hipError_t
hipMemsetD8(hipDeviceptr_t dest,
unsigned char value,
size_t count);
1765 hipError_t
hipMemsetD8Async(hipDeviceptr_t dest,
unsigned char value,
size_t count, hipStream_t stream __dparm(0));
/**
 * Fills the memory area pointed to by dest with the constant short value
 * `value`.
 *
 * NOTE(review): the generated description speaks of "sizeBytes bytes" but the
 * parameter is named count; whether count is in bytes or in 16-bit elements
 * cannot be determined from this declaration - confirm.
 *
 * Returns a hipError_t status code.
 */
1776 hipError_t
hipMemsetD16(hipDeviceptr_t dest,
unsigned short value,
size_t count);
/**
 * Fills the memory area pointed to by dest with the constant short value
 * `value`; takes an additional stream argument.
 *
 * NOTE(review): unit of count (bytes vs. 16-bit elements) is not visible
 * here - confirm. __dparm(0) presumably gives stream a default of 0; the
 * macro definition is not visible in this view.
 *
 * Returns a hipError_t status code.
 */
1793 hipError_t
hipMemsetD16Async(hipDeviceptr_t dest,
unsigned short value,
size_t count, hipStream_t stream __dparm(0));
1804 hipError_t
hipMemsetD32(hipDeviceptr_t dest,
int value,
size_t count);
/**
 * Fills the first sizeBytes bytes of the memory area pointed to by dst
 * with a constant byte value; takes an additional stream argument.
 *
 * __dparm(0) presumably gives stream a default of 0 - the macro definition
 * is not visible in this view (TODO confirm).
 *
 * Returns a hipError_t status code.
 */
1821 hipError_t
hipMemsetAsync(
void* dst,
int value,
size_t sizeBytes, hipStream_t stream __dparm(0));
1839 hipStream_t stream __dparm(0));
1852 hipError_t
hipMemset2D(
void* dst,
size_t pitch,
int value,
size_t width,
size_t height);
/**
 * Fills asynchronously the memory area pointed to by dst with the constant
 * value.
 *
 * pitch, width, height - presumably describe the 2D region (row pitch and
 * extent); units are not visible here (TODO confirm).
 * stream - __dparm(0) presumably supplies a default of 0 (TODO confirm).
 *
 * Returns a hipError_t status code.
 */
1866 hipError_t
hipMemset2DAsync(
void* dst,
size_t pitch,
int value,
size_t width,
size_t height,hipStream_t stream __dparm(0));
1901 hipError_t hipMemPtrGetInfo(
void* ptr,
size_t* size);
1917 size_t height __dparm(0),
unsigned int flags __dparm(
hipArrayDefault));
1947 struct hipExtent extent,
unsigned int flags);
/**
 * Copies data between host and device.
 *
 * dst / dpitch - destination pointer and, presumably, its row pitch (TODO confirm).
 * src / spitch - source pointer and, presumably, its row pitch (TODO confirm).
 * width, height - presumably the extent of the 2D region to copy (TODO confirm).
 * kind - a hipMemcpyKind value; presumably selects the copy direction (TODO confirm).
 *
 * Returns a hipError_t status code.
 */
1964 hipError_t
hipMemcpy2D(
void* dst,
size_t dpitch,
const void* src,
size_t spitch,
size_t width,
1965 size_t height, hipMemcpyKind kind);
/**
 * Copies data between host and device; same parameter list as hipMemcpy2D
 * plus a trailing stream argument.
 *
 * stream - __dparm(0) presumably supplies a default of 0; the macro
 * definition is not visible in this view (TODO confirm).
 *
 * Returns a hipError_t status code.
 */
2007 hipError_t
hipMemcpy2DAsync(
void* dst,
size_t dpitch,
const void* src,
size_t spitch,
size_t width,
2008 size_t height, hipMemcpyKind kind, hipStream_t stream __dparm(0));
2027 size_t spitch,
size_t width,
size_t height, hipMemcpyKind kind);
2046 size_t count, hipMemcpyKind kind);
2064 size_t count, hipMemcpyKind kind);
2241 #ifndef USE_PEER_NON_UNIFIED 2242 #define USE_PEER_NON_UNIFIED 1 2245 #if USE_PEER_NON_UNIFIED == 1 2257 hipError_t
hipMemcpyPeer(
void* dst,
int dstDeviceId,
const void* src,
int srcDeviceId,
2272 hipError_t
hipMemcpyPeerAsync(
void* dst,
int dstDeviceId,
const void* src,
int srcDevice,
2273 size_t sizeBytes, hipStream_t stream __dparm(0));
2297 hipError_t
hipInit(
unsigned int flags);
/**
 * Create a context and set it as the current/default context.
 *
 * Marked deprecated through DEPRECATED(DEPRECATED_MSG).
 *
 * ctx    - pointer argument; presumably receives the new context (TODO confirm).
 * flags  - creation flags; accepted values are not visible here.
 * device - a hipDevice_t (an int typedef in this header).
 *
 * Returns a hipError_t status code.
 */
2319 DEPRECATED(DEPRECATED_MSG)
2320 hipError_t
hipCtxCreate(hipCtx_t* ctx,
unsigned int flags, hipDevice_t device);
2332 DEPRECATED(DEPRECATED_MSG)
2345 DEPRECATED(DEPRECATED_MSG)
2358 DEPRECATED(DEPRECATED_MSG)
2371 DEPRECATED(DEPRECATED_MSG)
2384 DEPRECATED(DEPRECATED_MSG)
2398 DEPRECATED(DEPRECATED_MSG)
2418 DEPRECATED(DEPRECATED_MSG)
2434 DEPRECATED(DEPRECATED_MSG)
2450 DEPRECATED(DEPRECATED_MSG)
2466 DEPRECATED(DEPRECATED_MSG)
2482 DEPRECATED(DEPRECATED_MSG)
2496 DEPRECATED(DEPRECATED_MSG)
2509 DEPRECATED(DEPRECATED_MSG)
2531 DEPRECATED(DEPRECATED_MSG)
2550 DEPRECATED(DEPRECATED_MSG)
2631 hipError_t
hipDeviceGet(hipDevice_t* device,
int ordinal);
/**
 * Loads a code object from file into a hipModule_t.
 *
 * module - pointer argument; presumably receives the loaded module (TODO confirm).
 * fname  - presumably the path of the code-object file (TODO confirm).
 *
 * Returns a hipError_t status code.
 */
2725 hipError_t
hipModuleLoad(hipModule_t* module, const
char* fname);
/**
 * Extracts the function named kname if it is present in module.
 *
 * function - pointer argument; presumably receives the function handle (TODO confirm).
 * module   - the module to look in.
 * kname    - name of the function to look up.
 *
 * Returns a hipError_t status code.
 */
2749 hipError_t
hipModuleGetFunction(hipFunction_t* function, hipModule_t module, const
char* kname);
/**
 * Find out a specific attribute for a given function.
 *
 * value  - pointer argument; presumably receives the attribute value (TODO confirm).
 * attrib - which attribute to query (hipFunction_attribute).
 * hfunc  - the function to query.
 *
 * Returns a hipError_t status code.
 */
2771 hipError_t
hipFuncGetAttribute(
int* value, hipFunction_attribute attrib, hipFunction_t hfunc);
2774 #if defined(__cplusplus) 2780 class agent_globals_impl;
2781 class agent_globals {
2785 agent_globals(
const agent_globals&) =
delete;
2787 hipError_t read_agent_global_from_module(hipDeviceptr_t* dptr,
size_t* bytes,
2788 hipModule_t hmod,
const char* name);
2789 hipError_t read_agent_global_from_process(hipDeviceptr_t* dptr,
size_t* bytes,
2792 agent_globals_impl* impl;
2796 __attribute__((visibility(
"hidden")))
2797 agent_globals& get_agent_globals() {
2798 static agent_globals ag;
2804 __attribute__((visibility(
"hidden")))
2805 hipError_t read_agent_global_from_process(hipDeviceptr_t* dptr,
size_t* bytes,
2807 return get_agent_globals().read_agent_global_from_process(dptr, bytes, name);
2812 #if defined(__cplusplus) 2827 hipModule_t hmod,
const char* name);
2828 #endif // __HIP_VDI__ 2830 hipError_t hipModuleGetTexRef(
textureReference** texRef, hipModule_t hmod,
const char* name);
/**
 * Builds a module from a code object that resides in host memory; image is
 * a pointer to that location.
 *
 * module       - pointer argument; presumably receives the built module (TODO confirm).
 * numOptions   - presumably the number of entries in options/optionValues (TODO confirm).
 * options      - array of hipJitOption values.
 * optionValues - presumably one value per entry of options (TODO confirm).
 *
 * Returns a hipError_t status code.
 */
2855 hipError_t
hipModuleLoadDataEx(hipModule_t* module,
const void* image,
unsigned int numOptions,
2856 hipJitOption* options,
void** optionValues);
2883 unsigned int gridDimZ,
unsigned int blockDimX,
2884 unsigned int blockDimY,
unsigned int blockDimZ,
2885 unsigned int sharedMemBytes, hipStream_t stream,
2886 void** kernelParams,
void** extra);
2905 void** kernelParams,
unsigned int sharedMemBytes,
2906 hipStream_t stream);
2919 int numDevices,
unsigned int flags);
2933 hipFunction_t f,
size_t dynSharedMemPerBlk,
2934 uint32_t blockSizeLimit);
2945 uint32_t* numBlocks, hipFunction_t f, uint32_t blockSize,
size_t dynSharedMemPerBlk);
2957 uint32_t* numBlocks, hipFunction_t f, uint32_t blockSize,
size_t dynSharedMemPerBlk,
unsigned int flags);
2959 #if defined(__clang__) && defined(__HIP__) 2971 hipError_t hipExtLaunchMultiKernelMultiDevice(
hipLaunchParams* launchParamsList,
2972 int numDevices,
unsigned int flags);
3000 DEPRECATED(
"use roctracer/rocTX instead")
3009 DEPRECATED("use roctracer/rocTX instead")
/**
 * Configure a kernel launch.
 *
 * gridDim, blockDim - launch dimensions, passed as dim3 values.
 * sharedMem, stream - both carry __dparm(0), which presumably supplies a
 * default of 0; the macro definition is not visible in this view (TODO confirm).
 *
 * Returns a hipError_t status code.
 */
3131 hipError_t
hipConfigureCall(
dim3 gridDim,
dim3 blockDim,
size_t sharedMem __dparm(0), hipStream_t stream __dparm(0));
3174 size_t sharedMem __dparm(0),
3175 hipStream_t stream __dparm(0));
3193 hipStream_t *stream);
3215 size_t sharedMemBytes __dparm(0),
3216 hipStream_t stream __dparm(0));
3227 #if defined(__cplusplus) && !defined(__HCC__) && defined(__clang__) && defined(__HIP__) 3228 template <
typename F>
3230 uint32_t* numBlocks, F func, uint32_t blockSize,
size_t dynSharedMemPerBlk) {
3232 dynSharedMemPerBlk);
3234 template <
typename F>
3236 uint32_t* numBlocks, F func, uint32_t blockSize,
size_t dynSharedMemPerBlk,
unsigned int flags) {
3238 numBlocks, (hipFunction_t)func, blockSize, dynSharedMemPerBlk, flags);
3240 #endif // defined(__cplusplus) && !defined(__HCC__) && defined(__clang__) && defined(__HIP__) 3243 #include <hip/hcc_detail/hip_prof_str.h> 3253 hipError_t hipRemoveApiCallback(uint32_t
id);
3254 hipError_t hipRegisterActivityCallback(uint32_t
id,
void* fun,
void* arg);
3255 hipError_t hipRemoveActivityCallback(uint32_t
id);
3256 const char* hipApiName(uint32_t
id);
3257 const char* hipKernelNameRef(
const hipFunction_t f);
3266 hipError_t hipBindTexture(
size_t* offset,
textureReference* tex,
const void* devPtr,
3269 hipError_t ihipBindTextureImpl(
TlsData *tls,
int dim,
enum hipTextureReadMode readMode,
size_t* offset,
3288 template <
class T,
int dim, enum hipTextureReadMode readMode>
3289 hipError_t hipBindTexture(
size_t* offset,
struct texture<T, dim, readMode>& tex,
const void* devPtr,
3291 return ihipBindTextureImpl(
nullptr, dim, readMode, offset, devPtr, &desc, size, &tex);
3308 template <
class T,
int dim, enum hipTextureReadMode readMode>
3309 hipError_t hipBindTexture(
size_t* offset,
struct texture<T, dim, readMode>& tex,
const void* devPtr,
3310 size_t size = UINT_MAX) {
3311 return ihipBindTextureImpl(
nullptr, dim, readMode, offset, devPtr, &(tex.channelDesc), size, &tex);
3315 hipError_t hipBindTexture2D(
size_t* offset,
textureReference* tex,
const void* devPtr,
3319 hipError_t ihipBindTexture2DImpl(
int dim,
enum hipTextureReadMode readMode,
size_t* offset,
3323 template <
class T,
int dim, enum hipTextureReadMode readMode>
3324 hipError_t hipBindTexture2D(
size_t* offset,
struct texture<T, dim, readMode>& tex,
3325 const void* devPtr,
size_t width,
size_t height,
size_t pitch) {
3326 return ihipBindTexture2DImpl(dim, readMode, offset, devPtr, &(tex.channelDesc), width, height,
3330 template <
class T,
int dim, enum hipTextureReadMode readMode>
3331 hipError_t hipBindTexture2D(
size_t* offset,
struct texture<T, dim, readMode>& tex,
3333 size_t width,
size_t height,
size_t pitch) {
3334 return ihipBindTexture2DImpl(dim, readMode, offset, devPtr, &desc, width, height, &tex);
3341 hipError_t ihipBindTextureToArrayImpl(
TlsData *tls,
int dim,
enum hipTextureReadMode readMode,
3346 template <
class T,
int dim, enum hipTextureReadMode readMode>
3347 hipError_t hipBindTextureToArray(
struct texture<T, dim, readMode>& tex,
hipArray_const_t array) {
3348 return ihipBindTextureToArrayImpl(
nullptr, dim, readMode, array, tex.channelDesc, &tex);
3351 template <
class T,
int dim, enum hipTextureReadMode readMode>
3352 hipError_t hipBindTextureToArray(
struct texture<T, dim, readMode>& tex,
hipArray_const_t array,
3354 return ihipBindTextureToArrayImpl(
nullptr, dim, readMode, array, desc, &tex);
3357 template <
class T,
int dim, enum hipTextureReadMode readMode>
3358 inline static hipError_t hipBindTextureToArray(
struct texture<T, dim, readMode> *tex,
3361 return ihipBindTextureToArrayImpl(
nullptr, dim, readMode, array, *desc, tex);
3369 template <
class T,
int dim, enum hipTextureReadMode readMode>
3370 hipError_t hipBindTextureToMipmappedArray(
const texture<T, dim, readMode>& tex,
3375 template <
class T,
int dim, enum hipTextureReadMode readMode>
3376 hipError_t hipBindTextureToMipmappedArray(
const texture<T, dim, readMode>& tex,
3385 void** kernelParams,
unsigned int sharedMemBytes, hipStream_t stream) {
3387 blockDim, kernelParams, sharedMemBytes, stream);
3392 unsigned int numDevices,
unsigned int flags = 0) {
3396 #if defined(__clang__) && defined(__HIP__) 3398 inline hipError_t hipExtLaunchMultiKernelMultiDevice(
hipLaunchParams* launchParamsList,
3399 unsigned int numDevices,
unsigned int flags = 0) {
3400 return hipExtLaunchMultiKernelMultiDevice(launchParamsList, numDevices, flags);
3414 extern hipError_t ihipUnbindTextureImpl(
const hipTextureObject_t& textureObject);
3416 template <
class T,
int dim, enum hipTextureReadMode readMode>
3417 hipError_t hipUnbindTexture(
struct texture<T, dim, readMode>& tex) {
3418 return ihipUnbindTextureImpl(tex.textureObject);
3422 hipError_t hipGetTextureAlignmentOffset(
size_t* offset,
const textureReference* texref);
3423 hipError_t hipGetTextureReference(
const textureReference** texref,
const void* symbol);
3425 hipError_t hipCreateTextureObject(hipTextureObject_t* pTexObject,
const hipResourceDesc* pResDesc,
3429 hipError_t hipDestroyTextureObject(hipTextureObject_t textureObject);
3432 hipTextureObject_t textureObject);
3434 hipTextureObject_t textureObject);
3435 hipError_t hipGetTextureObjectTextureDesc(
hipTextureDesc* pTexDesc,
3436 hipTextureObject_t textureObject);
3441 hipError_t hipTexRefSetAddressMode(
textureReference* tex,
int dim, hipTextureAddressMode am);
3443 hipError_t hipTexRefGetAddressMode(hipTextureAddressMode* am,
textureReference tex,
int dim);
3445 hipError_t hipTexRefSetFilterMode(
textureReference* tex, hipTextureFilterMode fm);
3449 hipError_t hipTexRefSetFormat(
textureReference* tex, hipArray_Format fmt,
int NumPackedComponents);
3451 hipError_t hipTexRefSetAddress(
size_t* offset,
textureReference* tex, hipDeviceptr_t devPtr,
3454 hipError_t hipTexRefGetAddress(hipDeviceptr_t* dev_ptr,
textureReference tex);
3457 hipDeviceptr_t devPtr,
size_t pitch);
3472 #pragma GCC visibility pop hipError_t hipMemcpy2DFromArrayAsync(void *dst, size_t dpitch, hipArray_const_t src, size_t wOffset, size_t hOffset, size_t width, size_t height, hipMemcpyKind kind, hipStream_t stream __dparm(0))
Copies data between host and device asynchronously.
hipError_t hipHostFree(void *ptr)
Free memory allocated by the hcc hip host memory allocation API. This API performs an implicit hipDevi...
Definition: hip_memory.cpp:2005
prefer larger L1 cache and smaller shared memory
Definition: hip_runtime_api.h:248
hipError_t hipModuleGetFunction(hipFunction_t *function, hipModule_t module, const char *kname)
Function with kname will be extracted if present in module.
Definition: hip_module.cpp:1038
hipError_t hipCtxDisablePeerAccess(hipCtx_t peerCtx)
Disable direct access from current context's virtual address space to memory allocations physically l...
Definition: hip_peer.cpp:220
hipError_t hipMemset3D(hipPitchedPtr pitchedDevPtr, int value, hipExtent extent)
Fills synchronously the memory area pointed to by pitchedDevPtr with the constant value...
Definition: hip_memory.cpp:1900
hipError_t hipStreamGetPriority(hipStream_t stream, int *priority)
Query the priority of a stream.
Definition: hip_stream.cpp:237
hipError_t hipDeviceGetCacheConfig(hipFuncCache_t *cacheConfig)
Get the cache configuration for the current device.
Definition: hip_device.cpp:82
hipError_t hipDriverGetVersion(int *driverVersion)
Returns the approximate HIP driver version.
Definition: hip_context.cpp:85
hipError_t hipLaunchKernel(const void *function_address, dim3 numBlocks, dim3 dimBlocks, void **args, size_t sharedMemBytes __dparm(0), hipStream_t stream __dparm(0))
C compliant kernel launch API.
Definition: hip_runtime_api.h:278
hipError_t hipPeekAtLastError(void)
Return last error returned by any HIP runtime API call.
Definition: hip_error.cpp:41
hipError_t hipMemcpyParam2D(const hip_Memcpy2D *pCopy)
Copies memory for 2D arrays.
Definition: hip_memory.cpp:1783
hipError_t hipDevicePrimaryCtxSetFlags(hipDevice_t dev, unsigned int flags)
Set flags for the primary context.
Definition: hip_context.cpp:321
hipError_t hipDevicePrimaryCtxRetain(hipCtx_t *pctx, hipDevice_t dev)
Retain the primary context on the GPU.
Definition: hip_context.cpp:296
hipError_t hipDeviceComputeCapability(int *major, int *minor, hipDevice_t device)
Returns the compute capability of the device.
Definition: hip_device.cpp:417
hipError_t hipDeviceGetByPCIBusId(int *device, const char *pciBusId)
Returns a handle to a compute device.
Definition: hip_device.cpp:475
hipError_t hipExtMallocWithFlags(void **ptr, size_t sizeBytes, unsigned int flags)
Allocate memory on the default accelerator.
Definition: hip_memory.cpp:364
hipError_t hipMemGetAddressRange(hipDeviceptr_t *pbase, size_t *psize, hipDeviceptr_t dptr)
Get information on memory allocations.
Definition: hip_memory.cpp:2046
hipError_t hipMemsetD16Async(hipDeviceptr_t dest, unsigned short value, size_t count, hipStream_t stream __dparm(0))
Fills the first sizeBytes bytes of the memory area pointed to by dest with the constant short value v...
hipError_t hipFreeHost(void *ptr)
Free memory allocated by the hcc hip host memory allocation API. [Deprecated].
Definition: hip_memory.cpp:2016
hipError_t hipMemcpyToArray(hipArray *dst, size_t wOffset, size_t hOffset, const void *src, size_t count, hipMemcpyKind kind)
Copies data between host and device.
Definition: hip_memory.cpp:1192
unsigned long long hipSurfaceObject_t
Definition: hip_surface_types.h:36
hipError_t hipModuleLoadDataEx(hipModule_t *module, const void *image, unsigned int numOptions, hipJitOption *options, void **optionValues)
Builds a module from a code object that resides in host memory. Image is a pointer to that location...
Definition: hip_module.cpp:1206
Definition: driver_types.h:240
hipError_t hipMallocPitch(void **ptr, size_t *pitch, size_t width, size_t height)
Definition: hip_memory.cpp:493
hipError_t hipMemcpy2DAsync(void *dst, size_t dpitch, const void *src, size_t spitch, size_t width, size_t height, hipMemcpyKind kind, hipStream_t stream __dparm(0))
Copies data between host and device.
hipError_t hipMemsetD16(hipDeviceptr_t dest, unsigned short value, size_t count)
Fills the first sizeBytes bytes of the memory area pointed to by dest with the constant short value v...
Definition: hip_memory.cpp:1885
hipError_t hipMemcpy2D(void *dst, size_t dpitch, const void *src, size_t spitch, size_t width, size_t height, hipMemcpyKind kind)
Copies data between host and device.
Definition: hip_memory.cpp:1662
hipError_t hipStreamAddCallback(hipStream_t stream, hipStreamCallback_t callback, void *userData, unsigned int flags)
Adds a callback to be called on the host after all currently enqueued items in the stream have comple...
Definition: hip_stream.cpp:257
hipError_t hipMemcpyFromArray(void *dst, hipArray_const_t srcArray, size_t wOffset, size_t hOffset, size_t count, hipMemcpyKind kind)
Copies data between host and device.
Definition: hip_memory.cpp:1209
uint32_t x
x
Definition: hip_runtime_api.h:270
hipError_t hipMemcpyAtoH(void *dst, hipArray *srcArray, size_t srcOffset, size_t count)
Copies data between host and device.
Definition: hip_memory.cpp:1242
hipError_t hipDeviceEnablePeerAccess(int peerDeviceId, unsigned int flags)
Enable direct access from current device's virtual address space to memory allocations physically loc...
Definition: hip_peer.cpp:193
hipError_t hipCtxPopCurrent(hipCtx_t *ctx)
Pop the current/default context and return the popped context.
Definition: hip_context.cpp:133
const char * hipGetErrorString(hipError_t hipError)
Return handy text string message to explain the error which occurred.
Definition: hip_error.cpp:54
hipError_t hipDeviceGetSharedMemConfig(hipSharedMemConfig *pConfig)
Returns bank width of shared memory for current device.
Definition: hip_device.cpp:123
Definition: hip_runtime_api.h:150
hipError_t hipDeviceGetStreamPriorityRange(int *leastPriority, int *greatestPriority)
Returns numerical values that correspond to the least and greatest stream priority.
Definition: hip_stream.cpp:122
prefer equal size L1 cache and shared memory
Definition: hip_runtime_api.h:249
hipError_t hipHostGetDevicePointer(void **devPtr, void *hstPtr, unsigned int flags)
Get Device pointer from Host Pointer allocated through hipHostMalloc.
hipError_t hipFreeArray(hipArray *array)
Frees an array on the device.
Definition: hip_memory.cpp:2018
hipError_t hipStreamCreateWithPriority(hipStream_t *stream, unsigned int flags, int priority)
Create an asynchronous stream with the specified priority.
Definition: hip_stream.cpp:113
hipError_t hipMemsetAsync(void *dst, int value, size_t sizeBytes, hipStream_t stream __dparm(0))
Fills the first sizeBytes bytes of the memory area pointed to by dst with the constant byte value val...
hipError_t hipEventSynchronize(hipEvent_t event)
Wait for an event to complete.
Definition: hip_event.cpp:143
Definition: driver_types.h:181
hipError_t hipLaunchCooperativeKernel(const void *f, dim3 gridDim, dim3 blockDimX, void **kernelParams, unsigned int sharedMemBytes, hipStream_t stream)
launches kernel f with launch parameters and shared memory on stream with arguments passed to kernelp...
Definition: hip_module.cpp:392
hipError_t hipMemcpyHtoD(hipDeviceptr_t dst, void *src, size_t sizeBytes)
Copy data from Host to Device.
Definition: hip_memory.cpp:1021
hipError_t hipModuleUnload(hipModule_t module)
Frees the module.
Definition: hip_module.cpp:988
Definition: hip_module.cpp:107
hipError_t hipSetDeviceFlags(unsigned flags)
The current device behavior is changed according to the flags passed.
hipError_t hipEventQuery(hipEvent_t event)
Query event status.
Definition: hip_event.cpp:222
hipError_t hipDeviceDisablePeerAccess(int peerDeviceId)
Disable direct access from current device's virtual address space to memory allocations physically lo...
Definition: hip_peer.cpp:186
hipError_t hipCtxGetSharedMemConfig(hipSharedMemConfig *pConfig)
Get Shared memory bank configuration.
Definition: hip_context.cpp:241
hipError_t hipMemcpy2DFromArray(void *dst, size_t dpitch, hipArray_const_t src, size_t wOffset, size_t hOffset, size_t width, size_t height, hipMemcpyKind kind)
Copies data between host and device.
Definition: hip_memory.cpp:1793
hipError_t hipOccupancyMaxActiveBlocksPerMultiprocessor(uint32_t *numBlocks, hipFunction_t f, uint32_t blockSize, size_t dynSharedMemPerBlk)
Returns occupancy for a device function.
Definition: hip_module.cpp:1427
Definition: hip_hcc_internal.h:135
hipError_t hipCtxCreate(hipCtx_t *ctx, unsigned int flags, hipDevice_t device)
Create a context and set it as the current/default context.
Definition: hip_context.cpp:52
#define hipArrayDefault
Default HIP array allocation flag.
Definition: hip_runtime_api.h:209
hipError_t hipMallocArray(hipArray **array, const hipChannelFormatDesc *desc, size_t width, size_t height __dparm(0), unsigned int flags __dparm(hipArrayDefault))
Allocate an array on the device.
hipError_t hipCtxSetSharedMemConfig(hipSharedMemConfig config)
Set Shared memory bank configuration.
Definition: hip_context.cpp:233
hipError_t hipCtxSetCurrent(hipCtx_t ctx)
Set the passed context as current/default.
Definition: hip_context.cpp:178
hipError_t __hipPopCallConfiguration(dim3 *gridDim, dim3 *blockDim, size_t *sharedMem, hipStream_t *stream)
Pop configuration of a kernel launch.
hipError_t hipIpcGetMemHandle(hipIpcMemHandle_t *handle, void *devPtr)
Gets an interprocess memory handle for an existing device memory allocation.
Definition: hip_memory.cpp:2067
Definition: hip_runtime_api.h:121
hipError_t hipMemset2DAsync(void *dst, size_t pitch, int value, size_t width, size_t height, hipStream_t stream __dparm(0))
Fills asynchronously the memory area pointed to by dst with the constant value.
Definition: driver_types.h:115
hipError_t hipHostMalloc(void **ptr, size_t size, unsigned int flags)
Allocate device accessible page locked host memory.
Definition: hip_memory.cpp:402
Definition: hip_hcc_internal.h:898
Definition: texture_types.h:74
hipError_t hipDeviceGetLimit(size_t *pValue, enum hipLimit_t limit)
Get Resource limits of current device.
Definition: hip_device.cpp:94
hipError_t hipModuleLoadData(hipModule_t *module, const void *image)
builds module from code object which resides in host memory. Image is pointer to that location...
Definition: hip_module.cpp:1187
Definition: driver_types.h:77
hipDeviceAttribute_t
Definition: hip_runtime_api.h:274
hipError_t hipEventDestroy(hipEvent_t event)
Destroy the specified event.
Definition: hip_event.cpp:131
hipError_t hipStreamCreateWithFlags(hipStream_t *stream, unsigned int flags)
Create an asynchronous stream.
Definition: hip_stream.cpp:97
hipError_t hipConfigureCall(dim3 gridDim, dim3 blockDim, size_t sharedMem __dparm(0), hipStream_t stream __dparm(0))
Configure a kernel launch.
hipError_t hipChooseDevice(int *device, const hipDeviceProp_t *prop)
Device which matches hipDeviceProp_t is returned.
Definition: hip_device.cpp:501
hipError_t hipCtxSetCacheConfig(hipFuncCache_t cacheConfig)
Set L1/Shared cache partition.
Definition: hip_context.cpp:225
hipError_t hipModuleLaunchKernel(hipFunction_t f, unsigned int gridDimX, unsigned int gridDimY, unsigned int gridDimZ, unsigned int blockDimX, unsigned int blockDimY, unsigned int blockDimZ, unsigned int sharedMemBytes, hipStream_t stream, void **kernelParams, void **extra)
launches kernel f with launch parameters and shared memory on stream with arguments passed to kernelp...
Definition: hip_runtime_api.h:269
uint32_t y
y
Definition: hip_runtime_api.h:271
void(* hipStreamCallback_t)(hipStream_t stream, hipError_t status, void *userData)
Definition: hip_runtime_api.h:843
hipError_t hipModuleLoad(hipModule_t *module, const char *fname)
Loads code object from file into a hipModule_t.
Definition: hip_module.cpp:1192
hipError_t hipDevicePrimaryCtxReset(hipDevice_t dev)
Resets the primary context on the GPU.
Definition: hip_context.cpp:308
hipError_t hipEventCreateWithFlags(hipEvent_t *event, unsigned flags)
Create an event with the specified flags.
Definition: hip_event.cpp:91
#define __host__
Definition: host_defines.h:41
hipError_t hipHostAlloc(void **ptr, size_t size, unsigned int flags)
Allocate device accessible page locked host memory [Deprecated].
Definition: hip_memory.cpp:428
hipError_t hipMallocHost(void **ptr, size_t size)
Allocate pinned host memory [Deprecated].
Definition: hip_memory.cpp:422
hipError_t hipEventElapsedTime(float *ms, hipEvent_t start, hipEvent_t stop)
Return the elapsed time between two events.
Definition: hip_event.cpp:174
hipError_t hipDeviceSetCacheConfig(hipFuncCache_t cacheConfig)
Set L1/Shared cache partition.
Definition: hip_device.cpp:74
hipError_t hipDeviceCanAccessPeer(int *canAccessPeer, int deviceId, int peerDeviceId)
Determine if a device can access a peer's memory.
Definition: hip_peer.cpp:179
hipError_t hipGetDeviceCount(int *count)
Return number of compute-capable devices.
Definition: hip_device.cpp:69
Definition: driver_types.h:68
hipError_t hipMemset(void *dst, int value, size_t sizeBytes)
Fills the first sizeBytes bytes of the memory area pointed to by dest with the constant byte value va...
Definition: hip_memory.cpp:1858
Definition: driver_types.h:253
hipError_t hipFuncGetAttribute(int *value, hipFunction_attribute attrib, hipFunction_t hfunc)
Find out a specific attribute for a given function.
Definition: hip_module.cpp:1106
hipError_t hipOccupancyMaxPotentialBlockSize(uint32_t *gridSize, uint32_t *blockSize, hipFunction_t f, size_t dynSharedMemPerBlk, uint32_t blockSizeLimit)
Determine the grid and block sizes that achieve maximum occupancy for a kernel.
Definition: hip_module.cpp:1364
hipError_t hipStreamDestroy(hipStream_t stream)
Destroys the specified stream.
Definition: hip_stream.cpp:194
hipError_t hipHostGetFlags(unsigned int *flagsPtr, void *hostPtr)
Return flags associated with host pointer.
Definition: hip_memory.cpp:772
hipError_t hipStreamSynchronize(hipStream_t stream)
Wait for all commands in stream to complete.
Definition: hip_stream.cpp:183
hipError_t hipMemAllocPitch(hipDeviceptr_t *dptr, size_t *pitch, size_t widthInBytes, size_t height, unsigned int elementSizeBytes)
Definition: hip_memory.cpp:504
hipError_t hipIpcOpenMemHandle(void **devPtr, hipIpcMemHandle_t handle, unsigned int flags)
Opens an interprocess memory handle exported from another process and returns a device pointer usable...
Definition: hip_memory.cpp:2103
hipError_t hipCtxGetCacheConfig(hipFuncCache_t *cacheConfig)
Get Cache configuration for a specific function.
Definition: hip_context.cpp:217
hipError_t hipMemcpyDtoD(hipDeviceptr_t dst, hipDeviceptr_t src, size_t sizeBytes)
Copy data from Device to Device.
Definition: hip_memory.cpp:1068
hipError_t hipMemset3DAsync(hipPitchedPtr pitchedDevPtr, int value, hipExtent extent, hipStream_t stream __dparm(0))
Fills asynchronously the memory area pointed to by pitchedDevPtr with the constant value...
Definition: hip_runtime_api.h:258
dim3 gridDim
Grid dimensions.
Definition: hip_runtime_api.h:280
no preference for shared memory or L1 (default)
Definition: hip_runtime_api.h:246
hipError_t hipMallocManaged(void **devPtr, size_t size, unsigned int flags __dparm(0))
Allocates memory that will be automatically managed by the Unified Memory system. ...
hipError_t hipCtxSynchronize(void)
Blocks until the default context has completed all preceding requested tasks.
Definition: hip_context.cpp:249
hipError_t hipMemsetD32Async(hipDeviceptr_t dst, int value, size_t count, hipStream_t stream __dparm(0))
Fills the memory area pointed to by dst with the constant integer value for specified number of times...
hipError_t hipCtxGetCurrent(hipCtx_t *ctx)
Get the handle of the current/default context.
Definition: hip_context.cpp:167
hipError_t hipMalloc3DArray(hipArray **array, const struct hipChannelFormatDesc *desc, struct hipExtent extent, unsigned int flags)
Allocate an array on the device.
Definition: hip_memory.cpp:731
hipError_t hipMemcpyDtoHAsync(void *dst, hipDeviceptr_t src, size_t sizeBytes, hipStream_t stream)
Copy data from Device to Host asynchronously.
Definition: hip_memory.cpp:1135
void * func
Device function symbol.
Definition: hip_runtime_api.h:279
hipError_t hipDeviceSynchronize(void)
Waits on all active streams on current device.
Definition: hip_device.cpp:142
hipError_t hipCtxPushCurrent(hipCtx_t ctx)
Push the context to be set as current/ default context.
Definition: hip_context.cpp:154
hipError_t hipMemcpyDtoH(void *dst, hipDeviceptr_t src, size_t sizeBytes)
Copy data from Device to Host.
Definition: hip_memory.cpp:1045
Defines the different new vector types for HIP runtime.
hipError_t hipMemcpyAsync(void *dst, const void *src, size_t sizeBytes, hipMemcpyKind kind, hipStream_t stream __dparm(0))
Copies sizeBytes bytes from the memory area pointed to by src to the memory area pointed to by offset...
hipError_t hipDeviceGetName(char *name, int len, hipDevice_t device)
Returns an identifier string for the device.
Definition: hip_device.cpp:429
hipError_t hipGetDeviceProperties(hipDeviceProp_t *prop, int deviceId)
Returns device properties.
Definition: hip_device.cpp:364
hipError_t hipHostRegister(void *hostPtr, size_t sizeBytes, unsigned int flags)
Register host memory so it can be accessed from the current device.
Definition: hip_memory.cpp:797
Definition: driver_types.h:61
hipError_t hipMalloc(void **ptr, size_t size)
Allocate memory on the default accelerator.
Definition: hip_memory.cpp:337
const char * hipGetErrorName(hipError_t hip_error)
Return name of the specified error code in text form.
Definition: hip_error.cpp:48
hipError_t hipMemset2D(void *dst, size_t pitch, int value, size_t width, size_t height)
Fills the memory area pointed to by dst with the constant value.
Definition: hip_memory.cpp:1863
Definition: driver_types.h:233
dim3 blockDim
Block dimensions.
Definition: hip_runtime_api.h:281
hipFuncCache_t
Definition: hip_runtime_api.h:245
hipError_t hipGetLastError(void)
Return last error returned by any HIP runtime API call and resets the stored error code to #hipSucces...
Definition: hip_error.cpp:32
hipError_t hipStreamWaitEvent(hipStream_t stream, hipEvent_t event, unsigned int flags)
Make the specified compute stream wait for an event.
Definition: hip_stream.cpp:130
hipError_t hipStreamGetFlags(hipStream_t stream, unsigned int *flags)
Return flags associated with this stream.
Definition: hip_stream.cpp:222
Defines surface types for HIP runtime.
hipStream_t stream
Stream identifier.
Definition: hip_runtime_api.h:284
hipError_t hipMemGetInfo(size_t *free, size_t *total)
Query memory info. Return snapshot of free memory, and total allocatable memory on the device...
Definition: hip_memory.cpp:1912
hipError_t __hipPushCallConfiguration(dim3 gridDim, dim3 blockDim, size_t sharedMem __dparm(0), hipStream_t stream __dparm(0))
Push configuration of a kernel launch.
hipError_t hipCtxGetDevice(hipDevice_t *device)
Get the handle of the device associated with current/default context.
Definition: hip_context.cpp:191
hipError_t hipDevicePrimaryCtxRelease(hipDevice_t dev)
Release the primary context on the GPU.
Definition: hip_context.cpp:285
hipError_t hipFree(void *ptr)
Free memory allocated by the hcc hip memory allocation API. This API performs an implicit hipDeviceSy...
Definition: hip_memory.cpp:1953
uint32_t z
z
Definition: hip_runtime_api.h:272
hipError_t hipCtxGetApiVersion(hipCtx_t ctx, int *apiVersion)
Returns the approximate HIP api version.
Definition: hip_context.cpp:207
hipError_t hipDeviceReset(void)
The state of current device is discarded and updated to a fresh state.
Definition: hip_device.cpp:147
hipError_t hipInit(unsigned int flags)
Explicitly initializes the HIP runtime.
Definition: hip_context.cpp:39
hipError_t hipLaunchCooperativeKernelMultiDevice(hipLaunchParams *launchParamsList, int numDevices, unsigned int flags)
Launches kernels on multiple devices where thread blocks can cooperate and synchronize as they execut...
Definition: hip_module.cpp:482
hipError_t hipMemcpy3D(const struct hipMemcpy3DParms *p)
Copies data between host and device.
Definition: hip_memory.cpp:1355
hipError_t hipRuntimeGetVersion(int *runtimeVersion)
Returns the approximate HIP Runtime version.
Definition: hip_context.cpp:97
hipError_t hipMemcpyHtoA(hipArray *dstArray, size_t dstOffset, const void *srcHost, size_t count)
Copies data between host and device.
Definition: hip_memory.cpp:1226
hipError_t hipSetupArgument(const void *arg, size_t size, size_t offset)
Set a kernel argument.
Definition: hip_clang.cpp:192
hipError_t hipMemcpyDtoDAsync(hipDeviceptr_t dst, hipDeviceptr_t src, size_t sizeBytes, hipStream_t stream)
Copy data from Device to Device asynchronously.
Definition: hip_memory.cpp:1127
Definition: hip_runtime_api.h:83
hipError_t hipSetDevice(int deviceId)
Set default device to be used for subsequent hip API calls from this thread.
Definition: hip_device.cpp:131
hipError_t hipDeviceGet(hipDevice_t *device, int ordinal)
Returns a handle to a compute device.
Definition: hip_context.cpp:70
hipError_t hipDeviceTotalMem(size_t *bytes, hipDevice_t device)
Returns the total amount of memory on the device.
Definition: hip_device.cpp:463
hipError_t hipMemAllocHost(void **ptr, size_t size)
Allocate pinned host memory [Deprecated].
Definition: hip_memory.cpp:425
hipError_t hipFuncSetCacheConfig(const void *func, hipFuncCache_t config)
Set Cache configuration for a specific function.
Definition: hip_device.cpp:107
The compiler selects a device-specific value for the banking.
Definition: hip_runtime_api.h:257
Definition: hip_runtime.h:202
hipError_t hipMemcpyPeerAsync(void *dst, int dstDeviceId, const void *src, int srcDevice, size_t sizeBytes, hipStream_t stream __dparm(0))
Copies memory from one device to memory on another device.
hipError_t hipCtxGetFlags(unsigned int *flags)
Return flags used for creating default context.
Definition: hip_context.cpp:254
hipError_t hipExtGetLinkTypeAndHopCount(int device1, int device2, uint32_t *linktype, uint32_t *hopcount)
Returns the link type and hop count between two devices.
Definition: hip_device.cpp:588
hipError_t hipCtxDestroy(hipCtx_t ctx)
Destroy a HIP context.
Definition: hip_context.cpp:109
hipError_t hipRegisterApiCallback(uint32_t id, void *fun, void *arg)
Definition: hip_intercept.cpp:33
hipSharedMemConfig
Definition: hip_runtime_api.h:256
Definition: hip_hcc_internal.h:720
hipError_t hipOccupancyMaxActiveBlocksPerMultiprocessorWithFlags(uint32_t *numBlocks, hipFunction_t f, uint32_t blockSize, size_t dynSharedMemPerBlk, unsigned int flags)
Returns occupancy for a device function.
Definition: hip_module.cpp:1436
hipError_t hipDeviceGetAttribute(int *pi, hipDeviceAttribute_t attr, int deviceId)
Query for a specific device attribute.
Definition: hip_device.cpp:337
hipError_t hipMemcpyHtoDAsync(hipDeviceptr_t dst, void *src, size_t sizeBytes, hipStream_t stream)
Copy data from Host to Device asynchronously.
Definition: hip_memory.cpp:1120
hipError_t hipHostUnregister(void *hostPtr)
Un-register host pointer.
Definition: hip_memory.cpp:872
Definition: hip_hcc_internal.h:544
hipError_t hipMemsetD8Async(hipDeviceptr_t dest, unsigned char value, size_t count, hipStream_t stream __dparm(0))
Fills the first sizeBytes bytes of the memory area pointed to by dest with the constant byte value va...
hipError_t hipMemcpyPeer(void *dst, int dstDeviceId, const void *src, int srcDeviceId, size_t sizeBytes)
Copies memory from one device to memory on another device.
Definition: hip_peer.cpp:200
hipError_t hipStreamCreate(hipStream_t *stream)
Create an asynchronous stream.
Definition: hip_stream.cpp:106
hipError_t hipMemcpy3DAsync(const struct hipMemcpy3DParms *p, hipStream_t stream __dparm(0))
Copies data between host and device asynchronously.
hipError_t hipMemcpy(void *dst, const void *src, size_t sizeBytes, hipMemcpyKind kind)
Copy data from src to dst.
Definition: hip_memory.cpp:994
hipError_t hipEventCreate(hipEvent_t *event)
Definition: hip_event.cpp:97
Definition: driver_types.h:90
Definition: hip_runtime_api.h:106
hipError_t hipDevicePrimaryCtxGetState(hipDevice_t dev, unsigned int *flags, int *active)
Get the state of the primary context.
Definition: hip_context.cpp:263
hipError_t hipCtxEnablePeerAccess(hipCtx_t peerCtx, unsigned int flags)
Enables direct access to memory allocations in a peer context.
Definition: hip_peer.cpp:214
Definition: driver_types.h:209
hipError_t hipDeviceSetSharedMemConfig(hipSharedMemConfig config)
The bank width of shared memory on current device is set.
Definition: hip_device.cpp:115
hipError_t hipGetDevice(int *deviceId)
Return the default device id for the calling host thread.
Definition: hip_device.cpp:32
hipError_t hipEventRecord(hipEvent_t event, hipStream_t stream)
Record an event in the specified stream.
Definition: hip_event.cpp:104
hipError_t hipModuleGetGlobal(void **, size_t *, hipModule_t, const char *)
returns device memory pointer and size of the kernel present in the module with symbol name ...
Definition: hip_module.cpp:841
Definition: hip_hcc_internal.h:391
hipError_t hipDeviceGetPCIBusId(char *pciBusId, int len, int device)
Returns a PCI Bus Id string for the device, overloaded to take int device ID.
Definition: hip_device.cpp:443
prefer larger shared memory and smaller L1 cache
Definition: hip_runtime_api.h:247
hipError_t hipMemcpy2DToArray(hipArray *dst, size_t wOffset, size_t hOffset, const void *src, size_t spitch, size_t width, size_t height, hipMemcpyKind kind)
Copies data between host and device.
Definition: hip_memory.cpp:1142
void ** args
Arguments.
Definition: hip_runtime_api.h:282
hipError_t hipStreamQuery(hipStream_t stream)
Return #hipSuccess if all of the operations in the specified stream have completed, or #hipErrorNotReady if not.
Definition: hip_stream.cpp:160
hipError_t hipFuncGetAttributes(struct hipFuncAttributes *attr, const void *func)
Find out attributes for a given function.
Definition: hip_module.cpp:1088
Definition: hip_runtime_api.h:260
hipError_t hipIpcCloseMemHandle(void *devPtr)
Close memory mapped with hipIpcOpenMemHandle.
Definition: hip_memory.cpp:2148
hipError_t hipPointerGetAttributes(hipPointerAttribute_t *attributes, const void *ptr)
Return attributes for the specified pointer.
Definition: hip_memory.cpp:259
hipError_t hipMemcpyParam2DAsync(const hip_Memcpy2D *pCopy, hipStream_t stream __dparm(0))
Copies memory for 2D arrays.
size_t sharedMem
Shared memory.
Definition: hip_runtime_api.h:283
hipError_t hipMemsetD8(hipDeviceptr_t dest, unsigned char value, size_t count)
Fills the first sizeBytes bytes of the memory area pointed to by dest with the constant byte value va...
Definition: hip_memory.cpp:1875
hipError_t hipProfilerStop()
Stop recording of profiling information. When using this API, start the profiler with profiling disab...
Definition: hip_hcc.cpp:2462
hipError_t hipMemsetD32(hipDeviceptr_t dest, int value, size_t count)
Fills the memory area pointed to by dest with the constant integer value for specified number of time...
Definition: hip_memory.cpp:1895
hipError_t hipProfilerStart()
Start recording of profiling information. When using this API, start the profiler with profiling disab...
Definition: hip_hcc.cpp:2452
hipError_t hipLaunchByPtr(const void *func)
Launch a kernel.
Definition: hip_clang.cpp:210
Definition: texture_types.h:94