Global enum and defines
Typedefs | |
typedef enum __HIP_NODISCARD hipError_t | hipError_t |
typedef struct ihipCtx_t * | hipCtx_t |
typedef int | hipDevice_t |
typedef struct ihipStream_t * | hipStream_t |
typedef struct ihipModule_t * | hipModule_t |
typedef struct ihipModuleSymbol_t * | hipFunction_t |
typedef struct ihipMemPoolHandle_t * | hipMemPool_t |
typedef struct ihipEvent_t * | hipEvent_t |
typedef void * | hipExternalMemory_t |
typedef void * | hipExternalSemaphore_t |
typedef struct _hipGraphicsResource | hipGraphicsResource |
typedef hipGraphicsResource * | hipGraphicsResource_t |
typedef struct ihipGraph * | hipGraph_t |
typedef struct hipGraphNode * | hipGraphNode_t |
typedef struct hipGraphExec * | hipGraphExec_t |
typedef struct hipUserObject * | hipUserObject_t |
typedef void(* | hipHostFn_t) (void *userData) |
typedef struct ihipMemGenericAllocationHandle * | hipMemGenericAllocationHandle_t |
typedef unsigned int | GLuint |
typedef unsigned int | GLenum |
Detailed Description
Macro Definition Documentation
◆ __dparm
#define __dparm | ( | x | ) |
◆ __HIP_NODISCARD
#define __HIP_NODISCARD |
◆ DEPRECATED
#define DEPRECATED | ( | msg | ) | __attribute__ ((deprecated(msg))) |
◆ DEPRECATED_MSG
#define DEPRECATED_MSG "This API is marked as deprecated and may not be supported in future releases. For more details please refer https://github.com/ROCm/HIP/blob/develop/docs/reference/deprecated_api_list.md" |
◆ GENERIC_GRID_LAUNCH
#define GENERIC_GRID_LAUNCH 1 |
◆ HIP_IPC_HANDLE_SIZE
#define HIP_IPC_HANDLE_SIZE 64 |
◆ HIP_LAUNCH_PARAM_BUFFER_POINTER
#define HIP_LAUNCH_PARAM_BUFFER_POINTER ((void*)0x01) |
◆ HIP_LAUNCH_PARAM_BUFFER_SIZE
#define HIP_LAUNCH_PARAM_BUFFER_SIZE ((void*)0x02) |
◆ HIP_LAUNCH_PARAM_END
#define HIP_LAUNCH_PARAM_END ((void*)0x03) |
◆ hipArrayCubemap
#define hipArrayCubemap 0x04 |
◆ hipArrayDefault
#define hipArrayDefault 0x00 |
Default HIP array allocation flag.
◆ hipArrayLayered
#define hipArrayLayered 0x01 |
◆ hipArraySurfaceLoadStore
#define hipArraySurfaceLoadStore 0x02 |
◆ hipArrayTextureGather
#define hipArrayTextureGather 0x08 |
◆ hipChooseDevice
#define hipChooseDevice hipChooseDeviceR0600 |
◆ hipCooperativeLaunchMultiDeviceNoPostSync
#define hipCooperativeLaunchMultiDeviceNoPostSync 0x02 |
◆ hipCooperativeLaunchMultiDeviceNoPreSync
#define hipCooperativeLaunchMultiDeviceNoPreSync 0x01 |
◆ hipCpuDeviceId
#define hipCpuDeviceId ((int)-1) |
◆ hipDeviceLmemResizeToMax
#define hipDeviceLmemResizeToMax 0x10 |
◆ hipDeviceMallocDefault
#define hipDeviceMallocDefault 0x0 |
◆ hipDeviceMallocFinegrained
#define hipDeviceMallocFinegrained 0x1 |
Memory is allocated in fine grained region of device.
◆ hipDeviceMallocUncached
#define hipDeviceMallocUncached 0x3 |
Memory allocated will be uncached.
◆ hipDeviceMapHost
#define hipDeviceMapHost 0x8 |
◆ hipDeviceProp_t
#define hipDeviceProp_t hipDeviceProp_tR0600 |
◆ hipDeviceScheduleAuto
#define hipDeviceScheduleAuto 0x0 |
Automatically select between Spin and Yield.
◆ hipDeviceScheduleBlockingSync
#define hipDeviceScheduleBlockingSync 0x4 |
◆ hipDeviceScheduleMask
#define hipDeviceScheduleMask 0x7 |
◆ hipDeviceScheduleSpin
#define hipDeviceScheduleSpin 0x1 |
Dedicate a CPU core to spin-wait. Provides lowest latency, but burns a CPU core and may consume more power.
◆ hipDeviceScheduleYield
#define hipDeviceScheduleYield 0x2 |
Yield the CPU to the operating system when waiting. May increase latency, but lowers power and is friendlier to other threads in the system.
◆ hipEventBlockingSync
#define hipEventBlockingSync 0x1 |
Waiting will yield CPU. Power-friendly and usage-friendly but may increase latency.
◆ hipEventDefault
#define hipEventDefault 0x0 |
Default flags.
◆ hipEventDisableSystemFence
#define hipEventDisableSystemFence 0x20000000 |
Disable performing a system scope sequentially consistent memory fence when the event transitions from recording to recorded. This can be used for events that are only being used to measure timing, and do not require the event inspection operations (see hipEventSynchronize, hipEventQuery, and hipEventElapsedTime) to synchronize-with the work on which the recorded event (see hipEventRecord) is waiting. On some AMD GPU devices this can improve the accuracy of timing measurements by avoiding the cost of cache writeback and invalidation, and the performance impact of those actions on the execution of following work.
◆ hipEventDisableTiming
#define hipEventDisableTiming 0x2 |
Disable event's capability to record timing information. May improve performance.
◆ hipEventInterprocess
#define hipEventInterprocess 0x4 |
Event can support IPC. hipEventDisableTiming also must be set.
◆ hipEventReleaseToDevice
#define hipEventReleaseToDevice 0x40000000 |
Use a device-scope release when recording this event. This flag is useful to obtain more precise timings of commands between events. The flag is a no-op on CUDA platforms.
◆ hipEventReleaseToSystem
#define hipEventReleaseToSystem 0x80000000 |
Use a system-scope release when recording this event. This flag is useful to make non-coherent host memory visible to the host. The flag is a no-op on CUDA platforms.
◆ hipExtAnyOrderLaunch
#define hipExtAnyOrderLaunch 0x01 |
AnyOrderLaunch of kernels.
◆ hipExternalMemoryDedicated
#define hipExternalMemoryDedicated 0x1 |
◆ hipExtHostRegisterCoarseGrained
#define hipExtHostRegisterCoarseGrained 0x8 |
Coarse Grained host memory lock.
◆ hipGetDeviceProperties
#define hipGetDeviceProperties hipGetDevicePropertiesR0600 |
◆ hipGraphKernelNodePortDefault
#define hipGraphKernelNodePortDefault 0 |
This port activates when the kernel has finished executing.
◆ hipGraphKernelNodePortLaunchCompletion
#define hipGraphKernelNodePortLaunchCompletion 2 |
This port activates when all blocks of the kernel have begun execution.
◆ hipGraphKernelNodePortProgrammatic
#define hipGraphKernelNodePortProgrammatic 1 |
This port activates when all blocks of the kernel have performed hipTriggerProgrammaticLaunchCompletion() or have terminated. It must be used with edge type hipGraphDependencyTypeProgrammatic.
◆ hipHostMallocCoherent
#define hipHostMallocCoherent 0x40000000 |
Allocate coherent memory. Overrides HIP_COHERENT_HOST_ALLOC for specific allocation.
◆ hipHostMallocDefault
#define hipHostMallocDefault 0x0 |
Default pinned memory allocation on the host.
◆ hipHostMallocMapped
#define hipHostMallocMapped 0x2 |
Map the allocation into the address space for the current device. The device pointer can be obtained with hipHostGetDevicePointer.
◆ hipHostMallocNonCoherent
#define hipHostMallocNonCoherent 0x80000000 |
Allocate non-coherent memory. Overrides HIP_COHERENT_HOST_ALLOC for specific allocation.
◆ hipHostMallocNumaUser
#define hipHostMallocNumaUser 0x20000000 |
Host memory allocation will follow numa policy set by user.
- Note
- This numa allocation flag is applicable on Linux, under development on Windows.
◆ hipHostMallocPortable
#define hipHostMallocPortable 0x1 |
Memory is considered allocated by all contexts.
◆ hipHostMallocWriteCombined
#define hipHostMallocWriteCombined 0x4 |
Allocates the memory as write-combined. On some system configurations, write-combined allocations may be transferred faster across the PCI Express bus; however, most CPUs read them with low efficiency. It's a good option for data transfer from host to device via mapped pinned memory.
◆ hipHostRegisterDefault
#define hipHostRegisterDefault 0x0 |
Memory is Mapped and Portable.
◆ hipHostRegisterIoMemory
#define hipHostRegisterIoMemory 0x4 |
Not supported.
◆ hipHostRegisterMapped
#define hipHostRegisterMapped 0x2 |
Map the allocation into the address space for the current device. The device pointer can be obtained with hipHostGetDevicePointer.
◆ hipHostRegisterPortable
#define hipHostRegisterPortable 0x1 |
Memory is considered registered by all contexts.
◆ hipHostRegisterReadOnly
#define hipHostRegisterReadOnly 0x08 |
This flag is ignored on AMD devices.
◆ hipInvalidDeviceId
#define hipInvalidDeviceId ((int)-2) |
◆ hipIpcMemLazyEnablePeerAccess
#define hipIpcMemLazyEnablePeerAccess 0x01 |
◆ hipKernelNodeAttributeAccessPolicyWindow
#define hipKernelNodeAttributeAccessPolicyWindow hipLaunchAttributeAccessPolicyWindow |
◆ hipKernelNodeAttributeCooperative
#define hipKernelNodeAttributeCooperative hipLaunchAttributeCooperative |
◆ hipKernelNodeAttributePriority
#define hipKernelNodeAttributePriority hipLaunchAttributePriority |
◆ hipKernelNodeAttrID
#define hipKernelNodeAttrID hipLaunchAttributeID |
Kernel node attributeID
◆ hipKernelNodeAttrValue
#define hipKernelNodeAttrValue hipLaunchAttributeValue |
Kernel node attribute value
◆ hipMallocSignalMemory
#define hipMallocSignalMemory 0x2 |
Memory represents a HSA signal.
◆ hipMemAttachGlobal
#define hipMemAttachGlobal 0x01 |
Memory can be accessed by any stream on any device
◆ hipMemAttachHost
#define hipMemAttachHost 0x02 |
Memory cannot be accessed by any stream on any device.
◆ hipMemAttachSingle
#define hipMemAttachSingle 0x04 |
Memory can only be accessed by a single stream on the associated device.
◆ hipOccupancyDefault
#define hipOccupancyDefault 0x00 |
◆ hipOccupancyDisableCachingOverride
#define hipOccupancyDisableCachingOverride 0x01 |
◆ hipStreamDefault
#define hipStreamDefault 0x00 |
Flags that can be used with hipStreamCreateWithFlags. Default stream creation flags. These are used with hipStreamCreate().
◆ hipStreamLegacy
#define hipStreamLegacy ((hipStream_t)1) |
◆ hipStreamNonBlocking
#define hipStreamNonBlocking 0x01 |
Stream does not implicitly synchronize with null stream.
◆ hipStreamPerThread
#define hipStreamPerThread ((hipStream_t)2) |
Implicit stream per application thread.
◆ hipStreamWaitValueAnd
#define hipStreamWaitValueAnd 0x2 |
◆ hipStreamWaitValueEq
#define hipStreamWaitValueEq 0x1 |
◆ hipStreamWaitValueGte
#define hipStreamWaitValueGte 0x0 |
◆ hipStreamWaitValueNor
#define hipStreamWaitValueNor 0x3 |
Typedef Documentation
◆ GLenum
typedef unsigned int GLenum |
GLenum as uint.
◆ GLuint
typedef unsigned int GLuint |
GLuint as uint.
◆ hipCtx_t
typedef struct ihipCtx_t* hipCtx_t |
◆ hipDevice_t
typedef int hipDevice_t |
◆ hipError_t
HIP error type
◆ hipEvent_t
typedef struct ihipEvent_t* hipEvent_t |
◆ hipExternalMemory_t
typedef void* hipExternalMemory_t |
◆ hipExternalSemaphore_t
typedef void* hipExternalSemaphore_t |
◆ hipFunction_t
typedef struct ihipModuleSymbol_t* hipFunction_t |
◆ hipGraph_t
typedef struct ihipGraph* hipGraph_t |
An opaque value that represents a hip graph
◆ hipGraphExec_t
typedef struct hipGraphExec* hipGraphExec_t |
An opaque value that represents a hip graph Exec
◆ hipGraphicsResource
typedef struct _hipGraphicsResource hipGraphicsResource |
◆ hipGraphicsResource_t
typedef hipGraphicsResource* hipGraphicsResource_t |
◆ hipGraphNode_t
typedef struct hipGraphNode* hipGraphNode_t |
An opaque value that represents a hip graph node
◆ hipHostFn_t
typedef void(* hipHostFn_t) (void *userData) |
◆ hipMemGenericAllocationHandle_t
typedef struct ihipMemGenericAllocationHandle* hipMemGenericAllocationHandle_t |
Generic handle for memory allocation
◆ hipMemPool_t
typedef struct ihipMemPoolHandle_t* hipMemPool_t |
HIP memory pool
◆ hipModule_t
typedef struct ihipModule_t* hipModule_t |
◆ hipStream_t
typedef struct ihipStream_t* hipStream_t |
◆ hipUserObject_t
typedef struct hipUserObject* hipUserObject_t |
An opaque value that represents a user obj
Enumeration Type Documentation
◆ hipAccessProperty
enum hipAccessProperty |
◆ hipArraySparseSubresourceType
◆ hipComputeMode
enum hipComputeMode |
◆ hipDeviceAttribute_t
enum hipDeviceAttribute_t |
hipDeviceAttribute_t hipDeviceAttributeUnused number: 5
Enumerator | |
---|---|
hipDeviceAttributeCudaCompatibleBegin | |
hipDeviceAttributeEccEnabled | Whether ECC support is enabled. |
hipDeviceAttributeAccessPolicyMaxWindowSize | Cuda only. The maximum size of the window policy in bytes. |
hipDeviceAttributeAsyncEngineCount | Asynchronous engines number. |
hipDeviceAttributeCanMapHostMemory | Whether host memory can be mapped into device address space. |
hipDeviceAttributeCanUseHostPointerForRegisteredMem | Device can access host registered memory at the same virtual address as the CPU |
hipDeviceAttributeClockRate | Peak clock frequency in kilohertz. |
hipDeviceAttributeComputeMode | Compute mode that device is currently in. |
hipDeviceAttributeComputePreemptionSupported | Device supports Compute Preemption. |
hipDeviceAttributeConcurrentKernels | Device can possibly execute multiple kernels concurrently. |
hipDeviceAttributeConcurrentManagedAccess | Device can coherently access managed memory concurrently with the CPU. |
hipDeviceAttributeCooperativeLaunch | Support cooperative launch. |
hipDeviceAttributeCooperativeMultiDeviceLaunch | Support cooperative launch on multiple devices. |
hipDeviceAttributeDeviceOverlap | Device can concurrently copy memory and execute a kernel. Deprecated. Use instead asyncEngineCount. |
hipDeviceAttributeDirectManagedMemAccessFromHost | Host can directly access managed memory on the device without migration |
hipDeviceAttributeGlobalL1CacheSupported | Device supports caching globals in L1. |
hipDeviceAttributeHostNativeAtomicSupported | Link between the device and the host supports native atomic operations. |
hipDeviceAttributeIntegrated | Device is integrated GPU. |
hipDeviceAttributeIsMultiGpuBoard | Multiple GPU devices. |
hipDeviceAttributeKernelExecTimeout | Run time limit for kernels executed on the device. |
hipDeviceAttributeL2CacheSize | Size of L2 cache in bytes. 0 if the device doesn't have L2 cache. |
hipDeviceAttributeLocalL1CacheSupported | caching locals in L1 is supported |
hipDeviceAttributeLuid | 8-byte locally unique identifier. Undefined on TCC and non-Windows platforms. |
hipDeviceAttributeLuidDeviceNodeMask | Luid device node mask. Undefined on TCC and non-Windows platforms. |
hipDeviceAttributeComputeCapabilityMajor | Major compute capability version number. |
hipDeviceAttributeManagedMemory | Device supports allocating managed memory on this system. |
hipDeviceAttributeMaxBlocksPerMultiProcessor | Maximum number of blocks per multiprocessor. |
hipDeviceAttributeMaxBlockDimX | Max block size in width. |
hipDeviceAttributeMaxBlockDimY | Max block size in height. |
hipDeviceAttributeMaxBlockDimZ | Max block size in depth. |
hipDeviceAttributeMaxGridDimX | Max grid size in width. |
hipDeviceAttributeMaxGridDimY | Max grid size in height. |
hipDeviceAttributeMaxGridDimZ | Max grid size in depth. |
hipDeviceAttributeMaxSurface1D | Maximum size of 1D surface. |
hipDeviceAttributeMaxSurface1DLayered | Cuda only. Maximum dimensions of 1D layered surface. |
hipDeviceAttributeMaxSurface2D | Maximum dimension (width, height) of 2D surface. |
hipDeviceAttributeMaxSurface2DLayered | Cuda only. Maximum dimensions of 2D layered surface. |
hipDeviceAttributeMaxSurface3D | Maximum dimension (width, height, depth) of 3D surface. |
hipDeviceAttributeMaxSurfaceCubemap | Cuda only. Maximum dimensions of Cubemap surface. |
hipDeviceAttributeMaxSurfaceCubemapLayered | Cuda only. Maximum dimension of Cubemap layered surface. |
hipDeviceAttributeMaxTexture1DWidth | Maximum size of 1D texture. |
hipDeviceAttributeMaxTexture1DLayered | Maximum dimensions of 1D layered texture. |
hipDeviceAttributeMaxTexture1DLinear | Maximum number of elements allocatable in a 1D linear texture. Use cudaDeviceGetTexture1DLinearMaxWidth() instead on Cuda. |
hipDeviceAttributeMaxTexture1DMipmap | Maximum size of 1D mipmapped texture. |
hipDeviceAttributeMaxTexture2DWidth | Maximum dimension width of 2D texture. |
hipDeviceAttributeMaxTexture2DHeight | Maximum dimension height of 2D texture. |
hipDeviceAttributeMaxTexture2DGather | Maximum dimensions of 2D texture if gather operations performed. |
hipDeviceAttributeMaxTexture2DLayered | Maximum dimensions of 2D layered texture. |
hipDeviceAttributeMaxTexture2DLinear | Maximum dimensions (width, height, pitch) of 2D textures bound to pitched memory. |
hipDeviceAttributeMaxTexture2DMipmap | Maximum dimensions of 2D mipmapped texture. |
hipDeviceAttributeMaxTexture3DWidth | Maximum dimension width of 3D texture. |
hipDeviceAttributeMaxTexture3DHeight | Maximum dimension height of 3D texture. |
hipDeviceAttributeMaxTexture3DDepth | Maximum dimension depth of 3D texture. |
hipDeviceAttributeMaxTexture3DAlt | Maximum dimensions of alternate 3D texture. |
hipDeviceAttributeMaxTextureCubemap | Maximum dimensions of Cubemap texture. |
hipDeviceAttributeMaxTextureCubemapLayered | Maximum dimensions of Cubemap layered texture. |
hipDeviceAttributeMaxThreadsDim | Maximum dimension of a block. |
hipDeviceAttributeMaxThreadsPerBlock | Maximum number of threads per block. |
hipDeviceAttributeMaxThreadsPerMultiProcessor | Maximum resident threads per multiprocessor. |
hipDeviceAttributeMaxPitch | Maximum pitch in bytes allowed by memory copies. |
hipDeviceAttributeMemoryBusWidth | Global memory bus width in bits. |
hipDeviceAttributeMemoryClockRate | Peak memory clock frequency in kilohertz. |
hipDeviceAttributeComputeCapabilityMinor | Minor compute capability version number. |
hipDeviceAttributeMultiGpuBoardGroupID | Unique ID of device group on the same multi-GPU board. |
hipDeviceAttributeMultiprocessorCount | Number of multiprocessors on the device. |
hipDeviceAttributeUnused1 | Previously hipDeviceAttributeName. |
hipDeviceAttributePageableMemoryAccess | Device supports coherently accessing pageable memory without calling hipHostRegister on it |
hipDeviceAttributePageableMemoryAccessUsesHostPageTables | Device accesses pageable memory via the host's page tables. |
hipDeviceAttributePciBusId | PCI Bus ID. |
hipDeviceAttributePciDeviceId | PCI Device ID. |
hipDeviceAttributePciDomainID | PCI Domain ID. |
hipDeviceAttributePersistingL2CacheMaxSize | Maximum l2 persisting lines capacity in bytes. |
hipDeviceAttributeMaxRegistersPerBlock | 32-bit registers available to a thread block. This number is shared by all thread blocks simultaneously resident on a multiprocessor. |
hipDeviceAttributeMaxRegistersPerMultiprocessor | 32-bit registers available per multiprocessor. |
hipDeviceAttributeReservedSharedMemPerBlock | Shared memory reserved by CUDA driver per block. |
hipDeviceAttributeMaxSharedMemoryPerBlock | Maximum shared memory available per block in bytes. |
hipDeviceAttributeSharedMemPerBlockOptin | Maximum shared memory per block usable by special opt in. |
hipDeviceAttributeSharedMemPerMultiprocessor | Shared memory available per multiprocessor. |
hipDeviceAttributeSingleToDoublePrecisionPerfRatio | Cuda only. Performance ratio of single precision to double precision. |
hipDeviceAttributeStreamPrioritiesSupported | Whether to support stream priorities. |
hipDeviceAttributeSurfaceAlignment | Alignment requirement for surfaces. |
hipDeviceAttributeTccDriver | Cuda only. Whether device is a Tesla device using TCC driver. |
hipDeviceAttributeTextureAlignment | Alignment requirement for textures. |
hipDeviceAttributeTexturePitchAlignment | Pitch alignment requirement for 2D texture references bound to pitched memory. |
hipDeviceAttributeTotalConstantMemory | Constant memory size in bytes. |
hipDeviceAttributeTotalGlobalMem | Global memory available on device. |
hipDeviceAttributeUnifiedAddressing | Cuda only. A unified address space shared with the host. |
hipDeviceAttributeUnused2 | Previously hipDeviceAttributeUuid. |
hipDeviceAttributeWarpSize | Warp size in threads. |
hipDeviceAttributeMemoryPoolsSupported | Device supports HIP Stream Ordered Memory Allocator. |
hipDeviceAttributeVirtualMemoryManagementSupported | Device supports HIP virtual memory management. |
hipDeviceAttributeHostRegisterSupported | Can device support host memory registration via hipHostRegister. |
hipDeviceAttributeMemoryPoolSupportedHandleTypes | Supported handle mask for HIP Stream Ordered Memory Allocator. |
hipDeviceAttributeCudaCompatibleEnd | |
hipDeviceAttributeAmdSpecificBegin | |
hipDeviceAttributeClockInstructionRate | Frequency in kHz of the timer used by the device-side "clock*". |
hipDeviceAttributeUnused3 | Previously hipDeviceAttributeArch. |
hipDeviceAttributeMaxSharedMemoryPerMultiprocessor | Maximum Shared Memory PerMultiprocessor. |
hipDeviceAttributeUnused4 | Previously hipDeviceAttributeGcnArch. |
hipDeviceAttributeUnused5 | Previously hipDeviceAttributeGcnArchName. |
hipDeviceAttributeHdpMemFlushCntl | Address of the HDP_MEM_COHERENCY_FLUSH_CNTL register. |
hipDeviceAttributeHdpRegFlushCntl | Address of the HDP_REG_COHERENCY_FLUSH_CNTL register. |
hipDeviceAttributeCooperativeMultiDeviceUnmatchedFunc | Supports cooperative launch on multiple devices with unmatched functions |
hipDeviceAttributeCooperativeMultiDeviceUnmatchedGridDim | Supports cooperative launch on multiple devices with unmatched grid dimensions |
hipDeviceAttributeCooperativeMultiDeviceUnmatchedBlockDim | Supports cooperative launch on multiple devices with unmatched block dimensions |
hipDeviceAttributeCooperativeMultiDeviceUnmatchedSharedMem | Supports cooperative launch on multiple devices with unmatched shared memories |
hipDeviceAttributeIsLargeBar | Whether it is LargeBar. |
hipDeviceAttributeAsicRevision | Revision of the GPU in this device. |
hipDeviceAttributeCanUseStreamWaitValue | '1' if Device supports hipStreamWaitValue32() and hipStreamWaitValue64(), '0' otherwise. |
hipDeviceAttributeImageSupport | '1' if Device supports image, '0' otherwise. |
hipDeviceAttributePhysicalMultiProcessorCount | All available physical compute units for the device |
hipDeviceAttributeFineGrainSupport | '1' if Device supports fine grain, '0' otherwise |
hipDeviceAttributeWallClockRate | Constant frequency of wall clock in kilohertz. |
hipDeviceAttributeAmdSpecificEnd | |
hipDeviceAttributeVendorSpecificBegin |
◆ hipDeviceP2PAttr
enum hipDeviceP2PAttr |
◆ hipDriverProcAddressQueryResult
◆ hipExternalMemoryHandleType
◆ hipExternalSemaphoreHandleType
◆ hipFlushGPUDirectRDMAWritesOptions
◆ hipFuncAttribute
enum hipFuncAttribute |
◆ hipFuncCache_t
enum hipFuncCache_t |
- Warning
- On AMD devices and some Nvidia devices, these hints and controls are ignored.
◆ hipGLDeviceList
enum hipGLDeviceList |
◆ hipGPUDirectRDMAWritesOrdering
◆ hipGraphDebugDotFlags
Enumerator | |
---|---|
hipGraphDebugDotFlagsVerbose | Output all debug data as if every debug flag is enabled |
hipGraphDebugDotFlagsKernelNodeParams | Adds hipKernelNodeParams to output |
hipGraphDebugDotFlagsMemcpyNodeParams | Adds hipMemcpy3DParms to output |
hipGraphDebugDotFlagsMemsetNodeParams | Adds hipMemsetParams to output |
hipGraphDebugDotFlagsHostNodeParams | Adds hipHostNodeParams to output |
hipGraphDebugDotFlagsEventNodeParams | Adds hipEvent_t handle from record and wait nodes to output |
hipGraphDebugDotFlagsExtSemasSignalNodeParams | Adds hipExternalSemaphoreSignalNodeParams values to output |
hipGraphDebugDotFlagsExtSemasWaitNodeParams | Adds hipExternalSemaphoreWaitNodeParams to output |
hipGraphDebugDotFlagsKernelNodeAttributes | Adds hipKernelNodeAttrID values to output |
hipGraphDebugDotFlagsHandles | Adds node handles and every kernel function handle to output |
◆ hipGraphDependencyType
◆ hipGraphExecUpdateResult
Graph execution update result
◆ hipGraphicsRegisterFlags
HIP access flags for interop resources.
◆ hipGraphInstantiateFlags
◆ hipGraphInstantiateResult
hipGraphInstantiateWithParams results
◆ hipGraphMemAttributeType
◆ hipGraphNodeType
enum hipGraphNodeType |
hipGraphNodeType
◆ hipJitOption
enum hipJitOption |
hipJitOption
◆ hipLaunchAttributeID
enum hipLaunchAttributeID |
◆ hipLimit_t
enum hipLimit_t |
hipLimit
- Note
- In HIP device limit-related APIs, any input limit value other than those defined in the enum is treated as "UnsupportedLimit" by default.
◆ hipMemAccessFlags
enum hipMemAccessFlags |
◆ hipMemAllocationGranularity_flags
◆ hipMemAllocationHandleType
Flags for specifying handle types for memory pool allocations
◆ hipMemAllocationType
enum hipMemAllocationType |
◆ hipMemHandleType
enum hipMemHandleType |
◆ hipMemLocationType
enum hipMemLocationType |
◆ hipMemOperationType
enum hipMemOperationType |
◆ hipMemoryAdvise
enum hipMemoryAdvise |
HIP Memory Advise values
- Note
- This memory advise enumeration is used on Linux, not Windows.
◆ hipMemoryType
enum hipMemoryType |
hipMemoryType (for pointer attributes)
- Note
- hipMemoryType enum values are combination of cudaMemoryType and cuMemoryType and AMD specific enum values.
◆ hipMemPoolAttr
enum hipMemPoolAttr |
HIP memory pool attributes
◆ hipMemRangeAttribute
enum hipMemRangeAttribute |
HIP range attributes
Enumerator | |
---|---|
hipMemRangeAttributeReadMostly | Whether the range will mostly be read and only occasionally be written to |
hipMemRangeAttributePreferredLocation | The preferred location of the range. |
hipMemRangeAttributeAccessedBy | Memory range has hipMemAdviseSetAccessedBy set for the specified device |
hipMemRangeAttributeLastPrefetchLocation | The last location to which the range was prefetched |
hipMemRangeAttributeCoherencyMode | Returns coherency mode hipMemRangeCoherencyMode for the range |
◆ hipMemRangeCoherencyMode
HIP Coherency Mode
◆ hiprtcJIT_option
enum hiprtcJIT_option |
hiprtc JIT option
Enumerator | |
---|---|
HIPRTC_JIT_MAX_REGISTERS | CUDA Only Maximum registers may be used in a thread, passed to compiler. |
HIPRTC_JIT_THREADS_PER_BLOCK | CUDA Only Number of threads per block. |
HIPRTC_JIT_WALL_TIME | CUDA Only Value for total wall clock time. |
HIPRTC_JIT_INFO_LOG_BUFFER | CUDA Only Pointer to the buffer with logged information. |
HIPRTC_JIT_INFO_LOG_BUFFER_SIZE_BYTES | CUDA Only Size of the buffer in bytes for logged info. |
HIPRTC_JIT_ERROR_LOG_BUFFER | CUDA Only Pointer to the buffer with logged error(s) |
HIPRTC_JIT_ERROR_LOG_BUFFER_SIZE_BYTES | CUDA Only Size of the buffer in bytes for logged error(s) |
HIPRTC_JIT_OPTIMIZATION_LEVEL | Value of optimization level for generated code, acceptable options -O0, -O1, -O2, -O3. |
HIPRTC_JIT_TARGET_FROM_HIPCONTEXT | CUDA Only The target context, which is the default. |
HIPRTC_JIT_TARGET | CUDA Only JIT target. |
HIPRTC_JIT_FALLBACK_STRATEGY | CUDA Only Fallback strategy. |
HIPRTC_JIT_GENERATE_DEBUG_INFO | CUDA Only Generate debug information. |
HIPRTC_JIT_LOG_VERBOSE | CUDA Only Generate verbose log. |
HIPRTC_JIT_GENERATE_LINE_INFO | CUDA Only Generate line number information. |
HIPRTC_JIT_CACHE_MODE | CUDA Only Set cache mode. |
HIPRTC_JIT_NEW_SM3X_OPT |
|
HIPRTC_JIT_FAST_COMPILE | CUDA Only Set fast compile. |
HIPRTC_JIT_GLOBAL_SYMBOL_NAMES | CUDA Only Array of device symbol names to be relocated to the host. |
HIPRTC_JIT_GLOBAL_SYMBOL_ADDRESS | CUDA Only Array of host addresses to be relocated to the device. |
HIPRTC_JIT_GLOBAL_SYMBOL_COUNT | CUDA Only Number of symbols. |
HIPRTC_JIT_LTO |
|
HIPRTC_JIT_FTZ |
|
HIPRTC_JIT_PREC_DIV |
|
HIPRTC_JIT_PREC_SQRT |
|
HIPRTC_JIT_FMA |
|
HIPRTC_JIT_NUM_OPTIONS | Number of options. |
HIPRTC_JIT_IR_TO_ISA_OPT_EXT | Linker options to be passed on to compiler |
HIPRTC_JIT_IR_TO_ISA_OPT_COUNT_EXT | Count of linker options to be passed on to compiler |
◆ hiprtcJITInputType
enum hiprtcJITInputType |
hiprtc JIT input type
◆ hiprtcResult
enum hiprtcResult |
hiprtc error code
◆ hipSharedMemConfig
enum hipSharedMemConfig |
- Warning
- On AMD devices and some Nvidia devices, these hints and controls are ignored.
◆ hipStreamCaptureMode
enum hipStreamCaptureMode |
◆ hipStreamCaptureStatus
◆ hipStreamUpdateCaptureDependenciesFlags
◆ hipUserObjectFlags
enum hipUserObjectFlags |