rocprofiler-sdk/fwd.h Source File

rocprofiler-sdk/fwd.h Source File#

Rocprofiler SDK Developer API: rocprofiler-sdk/fwd.h Source File
Rocprofiler SDK Developer API 0.6.0
ROCm Profiling API and tools
fwd.h
Go to the documentation of this file.
1// MIT License
2//
3// Copyright (c) 2024-2025 Advanced Micro Devices, Inc. All rights reserved.
4//
5// Permission is hereby granted, free of charge, to any person obtaining a copy
6// of this software and associated documentation files (the "Software"), to deal
7// in the Software without restriction, including without limitation the rights
8// to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
9// copies of the Software, and to permit persons to whom the Software is
10// furnished to do so, subject to the following conditions:
11//
12// The above copyright notice and this permission notice shall be included in all
13// copies or substantial portions of the Software.
14//
15// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21// SOFTWARE.
22
23#pragma once
24
26
27#include <stddef.h>
28#include <stdint.h>
29
30ROCPROFILER_EXTERN_C_INIT
31
32//--------------------------------------------------------------------------------------//
33//
34// ENUMERATIONS
35//
36//--------------------------------------------------------------------------------------//
37
38/**
39 * @defgroup BASIC_DATA_TYPES Basic data types
40 * @brief Basic data types and typedefs
41 *
42 * @{
43 */
44
45// TODO(aelwazir): Do we need to add a null (way) for every handle?
46// TODO(aelwazir): Remove API Data args from the doxygen?
47// TODO(aelwazir): Not everything in bin needs to be installed bin, use libexec or share?
48
49/**
50 * @brief Status codes.
51 */
52typedef enum // NOLINT(performance-enum-size)
53{
54 ROCPROFILER_STATUS_SUCCESS = 0, ///< No error occurred
55 ROCPROFILER_STATUS_ERROR, ///< Generalized error
56 ROCPROFILER_STATUS_ERROR_CONTEXT_NOT_FOUND, ///< No valid context for given context id
57 ROCPROFILER_STATUS_ERROR_BUFFER_NOT_FOUND, ///< No valid buffer for given buffer id
58 ROCPROFILER_STATUS_ERROR_KIND_NOT_FOUND, ///< Kind identifier is invalid
59 ROCPROFILER_STATUS_ERROR_OPERATION_NOT_FOUND, ///< Operation identifier is invalid for domain
60 ROCPROFILER_STATUS_ERROR_THREAD_NOT_FOUND, ///< No valid thread for given thread id
61 ROCPROFILER_STATUS_ERROR_AGENT_NOT_FOUND, ///< Agent identifier not found
62 ROCPROFILER_STATUS_ERROR_COUNTER_NOT_FOUND, ///< Counter identifier does not exist
63 ROCPROFILER_STATUS_ERROR_CONTEXT_ERROR, ///< Generalized context error
64 ROCPROFILER_STATUS_ERROR_CONTEXT_INVALID, ///< Context configuration is not valid
65 ROCPROFILER_STATUS_ERROR_CONTEXT_NOT_STARTED, ///< Context was not started (e.g., atomic swap
66 ///< into active array failed)
67 ROCPROFILER_STATUS_ERROR_CONTEXT_CONFLICT, ///< Context operation failed due to a conflict with
68 ///< another context
69 ROCPROFILER_STATUS_ERROR_CONTEXT_ID_NOT_ZERO, ///< Context ID is not initialized to zero
70 ROCPROFILER_STATUS_ERROR_BUFFER_BUSY, ///< buffer operation failed because it is currently busy
71 ///< handling another request (e.g. flushing)
72 ROCPROFILER_STATUS_ERROR_SERVICE_ALREADY_CONFIGURED, ///< service has already been configured
73 ///< in context
74 ROCPROFILER_STATUS_ERROR_CONFIGURATION_LOCKED, ///< Function call is not valid outside of
75 ///< rocprofiler configuration (i.e.
76 ///< function called post-initialization)
77 ROCPROFILER_STATUS_ERROR_NOT_IMPLEMENTED, ///< Function is not implemented
78 ROCPROFILER_STATUS_ERROR_INCOMPATIBLE_ABI, ///< Data structure provided by user is incompatible
79 ///< with current version of rocprofiler
80 ROCPROFILER_STATUS_ERROR_INVALID_ARGUMENT, ///< Function invoked with one or more invalid
81 ///< arguments
82 ROCPROFILER_STATUS_ERROR_METRIC_NOT_VALID_FOR_AGENT, ///< Invalid metric supplied to agent.
83 ROCPROFILER_STATUS_ERROR_FINALIZED, ///< invalid because rocprofiler has been finalized
84 ROCPROFILER_STATUS_ERROR_HSA_NOT_LOADED, ///< Call requires HSA to be loaded before performed
85 ROCPROFILER_STATUS_ERROR_DIM_NOT_FOUND, ///< Dimension is not found for counter
86 ROCPROFILER_STATUS_ERROR_PROFILE_COUNTER_NOT_FOUND, ///< Profile could not find counter for GPU
87 ///< agent
88 ROCPROFILER_STATUS_ERROR_AST_GENERATION_FAILED, ///< AST could not be generated correctly
90 ROCPROFILER_STATUS_ERROR_AQL_NO_EVENT_COORD, ///< Event coordinate was not found by AQL profile
91 ROCPROFILER_STATUS_ERROR_INCOMPATIBLE_KERNEL, ///< A service depends on a newer version of KFD
92 ///< (amdgpu kernel driver). Check logs for
93 ///< services that report incompatibility
94 ROCPROFILER_STATUS_ERROR_OUT_OF_RESOURCES, ///< The given resources are
95 ///< insufficient to complete operation
96 ROCPROFILER_STATUS_ERROR_PROFILE_NOT_FOUND, ///< Could not find the counter profile
97 ROCPROFILER_STATUS_ERROR_AGENT_DISPATCH_CONFLICT, ///< Cannot enable both agent and dispatch
98 ///< counting in the same context.
99 ROCPROFILER_STATUS_INTERNAL_NO_AGENT_CONTEXT, ///< No agent context found, may not be an error
101 ROCPROFILER_STATUS_ERROR_NO_PROFILE_QUEUE, ///< Profile queue creation failed
102 ROCPROFILER_STATUS_ERROR_NO_HARDWARE_COUNTERS, ///< No hardware counters were specified
103 ROCPROFILER_STATUS_ERROR_AGENT_MISMATCH, ///< Agent mismatch between profile and context.
104 ROCPROFILER_STATUS_ERROR_NOT_AVAILABLE, ///< The service is not available.
105 ///< Please refer to API functions that return this
106 ///< status code for more information.
107 ROCPROFILER_STATUS_ERROR_EXCEEDS_HW_LIMIT, ///< Exceeds hardware limits for collection.
108 ROCPROFILER_STATUS_ERROR_AGENT_ARCH_NOT_SUPPORTED, ///< Agent HW architecture not supported.
112
113/**
114 * @brief Buffer record categories. This enumeration type is encoded in @ref
115 * rocprofiler_record_header_t category field
116 */
125
126/**
127 * @brief Agent type.
128 */
129typedef enum // NOLINT(performance-enum-size)
130{
131 ROCPROFILER_AGENT_TYPE_NONE = 0, ///< Agent type is unknown
132 ROCPROFILER_AGENT_TYPE_CPU, ///< Agent type is a CPU
133 ROCPROFILER_AGENT_TYPE_GPU, ///< Agent type is a GPU
136
137/**
138 * @brief Service Callback Phase.
139 */
140typedef enum // NOLINT(performance-enum-size)
141{
142 ROCPROFILER_CALLBACK_PHASE_NONE = 0, ///< Callback has no phase
143 ROCPROFILER_CALLBACK_PHASE_ENTER, ///< Callback invoked prior to function execution
145 ROCPROFILER_CALLBACK_PHASE_ENTER, ///< Callback invoked prior to code object loading
146 ROCPROFILER_CALLBACK_PHASE_EXIT, ///< Callback invoked after function execution
148 ROCPROFILER_CALLBACK_PHASE_EXIT, ///< Callback invoked prior to code object unloading
151
152/**
153 * @brief Service Callback Tracing Kind. @see rocprofiler_configure_callback_tracing_service.
154 */
155typedef enum // NOLINT(performance-enum-size)
156{
158 ROCPROFILER_CALLBACK_TRACING_HSA_CORE_API, ///< @see ::rocprofiler_hsa_core_api_id_t
159 ROCPROFILER_CALLBACK_TRACING_HSA_AMD_EXT_API, ///< @see ::rocprofiler_hsa_amd_ext_api_id_t
160 ROCPROFILER_CALLBACK_TRACING_HSA_IMAGE_EXT_API, ///< @see ::rocprofiler_hsa_image_ext_api_id_t
162 ///< ::rocprofiler_hsa_finalize_ext_api_id_t
163 ROCPROFILER_CALLBACK_TRACING_HIP_RUNTIME_API, ///< @see ::rocprofiler_hip_runtime_api_id_t
164 ROCPROFILER_CALLBACK_TRACING_HIP_COMPILER_API, ///< @see ::rocprofiler_hip_compiler_api_id_t
165 ROCPROFILER_CALLBACK_TRACING_MARKER_CORE_API, ///< @see ::rocprofiler_marker_core_api_id_t
167 ///< ::rocprofiler_marker_control_api_id_t
168 ROCPROFILER_CALLBACK_TRACING_MARKER_NAME_API, ///< @see ::rocprofiler_marker_name_api_id_t
169 ROCPROFILER_CALLBACK_TRACING_CODE_OBJECT, ///< @see ::rocprofiler_code_object_operation_t
170 ROCPROFILER_CALLBACK_TRACING_SCRATCH_MEMORY, ///< @see ::rocprofiler_scratch_memory_operation_t
171 ROCPROFILER_CALLBACK_TRACING_KERNEL_DISPATCH, ///< Callbacks for kernel dispatches
172 ROCPROFILER_CALLBACK_TRACING_MEMORY_COPY, ///< @see ::rocprofiler_memory_copy_operation_t
174 ROCPROFILER_CALLBACK_TRACING_OMPT, ///< @see ::rocprofiler_ompt_operation_t
176 ///< ::rocprofiler_memory_allocation_operation_t
177 ROCPROFILER_CALLBACK_TRACING_RUNTIME_INITIALIZATION, ///< Callback notifying that a runtime
178 ///< library has been initialized
182
183/**
184 * @brief Service Buffer Tracing Kind. @see rocprofiler_configure_buffer_tracing_service.
185 */
186typedef enum // NOLINT(performance-enum-size)
187{
189 ROCPROFILER_BUFFER_TRACING_HSA_CORE_API, ///< @see ::rocprofiler_hsa_core_api_id_t
190 ROCPROFILER_BUFFER_TRACING_HSA_AMD_EXT_API, ///< @see ::rocprofiler_hsa_amd_ext_api_id_t
191 ROCPROFILER_BUFFER_TRACING_HSA_IMAGE_EXT_API, ///< @see ::rocprofiler_hsa_image_ext_api_id_t
193 ///< ::rocprofiler_hsa_finalize_ext_api_id_t
194 ROCPROFILER_BUFFER_TRACING_HIP_RUNTIME_API, ///< @see ::rocprofiler_hip_runtime_api_id_t
195 ROCPROFILER_BUFFER_TRACING_HIP_COMPILER_API, ///< @see ::rocprofiler_hip_compiler_api_id_t
196 ROCPROFILER_BUFFER_TRACING_MARKER_CORE_API, ///< @see ::rocprofiler_marker_core_api_id_t
197 ROCPROFILER_BUFFER_TRACING_MARKER_CONTROL_API, ///< @see ::rocprofiler_marker_control_api_id_t
198 ROCPROFILER_BUFFER_TRACING_MARKER_NAME_API, ///< @see ::rocprofiler_marker_name_api_id_t
199 ROCPROFILER_BUFFER_TRACING_MEMORY_COPY, ///< @see ::rocprofiler_memory_copy_operation_t
200 ROCPROFILER_BUFFER_TRACING_KERNEL_DISPATCH, ///< Buffer kernel dispatch info
201 ROCPROFILER_BUFFER_TRACING_PAGE_MIGRATION, ///< Buffer page migration info
202 ROCPROFILER_BUFFER_TRACING_SCRATCH_MEMORY, ///< Buffer scratch memory reclamation info
203 ROCPROFILER_BUFFER_TRACING_CORRELATION_ID_RETIREMENT, ///< Correlation ID is no longer in use
205 ROCPROFILER_BUFFER_TRACING_OMPT, ///< @see ::rocprofiler_ompt_operation_t
207 ///< ::rocprofiler_memory_allocation_operation_t
208 ROCPROFILER_BUFFER_TRACING_RUNTIME_INITIALIZATION, ///< Record indicating a runtime library has
209 ///< been initialized. @see
210 ///< ::rocprofiler_runtime_initialization_operation_t
214
215/**
216 * @brief ROCProfiler Code Object Tracer Operations.
217 */
218typedef enum // NOLINT(performance-enum-size)
219{
220 ROCPROFILER_CODE_OBJECT_NONE = 0, ///< Unknown code object operation
221 ROCPROFILER_CODE_OBJECT_LOAD, ///< Code object containing kernel symbols
226
227/**
228 * @brief Memory Copy Operations.
229 */
230typedef enum // NOLINT(performance-enum-size)
231{
232 ROCPROFILER_MEMORY_COPY_NONE = 0, ///< Unknown memory copy direction
233 ROCPROFILER_MEMORY_COPY_HOST_TO_HOST, ///< Memory copy from host to host
234 ROCPROFILER_MEMORY_COPY_HOST_TO_DEVICE, ///< Memory copy from host to device
235 ROCPROFILER_MEMORY_COPY_DEVICE_TO_HOST, ///< Memory copy from device to host
236 ROCPROFILER_MEMORY_COPY_DEVICE_TO_DEVICE, ///< Memory copy from device to device
239
240/**
241 * @brief Memory Allocation Operation.
242 */
243typedef enum // NOLINT(performance-enum-size)
244{
245 ROCPROFILER_MEMORY_ALLOCATION_NONE = 0, ///< Unknown memory allocation function
246 ROCPROFILER_MEMORY_ALLOCATION_ALLOCATE, ///< Allocate memory function
247 ROCPROFILER_MEMORY_ALLOCATION_VMEM_ALLOCATE, ///< Allocate vmem memory handle
248 ROCPROFILER_MEMORY_ALLOCATION_FREE, ///< Free memory function
249 ROCPROFILER_MEMORY_ALLOCATION_VMEM_FREE, ///< Release vmem memory handle
252
253/**
254 * @brief ROCProfiler Kernel Dispatch Tracing Operation Types.
255 */
256typedef enum // NOLINT(performance-enum-size)
257{
258 ROCPROFILER_KERNEL_DISPATCH_NONE = 0, ///< Unknown kernel dispatch operation
262
263 /// @var ROCPROFILER_KERNEL_DISPATCH_ENQUEUE
264 /// @brief Invoke callback prior to a kernel being enqueued and after the kernel has been
265 /// enqueued. When the phase is ::ROCPROFILER_CALLBACK_PHASE_ENTER, this is an opportunity to
266 /// push an external correlation id and/or modify the active contexts before a kernel is
267 /// launched. Any active contexts containing services related to a kernel dispatch (kernel
268 /// tracing, counter collection, etc.) will be captured after this callback and attached to the
269 /// kernel. These captured contexts will be considered "active" when the kernel completes even
270 /// if the context was stopped before the kernel completes -- this contract is designed to
271 /// ensure that tools do not have to delay stopping a context because of an async operation in
272 /// order to get the data they requested when the async operation was started. When the phase is
273 /// ::ROCPROFILER_CALLBACK_PHASE_EXIT, the active contexts for the kernel dispatch have been
274 /// captured and it is safe to disable those contexts without affecting the delivery of the
275 /// requested data when the kernel completes. It is important to note that, even if the context
276 /// associated with the kernel dispatch callback tracing service is disabled in between the
277 /// enter and exit phase, the exit phase callback is still delivered but that context will not
278 /// be captured when the kernel is enqueued and therefore will not provide a
279 /// ::ROCPROFILER_KERNEL_DISPATCH_COMPLETE callback. Furthermore, it should be
280 /// noted that if a tool encodes information into the `::rocprofiler_user_data_t` output
281 /// parameter in ::rocprofiler_callback_tracing_cb_t, that same value will be delivered in the
282 /// exit phase and in the ::ROCPROFILER_KERNEL_DISPATCH_COMPLETE callback. In
283 /// other words, any modifications to that user data value in the exit phase will not be
284 /// reflected in the ::ROCPROFILER_KERNEL_DISPATCH_COMPLETE callback because a
285 /// copy of that user data struct is attached to the kernel, not a reference to the user data
286 /// struct.
287 ///
288 /// @var ROCPROFILER_KERNEL_DISPATCH_COMPLETE
289 /// @brief Invoke callback after a kernel has completed and the HSA runtime has processed the
290 /// signal indicating that the kernel has completed. The latter half of this statement is
291 /// important. There is no guarantee that these callbacks are invoked in any order related to
292 /// when the kernels were dispatched, i.e. even if kernel A is launched and fully executed
293 /// before kernel B is launched, it is entirely possible that the HSA runtime ends up processing
294 /// the signal associated with kernel B before processing the signal associated with kernel A --
295 /// resulting in rocprofiler-sdk invoking this operation callback for kernel B before invoking
296 /// the callback for kernel A.
298
299/**
300 * @brief PC Sampling Method.
301 */
302typedef enum // NOLINT(performance-enum-size)
303{
304 ROCPROFILER_PC_SAMPLING_METHOD_NONE = 0, ///< Unknown sampling type
305 ROCPROFILER_PC_SAMPLING_METHOD_STOCHASTIC, ///< Stochastic sampling (MI300+)
306 ROCPROFILER_PC_SAMPLING_METHOD_HOST_TRAP, ///< Interval sampling (MI200+)
309
310/**
311 * @brief PC Sampling Unit.
312 */
313typedef enum // NOLINT(performance-enum-size)
314{
315 ROCPROFILER_PC_SAMPLING_UNIT_NONE = 0, ///< Sample interval has unspecified units
316 ROCPROFILER_PC_SAMPLING_UNIT_INSTRUCTIONS, ///< Sample interval is in instructions
317 ROCPROFILER_PC_SAMPLING_UNIT_CYCLES, ///< Sample interval is in cycles
318 ROCPROFILER_PC_SAMPLING_UNIT_TIME, ///< Sample interval is in nanoseconds
321
322/**
323 * @brief Actions when Buffer is full.
324 */
325typedef enum // NOLINT(performance-enum-size)
326{
327 ROCPROFILER_BUFFER_POLICY_NONE = 0, ///< No policy has been set
328 ROCPROFILER_BUFFER_POLICY_DISCARD, ///< Drop records when buffer is full
329 ROCPROFILER_BUFFER_POLICY_LOSSLESS, ///< Block when buffer is full
332
333/**
334 * @brief Page migration event.
335 */
349
350/**
351 * @brief Scratch event kind
352 */
353typedef enum
354{
355 ROCPROFILER_SCRATCH_MEMORY_NONE = 0, ///< Unknown scratch operation
356 ROCPROFILER_SCRATCH_MEMORY_ALLOC, ///< Scratch memory allocation event
357 ROCPROFILER_SCRATCH_MEMORY_FREE, ///< Scratch memory free event
358 ROCPROFILER_SCRATCH_MEMORY_ASYNC_RECLAIM, ///< Scratch memory asynchronously reclaimed
361
362/**
363 * @brief Enumeration for specifying runtime libraries supported by rocprofiler. This enumeration is
364 * used for thread creation callbacks. @see INTERNAL_THREADING.
365 */
376
377/**
378 * @brief Enumeration for specifying intercept tables supported by rocprofiler. This enumeration is
379 * used for intercept tables. @see INTERCEPT_TABLE.
380 */
393
394/**
395 * @brief ROCProfiler Runtime Initialization Tracer Operations.
396 */
397typedef enum // NOLINT(performance-enum-size)
398{
399 ROCPROFILER_RUNTIME_INITIALIZATION_NONE = 0, ///< Unknown runtime initialization
400 ROCPROFILER_RUNTIME_INITIALIZATION_HSA, ///< Application loaded HSA runtime
401 ROCPROFILER_RUNTIME_INITIALIZATION_HIP, ///< Application loaded HIP runtime
402 ROCPROFILER_RUNTIME_INITIALIZATION_MARKER, ///< Application loaded Marker (ROCTx) runtime
403 ROCPROFILER_RUNTIME_INITIALIZATION_RCCL, ///< Application loaded RCCL runtime
404 ROCPROFILER_RUNTIME_INITIALIZATION_ROCDECODE, ///< Application loaded rocDecode runtime
407
408/**
409 * @brief Enumeration for specifying the counter info struct version you want.
410 */
417
418/**
419 * @brief Enumeration for distinguishing different buffer record kinds within the
420 * ::ROCPROFILER_BUFFER_CATEGORY_COUNTERS category
421 */
422typedef enum
423{
425 ROCPROFILER_COUNTER_RECORD_PROFILE_COUNTING_DISPATCH_HEADER, ///< ::rocprofiler_dispatch_counting_service_record_t
428
429 /// @var ROCPROFILER_COUNTER_RECORD_PROFILE_COUNTING_DISPATCH_HEADER
430 /// @brief Indicates the payload type is of type
431 /// ::rocprofiler_dispatch_counting_service_record_t
433
434/**
435 * @brief Enumeration of flags that can be used with some counter api calls
436 */
437typedef enum
438{
440 ROCPROFILER_COUNTER_FLAG_ASYNC, ///< Do not wait for completion before returning.
441 ROCPROFILER_COUNTER_FLAG_APPEND_DEFINITION, ///< Append the counter definition to the system
442 ///< provided counter definition file.
445
446/**
447 * @brief Enumeration for distinguishing different buffer record kinds within the
448 * ::ROCPROFILER_BUFFER_CATEGORY_PC_SAMPLING category
449 */
457
458//--------------------------------------------------------------------------------------//
459//
460// ALIASES
461//
462//--------------------------------------------------------------------------------------//
463
464/**
465 * @brief ROCProfiler Timestamp, stored as an unsigned 64-bit integer.
466 */
467typedef uint64_t rocprofiler_timestamp_t;
468
469/**
470 * @brief Thread ID (unsigned 64-bit). Value will be equivalent to `syscall(__NR_gettid)`
471 */
472typedef uint64_t rocprofiler_thread_id_t;
473
474/**
475 * @brief Tracing Operation ID. Depending on the kind, operations can be determined.
476 * If the value is equal to zero that means all operations will be considered
477 * for tracing. Detailed API tracing operations can be found at associated header file
478 * for that particular operation. i.e: For ROCProfiler enumeration of HSA AMD Extended API tracing
479 * operations, look at source/include/rocprofiler-sdk/hsa/amd_ext_api_id.h
480 */
482
483/**
484 * @brief Kernel identifier type, stored as an unsigned 64-bit integer.
485 *
486 */
487typedef uint64_t rocprofiler_kernel_id_t;
488
489// /**
490// * @brief Sequence identifier type
491// *
492// */
494
495/**
496 * @brief Unique record id encoding both the counter
497 * and dimensional values (positions) for the record.
498 */
500
501/**
502 * @brief A dimension for counter instances. Some example
503 * dimensions include XCC, SM (Shader), etc. This
504 * value represents the dimension being described
505 * or queried about.
506 */
508
509//--------------------------------------------------------------------------------------//
510//
511// UNIONS
512//
513//--------------------------------------------------------------------------------------//
514
515/**
516 * @brief User-assignable data type
517 *
518 */
520{
521 uint64_t value; ///< usage example: set to process id, thread id, etc.
522 void* ptr; ///< usage example: set to address of data allocation
524
525/**
526 * @brief Stores memory address for profiling
527 *
528 */
530{
531 uint64_t handle; ///< usage example: store address in uint64_t format
532 void* ptr; ///< usage example: generic form of address
534
535/**
536 * @brief Stores UUID for devices.
537 *
538 */
540{
541 uint64_t value; ///< numerical value
542 void* bytes; ///< uuid in hexadecimal
544
545//--------------------------------------------------------------------------------------//
546//
547// STRUCTS
548//
549//--------------------------------------------------------------------------------------//
550
551/**
552 * @brief Context ID.
553 */
554typedef struct
555{
556 uint64_t handle;
558
559/**
560 * @brief Queue ID.
561 */
562typedef struct
563{
564 uint64_t handle;
566
567/**
568 * @brief ROCProfiler Record Correlation ID.
569 */
575
576/**
577 * @brief The NULL value of an internal correlation ID.
578 */
579#define ROCPROFILER_CORRELATION_ID_INTERNAL_NONE ROCPROFILER_UINT64_C(0)
580
581/**
582 * @struct rocprofiler_buffer_id_t
583 * @brief Buffer ID.
584 */
585typedef struct
586{
587 uint64_t handle;
589
590/**
591 * @brief Agent Identifier
592 */
593typedef struct
594{
595 uint64_t handle;
597
598/**
599 * @brief Counter ID.
600 */
601typedef struct
602{
603 uint64_t handle;
605
606/**
607 * @brief Profile Configurations
608 * @see rocprofiler_create_profile_config for how to create.
609 */
610typedef struct
611{
612 uint64_t handle; // Opaque handle
614
615/**
616 * @brief Multi-dimensional struct of data used to describe GPU workgroup and grid sizes
617 */
618typedef struct rocprofiler_dim3_t
619{
620 uint32_t x;
621 uint32_t y;
622 uint32_t z;
624
625/**
626 * @brief Tracing record
627 *
628 */
639
640/**
641 * @brief Generic record with type identifier(s) and a pointer to data. This data type is used with
642 * buffered data.
643 *
644 * @code{.cpp}
645 * void
646 * tool_tracing_callback(rocprofiler_record_header_t** headers,
647 * size_t num_headers)
648 * {
649 * for(size_t i = 0; i < num_headers; ++i)
650 * {
651 * rocprofiler_record_header_t* header = headers[i];
652 *
653 * if(header->category == ROCPROFILER_BUFFER_CATEGORY_TRACING &&
654 * header->kind == ROCPROFILER_BUFFER_TRACING_HSA_CORE_API)
655 * {
656 * // cast to rocprofiler_buffer_tracing_hsa_api_record_t which
657 * // is type associated with this category + kind
658 * auto* record =
659 * static_cast<rocprofiler_buffer_tracing_hsa_api_record_t*>(header->payload);
660 *
661 * // trivial test
662 * assert(record->start_timestamp <= record->end_timestamp);
663 * }
664 * }
665 * }
666 *
667 * @endcode
668 */
669typedef struct
670{
671 union
672 {
673 struct
674 {
675 uint32_t category; ///< rocprofiler_buffer_category_t
676 uint32_t kind; ///< domain
677 };
678 uint64_t hash; ///< generic identifier. You can compute this via: `uint64_t hash = category
679 ///< | ((uint64_t)(kind) << 32)`, e.g.
680 };
681 void* payload;
683
684/**
685 * @brief Function for computing the unsigned 64-bit hash value in @ref rocprofiler_record_header_t
686 * from a category and kind (two unsigned 32-bit values): category fills bits 0-31, kind bits 32-63
687 *
688 * @param [in] category a value from @ref rocprofiler_buffer_category_t
689 * @param [in] kind depending on the category, this is the domain value, e.g., @ref
690 * rocprofiler_buffer_tracing_kind_t value
691 * @return uint64_t hash value equal to `category | ((uint64_t)(kind) << 32)`
692 */
693static inline uint64_t
694rocprofiler_record_header_compute_hash(uint32_t category, uint32_t kind)
695{
696 uint64_t value = category; // low 32 bits hold the category
697 value |= ((uint64_t)(kind)) << 32; // widen to 64 bits before shifting so kind lands in the high half
698 return value;
699}
700
701/**
702 * @brief ROCProfiler kernel dispatch information
703 *
704 */
706{
707 uint64_t size; ///< Size of this struct (minus reserved padding)
708 rocprofiler_agent_id_t agent_id; ///< Agent ID where kernel is launched
709 rocprofiler_queue_id_t queue_id; ///< Queue ID where kernel packet is enqueued
710 rocprofiler_kernel_id_t kernel_id; ///< Kernel identifier
711 rocprofiler_dispatch_id_t dispatch_id; ///< unique id for each dispatch
712 uint32_t private_segment_size; ///< runtime private memory segment size
713 uint32_t group_segment_size; ///< runtime group memory segment size
714 rocprofiler_dim3_t workgroup_size; ///< runtime workgroup size (grid * threads)
715 rocprofiler_dim3_t grid_size; ///< runtime grid size
716 uint8_t reserved_padding[56]; // reserved for extensions w/o ABI break
718
719/**
720 * @brief Details for the dimension, including its size, for a counter record.
721 */
722typedef struct
723{
724 const char* name;
727
728 /// @var id
729 /// @brief Id for this dimension used by @ref rocprofiler_query_record_dimension_position
731
732/**
733 * @brief ROCProfiler Profile Counting Counter Record per instance.
734 */
735typedef struct
736{
737 rocprofiler_counter_instance_id_t id; ///< counter identifier
738 double counter_value; ///< counter value
742
743 /// @var dispatch_id
744 /// @brief A value greater than zero indicates that this counter record is associated with a
745 /// specific dispatch.
746 ///
747 /// This value can be mapped to a dispatch via the `dispatch_info` field (@see
748 /// ::rocprofiler_kernel_dispatch_info_t) of a ::rocprofiler_dispatch_counting_service_data_t
749 /// instance (provided during callback for profile config) or a
750 /// ::rocprofiler_dispatch_counting_service_record_t record (which will be inserted into the
751 /// buffer prior to the associated ::rocprofiler_record_counter_t records).
753
754/**
755 * @brief Counter info struct version 0
756 */
757typedef struct
758{
759 rocprofiler_counter_id_t id; ///< Id of this counter
760 const char* name; ///< Name of the counter
761 const char* description; ///< Description of the counter
762 const char* block; ///< Block of the counter (non-derived only)
763 const char* expression; ///< Counter expression (derived counters only)
764 uint8_t is_constant : 1; ///< If this counter is HW constant
765 uint8_t is_derived : 1; ///< If this counter is a derived counter
767
768/**
769 * @brief ROCProfiler SPM Record.
770 *
771 */
772typedef struct
773{
774 /**
775 * Counters, including identifiers to get counter information and Counters
776 * values
777 */
781
782/** @} */
783
784ROCPROFILER_EXTERN_C_FINI
785
787 static_assert(sizeof(rocprofiler_kernel_dispatch_info_t) == 128,
788 "Increasing the size of the kernel dispatch info is not permitted");)
#define ROCPROFILER_CXX_CODE(...)
Definition defines.h:132
void * ptr
usage example: set to address of data allocation
Definition fwd.h:522
const char * name
Name of the counter.
Definition fwd.h:760
const char * block
Block of the counter (non-derived only)
Definition fwd.h:762
rocprofiler_dim3_t grid_size
runtime grid size
Definition fwd.h:715
uint64_t handle
usage example: store address in uint64_t format
Definition fwd.h:531
rocprofiler_user_data_t external
Definition fwd.h:573
rocprofiler_counter_dimension_id_t id
Id for this dimension used by rocprofiler_query_record_dimension_position.
Definition fwd.h:726
uint64_t value
usage example: set to process id, thread id, etc.
Definition fwd.h:521
uint32_t z
Definition fwd.h:622
uint32_t group_segment_size
runtime group memory segment size
Definition fwd.h:713
void * ptr
usage example: generic form of address
Definition fwd.h:532
rocprofiler_user_data_t user_data
Definition fwd.h:740
rocprofiler_agent_id_t agent_id
Agent ID where kernel is launched.
Definition fwd.h:708
uint32_t y
Definition fwd.h:621
uint32_t private_segment_size
runtime private memory segment size
Definition fwd.h:712
rocprofiler_callback_phase_t phase
Definition fwd.h:636
uint64_t handle
Definition fwd.h:595
rocprofiler_counter_id_t id
Id of this counter.
Definition fwd.h:759
rocprofiler_record_counter_t * counters
Definition fwd.h:778
rocprofiler_dispatch_id_t dispatch_id
A value greater than zero indicates that this counter record is associated with a specific dispatch.
Definition fwd.h:739
rocprofiler_context_id_t context_id
Definition fwd.h:631
const char * description
Description of the counter.
Definition fwd.h:761
rocprofiler_callback_tracing_kind_t kind
Definition fwd.h:634
uint8_t is_constant
If this counter is HW constant.
Definition fwd.h:764
uint64_t handle
Definition fwd.h:564
uint64_t value
numerical value
Definition fwd.h:541
rocprofiler_dispatch_id_t dispatch_id
unique id for each dispatch
Definition fwd.h:711
rocprofiler_thread_id_t thread_id
Definition fwd.h:632
rocprofiler_kernel_id_t kernel_id
Kernel identifier.
Definition fwd.h:710
rocprofiler_tracing_operation_t operation
Definition fwd.h:635
rocprofiler_counter_instance_id_t id
counter identifier
Definition fwd.h:737
const char * expression
Counter expression (derived counters only)
Definition fwd.h:763
void * bytes
uuid in hexadecimal
Definition fwd.h:542
uint64_t size
Size of this struct (minus reserved padding)
Definition fwd.h:707
double counter_value
counter value
Definition fwd.h:738
uint64_t counters_count
Definition fwd.h:779
rocprofiler_correlation_id_t correlation_id
Definition fwd.h:633
uint32_t x
Definition fwd.h:620
rocprofiler_dim3_t workgroup_size
runtime workgroup size (grid * threads)
Definition fwd.h:714
uint8_t is_derived
If this counter is a derived counter.
Definition fwd.h:765
rocprofiler_queue_id_t queue_id
Queue ID where kernel packet is enqueued.
Definition fwd.h:709
rocprofiler_agent_id_t agent_id
Definition fwd.h:741
rocprofiler_pc_sampling_method_t
PC Sampling Method.
Definition fwd.h:303
rocprofiler_code_object_operation_t
ROCProfiler Code Object Tracer Operations.
Definition fwd.h:219
int32_t rocprofiler_tracing_operation_t
Tracing Operation ID. Depending on the kind, operations can be determined. If the value is equal to z...
Definition fwd.h:481
rocprofiler_buffer_policy_t
Actions when Buffer is full.
Definition fwd.h:326
rocprofiler_scratch_memory_operation_t
Scratch event kind.
Definition fwd.h:354
uint64_t rocprofiler_counter_dimension_id_t
A dimension for counter instances. Some example dimensions include XCC, SM (Shader),...
Definition fwd.h:507
rocprofiler_page_migration_operation_t
Page migration event.
Definition fwd.h:337
rocprofiler_memory_copy_operation_t
Memory Copy Operations.
Definition fwd.h:231
uint64_t rocprofiler_counter_instance_id_t
Unique record id encoding both the counter and dimensional values (positions) for the record.
Definition fwd.h:499
rocprofiler_runtime_initialization_operation_t
ROCProfiler Runtime Initialization Tracer Operations.
Definition fwd.h:398
rocprofiler_memory_allocation_operation_t
Memory Allocation Operation.
Definition fwd.h:244
rocprofiler_counter_record_kind_t
Enumeration for distinguishing different buffer record kinds within the ROCPROFILER_BUFFER_CATEGORY_C...
Definition fwd.h:423
rocprofiler_pc_sampling_unit_t
PC Sampling Unit.
Definition fwd.h:314
rocprofiler_intercept_table_t
Enumeration for specifying intercept tables supported by rocprofiler. This enumeration is used for in...
Definition fwd.h:382
rocprofiler_status_t
Status codes.
Definition fwd.h:53
uint64_t rocprofiler_dispatch_id_t
Definition fwd.h:493
rocprofiler_callback_phase_t
Service Callback Phase.
Definition fwd.h:141
uint64_t rocprofiler_kernel_id_t
Kernel identifier type.
Definition fwd.h:487
uint64_t rocprofiler_thread_id_t
Thread ID. Value will be equivalent to syscall(__NR_gettid)
Definition fwd.h:472
rocprofiler_buffer_tracing_kind_t
Service Buffer Tracing Kind.
Definition fwd.h:187
rocprofiler_pc_sampling_record_kind_t
Enumeration for distinguishing different buffer record kinds within the ROCPROFILER_BUFFER_CATEGORY_P...
Definition fwd.h:451
rocprofiler_kernel_dispatch_operation_t
ROCProfiler Kernel Dispatch Tracing Operation Types.
Definition fwd.h:257
rocprofiler_runtime_library_t
Enumeration for specifying runtime libraries supported by rocprofiler. This enumeration is used for t...
Definition fwd.h:367
uint64_t rocprofiler_timestamp_t
ROCProfiler Timestamp.
Definition fwd.h:467
rocprofiler_buffer_category_t
Buffer record categories. This enumeration type is encoded in rocprofiler_record_header_t category fi...
Definition fwd.h:118
rocprofiler_callback_tracing_kind_t
Service Callback Tracing Kind.
Definition fwd.h:156
rocprofiler_agent_type_t
Agent type.
Definition fwd.h:130
rocprofiler_counter_info_version_id_t
Enumeration for specifying the counter info struct version you want.
Definition fwd.h:412
rocprofiler_counter_flag_t
Enumeration of flags that can be used with some counter api calls.
Definition fwd.h:438
@ ROCPROFILER_PC_SAMPLING_METHOD_STOCHASTIC
Stochastic sampling (MI300+)
Definition fwd.h:305
@ ROCPROFILER_PC_SAMPLING_METHOD_HOST_TRAP
Interval sampling (MI200+)
Definition fwd.h:306
@ ROCPROFILER_PC_SAMPLING_METHOD_LAST
Definition fwd.h:307
@ ROCPROFILER_PC_SAMPLING_METHOD_NONE
Unknown sampling type.
Definition fwd.h:304
@ ROCPROFILER_CODE_OBJECT_HOST_KERNEL_SYMBOL_REGISTER
Kernel symbols - Host.
Definition fwd.h:223
@ ROCPROFILER_CODE_OBJECT_DEVICE_KERNEL_SYMBOL_REGISTER
Kernel symbols - Device.
Definition fwd.h:222
@ ROCPROFILER_CODE_OBJECT_LAST
Definition fwd.h:224
@ ROCPROFILER_CODE_OBJECT_NONE
Unknown code object operation.
Definition fwd.h:220
@ ROCPROFILER_CODE_OBJECT_LOAD
Code object containing kernel symbols.
Definition fwd.h:221
@ ROCPROFILER_BUFFER_POLICY_DISCARD
Drop records when buffer is full.
Definition fwd.h:328
@ ROCPROFILER_BUFFER_POLICY_NONE
No policy has been set.
Definition fwd.h:327
@ ROCPROFILER_BUFFER_POLICY_LOSSLESS
Block when buffer is full.
Definition fwd.h:329
@ ROCPROFILER_BUFFER_POLICY_LAST
Definition fwd.h:330
@ ROCPROFILER_SCRATCH_MEMORY_ALLOC
Scratch memory allocation event.
Definition fwd.h:356
@ ROCPROFILER_SCRATCH_MEMORY_FREE
Scratch memory free event.
Definition fwd.h:357
@ ROCPROFILER_SCRATCH_MEMORY_ASYNC_RECLAIM
Scratch memory asynchronously reclaimed.
Definition fwd.h:358
@ ROCPROFILER_SCRATCH_MEMORY_LAST
Definition fwd.h:359
@ ROCPROFILER_SCRATCH_MEMORY_NONE
Unknown scratch operation.
Definition fwd.h:355
@ ROCPROFILER_PAGE_MIGRATION_NONE
Unknown event.
Definition fwd.h:338
@ ROCPROFILER_PAGE_MIGRATION_LAST
Definition fwd.h:347
@ ROCPROFILER_PAGE_MIGRATION_PAGE_FAULT_START
Definition fwd.h:341
@ ROCPROFILER_PAGE_MIGRATION_PAGE_FAULT_END
Definition fwd.h:342
@ ROCPROFILER_PAGE_MIGRATION_UNMAP_FROM_GPU
Definition fwd.h:345
@ ROCPROFILER_PAGE_MIGRATION_QUEUE_EVICTION
Definition fwd.h:343
@ ROCPROFILER_PAGE_MIGRATION_PAGE_MIGRATE_END
Definition fwd.h:340
@ ROCPROFILER_PAGE_MIGRATION_PAGE_MIGRATE_START
Definition fwd.h:339
@ ROCPROFILER_PAGE_MIGRATION_DROPPED_EVENT
Definition fwd.h:346
@ ROCPROFILER_PAGE_MIGRATION_QUEUE_RESTORE
Definition fwd.h:344
@ ROCPROFILER_MEMORY_COPY_LAST
Definition fwd.h:237
@ ROCPROFILER_MEMORY_COPY_DEVICE_TO_DEVICE
Memory copy from device to device.
Definition fwd.h:236
@ ROCPROFILER_MEMORY_COPY_HOST_TO_HOST
Memory copy from host to host.
Definition fwd.h:233
@ ROCPROFILER_MEMORY_COPY_DEVICE_TO_HOST
Memory copy from device to host.
Definition fwd.h:235
@ ROCPROFILER_MEMORY_COPY_NONE
Unknown memory copy direction.
Definition fwd.h:232
@ ROCPROFILER_MEMORY_COPY_HOST_TO_DEVICE
Memory copy from host to device.
Definition fwd.h:234
@ ROCPROFILER_RUNTIME_INITIALIZATION_LAST
Definition fwd.h:405
@ ROCPROFILER_RUNTIME_INITIALIZATION_NONE
Unknown runtime initialization.
Definition fwd.h:399
@ ROCPROFILER_RUNTIME_INITIALIZATION_ROCDECODE
Application loaded rocDecode runtime.
Definition fwd.h:404
@ ROCPROFILER_RUNTIME_INITIALIZATION_HIP
Application loaded HIP runtime.
Definition fwd.h:401
@ ROCPROFILER_RUNTIME_INITIALIZATION_MARKER
Application loaded Marker (ROCTx) runtime.
Definition fwd.h:402
@ ROCPROFILER_RUNTIME_INITIALIZATION_RCCL
Application loaded RCCL runtime.
Definition fwd.h:403
@ ROCPROFILER_RUNTIME_INITIALIZATION_HSA
Application loaded HSA runtime.
Definition fwd.h:400
@ ROCPROFILER_MEMORY_ALLOCATION_NONE
Unknown memory allocation function.
Definition fwd.h:245
@ ROCPROFILER_MEMORY_ALLOCATION_ALLOCATE
Allocate memory function.
Definition fwd.h:246
@ ROCPROFILER_MEMORY_ALLOCATION_FREE
Free memory function.
Definition fwd.h:248
@ ROCPROFILER_MEMORY_ALLOCATION_VMEM_FREE
Release vmem memory handle.
Definition fwd.h:249
@ ROCPROFILER_MEMORY_ALLOCATION_VMEM_ALLOCATE
Allocate vmem memory handle.
Definition fwd.h:247
@ ROCPROFILER_MEMORY_ALLOCATION_LAST
Definition fwd.h:250
@ ROCPROFILER_COUNTER_RECORD_PROFILE_COUNTING_DISPATCH_HEADER
rocprofiler_dispatch_counting_service_record_t
Definition fwd.h:425
@ ROCPROFILER_COUNTER_RECORD_VALUE
Definition fwd.h:426
@ ROCPROFILER_COUNTER_RECORD_LAST
Definition fwd.h:427
@ ROCPROFILER_COUNTER_RECORD_NONE
Definition fwd.h:424
@ ROCPROFILER_PC_SAMPLING_UNIT_LAST
Definition fwd.h:319
@ ROCPROFILER_PC_SAMPLING_UNIT_TIME
Sample interval is in nanoseconds.
Definition fwd.h:318
@ ROCPROFILER_PC_SAMPLING_UNIT_NONE
Sample interval has unspecified units.
Definition fwd.h:315
@ ROCPROFILER_PC_SAMPLING_UNIT_INSTRUCTIONS
Sample interval is in instructions.
Definition fwd.h:316
@ ROCPROFILER_PC_SAMPLING_UNIT_CYCLES
Sample interval is in cycles.
Definition fwd.h:317
@ ROCPROFILER_MARKER_NAME_TABLE
Definition fwd.h:388
@ ROCPROFILER_MARKER_CONTROL_TABLE
Definition fwd.h:387
@ ROCPROFILER_RCCL_TABLE
Definition fwd.h:389
@ ROCPROFILER_HIP_COMPILER_TABLE
Definition fwd.h:385
@ ROCPROFILER_MARKER_CORE_TABLE
Definition fwd.h:386
@ ROCPROFILER_TABLE_LAST
Definition fwd.h:391
@ ROCPROFILER_HSA_TABLE
Definition fwd.h:383
@ ROCPROFILER_ROCDECODE_TABLE
Definition fwd.h:390
@ ROCPROFILER_HIP_RUNTIME_TABLE
Definition fwd.h:384
@ ROCPROFILER_STATUS_ERROR_FINALIZED
invalid because rocprofiler has been finalized
Definition fwd.h:83
@ ROCPROFILER_STATUS_ERROR_CONTEXT_NOT_STARTED
Context was not started (e.g., atomic swap into active array failed)
Definition fwd.h:65
@ ROCPROFILER_STATUS_ERROR_INVALID_ARGUMENT
Function invoked with one or more invalid arguments.
Definition fwd.h:80
@ ROCPROFILER_STATUS_ERROR_NO_PROFILE_QUEUE
Profile queue creation failed.
Definition fwd.h:101
@ ROCPROFILER_STATUS_ERROR_CONTEXT_ERROR
Generalized context error.
Definition fwd.h:63
@ ROCPROFILER_STATUS_ERROR_CONFIGURATION_LOCKED
Function call is not valid outside of rocprofiler configuration (i.e. function called post-initializa...
Definition fwd.h:74
@ ROCPROFILER_STATUS_ERROR_BUFFER_NOT_FOUND
No valid buffer for given buffer id.
Definition fwd.h:57
@ ROCPROFILER_STATUS_ERROR_PROFILE_NOT_FOUND
Could not find the counter profile.
Definition fwd.h:96
@ ROCPROFILER_STATUS_ERROR_COUNTER_NOT_FOUND
Counter identifier does not exist.
Definition fwd.h:62
@ ROCPROFILER_STATUS_ERROR_THREAD_NOT_FOUND
No valid thread for given thread id.
Definition fwd.h:60
@ ROCPROFILER_STATUS_ERROR_CONTEXT_CONFLICT
Context operation failed due to a conflict with another context.
Definition fwd.h:67
@ ROCPROFILER_STATUS_ERROR_SERVICE_ALREADY_CONFIGURED
service has already been configured in context
Definition fwd.h:72
@ ROCPROFILER_STATUS_ERROR_NOT_IMPLEMENTED
Function is not implemented.
Definition fwd.h:77
@ ROCPROFILER_STATUS_ERROR_AGENT_MISMATCH
Agent mismatch between profile and context.
Definition fwd.h:103
@ ROCPROFILER_STATUS_ERROR_PERMISSION_DENIED
Permission denied.
Definition fwd.h:109
@ ROCPROFILER_STATUS_ERROR_AGENT_DISPATCH_CONFLICT
Cannot enable both agent and dispatch counting in the same context.
Definition fwd.h:97
@ ROCPROFILER_STATUS_ERROR_OPERATION_NOT_FOUND
Operation identifier is invalid for domain.
Definition fwd.h:59
@ ROCPROFILER_STATUS_ERROR_AQL_NO_EVENT_COORD
Event coordinate was not found by AQL profile.
Definition fwd.h:90
@ ROCPROFILER_STATUS_ERROR_NOT_AVAILABLE
The service is not available. Please refer to API functions that return this status code for more inf...
Definition fwd.h:104
@ ROCPROFILER_STATUS_ERROR_SAMPLE_RATE_EXCEEDED
Sample rate exceeded.
Definition fwd.h:100
@ ROCPROFILER_STATUS_ERROR_CONTEXT_INVALID
Context configuration is not valid.
Definition fwd.h:64
@ ROCPROFILER_STATUS_ERROR_OUT_OF_RESOURCES
The given resources are insufficient to complete operation.
Definition fwd.h:94
@ ROCPROFILER_STATUS_LAST
Definition fwd.h:110
@ ROCPROFILER_STATUS_ERROR_AGENT_NOT_FOUND
Agent identifier not found.
Definition fwd.h:61
@ ROCPROFILER_STATUS_ERROR
Generalized error.
Definition fwd.h:55
@ ROCPROFILER_STATUS_ERROR_EXCEEDS_HW_LIMIT
Exceeds hardware limits for collection.
Definition fwd.h:107
@ ROCPROFILER_STATUS_ERROR_CONTEXT_NOT_FOUND
No valid context for given context id.
Definition fwd.h:56
@ ROCPROFILER_STATUS_ERROR_KIND_NOT_FOUND
Kind identifier is invalid.
Definition fwd.h:58
@ ROCPROFILER_STATUS_INTERNAL_NO_AGENT_CONTEXT
No agent context found, may not be an error.
Definition fwd.h:99
@ ROCPROFILER_STATUS_ERROR_AST_GENERATION_FAILED
AST could not be generated correctly.
Definition fwd.h:88
@ ROCPROFILER_STATUS_ERROR_INCOMPATIBLE_KERNEL
A service depends on a newer version of KFD (amdgpu kernel driver). Check logs for service that repor...
Definition fwd.h:91
@ ROCPROFILER_STATUS_ERROR_PROFILE_COUNTER_NOT_FOUND
Profile could not find counter for GPU agent.
Definition fwd.h:86
@ ROCPROFILER_STATUS_ERROR_AGENT_ARCH_NOT_SUPPORTED
Agent HW architecture not supported.
Definition fwd.h:108
@ ROCPROFILER_STATUS_ERROR_DIM_NOT_FOUND
Dimension is not found for counter.
Definition fwd.h:85
@ ROCPROFILER_STATUS_ERROR_METRIC_NOT_VALID_FOR_AGENT
Invalid metric supplied to agent.
Definition fwd.h:82
@ ROCPROFILER_STATUS_ERROR_BUFFER_BUSY
buffer operation failed because it is currently busy handling another request (e.g. flushing)
Definition fwd.h:70
@ ROCPROFILER_STATUS_SUCCESS
No error occurred.
Definition fwd.h:54
@ ROCPROFILER_STATUS_ERROR_INCOMPATIBLE_ABI
Data structure provided by user is incompatible with current version of rocprofiler.
Definition fwd.h:78
@ ROCPROFILER_STATUS_ERROR_CONTEXT_ID_NOT_ZERO
Context ID is not initialized to zero.
Definition fwd.h:69
@ ROCPROFILER_STATUS_ERROR_NO_HARDWARE_COUNTERS
No hardware counters were specified.
Definition fwd.h:102
@ ROCPROFILER_STATUS_ERROR_AST_NOT_FOUND
AST was not found.
Definition fwd.h:89
@ ROCPROFILER_STATUS_ERROR_HSA_NOT_LOADED
Call requires HSA to be loaded before it is performed.
Definition fwd.h:84
@ ROCPROFILER_CALLBACK_PHASE_NONE
Callback has no phase.
Definition fwd.h:142
@ ROCPROFILER_CALLBACK_PHASE_UNLOAD
Callback invoked prior to code object unloading.
Definition fwd.h:147
@ ROCPROFILER_CALLBACK_PHASE_EXIT
Callback invoked after function execution.
Definition fwd.h:146
@ ROCPROFILER_CALLBACK_PHASE_ENTER
Callback invoked prior to function execution.
Definition fwd.h:143
@ ROCPROFILER_CALLBACK_PHASE_LAST
Definition fwd.h:149
@ ROCPROFILER_CALLBACK_PHASE_LOAD
Callback invoked prior to code object loading.
Definition fwd.h:144
@ ROCPROFILER_BUFFER_TRACING_PAGE_MIGRATION
Buffer page migration info.
Definition fwd.h:201
@ ROCPROFILER_BUFFER_TRACING_MARKER_CORE_API
Definition fwd.h:196
@ ROCPROFILER_BUFFER_TRACING_RUNTIME_INITIALIZATION
Record indicating a runtime library has been initialized.
Definition fwd.h:208
@ ROCPROFILER_BUFFER_TRACING_MEMORY_ALLOCATION
Definition fwd.h:206
@ ROCPROFILER_BUFFER_TRACING_MARKER_NAME_API
Definition fwd.h:198
@ ROCPROFILER_BUFFER_TRACING_LAST
Definition fwd.h:212
@ ROCPROFILER_BUFFER_TRACING_CORRELATION_ID_RETIREMENT
Correlation ID is no longer in use.
Definition fwd.h:203
@ ROCPROFILER_BUFFER_TRACING_HSA_CORE_API
Definition fwd.h:189
@ ROCPROFILER_BUFFER_TRACING_MEMORY_COPY
Definition fwd.h:199
@ ROCPROFILER_BUFFER_TRACING_RCCL_API
RCCL tracing.
Definition fwd.h:204
@ ROCPROFILER_BUFFER_TRACING_ROCDECODE_API
rocDecode tracing
Definition fwd.h:211
@ ROCPROFILER_BUFFER_TRACING_SCRATCH_MEMORY
Buffer scratch memory reclamation info.
Definition fwd.h:202
@ ROCPROFILER_BUFFER_TRACING_KERNEL_DISPATCH
Buffer kernel dispatch info.
Definition fwd.h:200
@ ROCPROFILER_BUFFER_TRACING_HIP_RUNTIME_API
Definition fwd.h:194
@ ROCPROFILER_BUFFER_TRACING_MARKER_CONTROL_API
Definition fwd.h:197
@ ROCPROFILER_BUFFER_TRACING_OMPT
Definition fwd.h:205
@ ROCPROFILER_BUFFER_TRACING_NONE
Definition fwd.h:188
@ ROCPROFILER_BUFFER_TRACING_HSA_IMAGE_EXT_API
Definition fwd.h:191
@ ROCPROFILER_BUFFER_TRACING_HIP_COMPILER_API
Definition fwd.h:195
@ ROCPROFILER_BUFFER_TRACING_HSA_AMD_EXT_API
Definition fwd.h:190
@ ROCPROFILER_BUFFER_TRACING_HSA_FINALIZE_EXT_API
Definition fwd.h:192
@ ROCPROFILER_PC_SAMPLING_RECORD_LAST
Definition fwd.h:455
@ ROCPROFILER_PC_SAMPLING_RECORD_HOST_TRAP_V0_SAMPLE
rocprofiler_pc_sampling_record_host_trap_v0_t
Definition fwd.h:453
@ ROCPROFILER_PC_SAMPLING_RECORD_NONE
Definition fwd.h:452
@ ROCPROFILER_PC_SAMPLING_RECORD_STOCHASTIC_V0_SAMPLE
For future use.
Definition fwd.h:454
@ ROCPROFILER_KERNEL_DISPATCH_ENQUEUE
Definition fwd.h:259
@ ROCPROFILER_KERNEL_DISPATCH_COMPLETE
Definition fwd.h:260
@ ROCPROFILER_KERNEL_DISPATCH_NONE
Unknown kernel dispatch operation.
Definition fwd.h:258
@ ROCPROFILER_KERNEL_DISPATCH_LAST
Definition fwd.h:261
@ ROCPROFILER_RCCL_LIBRARY
Definition fwd.h:372
@ ROCPROFILER_ROCDECODE_LIBRARY
Definition fwd.h:373
@ ROCPROFILER_LIBRARY_LAST
Definition fwd.h:374
@ ROCPROFILER_HIP_LIBRARY
Definition fwd.h:370
@ ROCPROFILER_LIBRARY
Definition fwd.h:368
@ ROCPROFILER_HSA_LIBRARY
Definition fwd.h:369
@ ROCPROFILER_MARKER_LIBRARY
Definition fwd.h:371
@ ROCPROFILER_BUFFER_CATEGORY_TRACING
Definition fwd.h:120
@ ROCPROFILER_BUFFER_CATEGORY_NONE
Definition fwd.h:119
@ ROCPROFILER_BUFFER_CATEGORY_PC_SAMPLING
Definition fwd.h:121
@ ROCPROFILER_BUFFER_CATEGORY_LAST
Definition fwd.h:123
@ ROCPROFILER_BUFFER_CATEGORY_COUNTERS
Definition fwd.h:122
@ ROCPROFILER_CALLBACK_TRACING_CODE_OBJECT
Definition fwd.h:169
@ ROCPROFILER_CALLBACK_TRACING_ROCDECODE_API
rocDecode API Tracing
Definition fwd.h:179
@ ROCPROFILER_CALLBACK_TRACING_MEMORY_ALLOCATION
Definition fwd.h:175
@ ROCPROFILER_CALLBACK_TRACING_OMPT
Definition fwd.h:174
@ ROCPROFILER_CALLBACK_TRACING_MARKER_CONTROL_API
Definition fwd.h:166
@ ROCPROFILER_CALLBACK_TRACING_KERNEL_DISPATCH
Callbacks for kernel dispatches.
Definition fwd.h:171
@ ROCPROFILER_CALLBACK_TRACING_RCCL_API
RCCL tracing.
Definition fwd.h:173
@ ROCPROFILER_CALLBACK_TRACING_RUNTIME_INITIALIZATION
Callback notifying that a runtime library has been initialized.
Definition fwd.h:177
@ ROCPROFILER_CALLBACK_TRACING_HIP_COMPILER_API
Definition fwd.h:164
@ ROCPROFILER_CALLBACK_TRACING_HSA_AMD_EXT_API
Definition fwd.h:159
@ ROCPROFILER_CALLBACK_TRACING_MARKER_NAME_API
Definition fwd.h:168
@ ROCPROFILER_CALLBACK_TRACING_HSA_CORE_API
Definition fwd.h:158
@ ROCPROFILER_CALLBACK_TRACING_LAST
Definition fwd.h:180
@ ROCPROFILER_CALLBACK_TRACING_MEMORY_COPY
Definition fwd.h:172
@ ROCPROFILER_CALLBACK_TRACING_NONE
Definition fwd.h:157
@ ROCPROFILER_CALLBACK_TRACING_SCRATCH_MEMORY
Definition fwd.h:170
@ ROCPROFILER_CALLBACK_TRACING_HIP_RUNTIME_API
Definition fwd.h:163
@ ROCPROFILER_CALLBACK_TRACING_HSA_IMAGE_EXT_API
Definition fwd.h:160
@ ROCPROFILER_CALLBACK_TRACING_MARKER_CORE_API
Definition fwd.h:165
@ ROCPROFILER_CALLBACK_TRACING_HSA_FINALIZE_EXT_API
Definition fwd.h:161
@ ROCPROFILER_AGENT_TYPE_NONE
Agent type is unknown.
Definition fwd.h:131
@ ROCPROFILER_AGENT_TYPE_GPU
Agent type is a GPU.
Definition fwd.h:133
@ ROCPROFILER_AGENT_TYPE_LAST
Definition fwd.h:134
@ ROCPROFILER_AGENT_TYPE_CPU
Agent type is a CPU.
Definition fwd.h:132
@ ROCPROFILER_COUNTER_INFO_VERSION_0
Definition fwd.h:414
@ ROCPROFILER_COUNTER_INFO_VERSION_LAST
Definition fwd.h:415
@ ROCPROFILER_COUNTER_INFO_VERSION_NONE
Definition fwd.h:413
@ ROCPROFILER_COUNTER_FLAG_LAST
Definition fwd.h:443
@ ROCPROFILER_COUNTER_FLAG_NONE
Definition fwd.h:439
@ ROCPROFILER_COUNTER_FLAG_APPEND_DEFINITION
Append the counter definition to the system provided counter definition file.
Definition fwd.h:441
@ ROCPROFILER_COUNTER_FLAG_ASYNC
Do not wait for completion before returning.
Definition fwd.h:440
Agent Identifier.
Definition fwd.h:594
Context ID.
Definition fwd.h:555
ROCProfiler Record Correlation ID.
Definition fwd.h:571
Counter ID.
Definition fwd.h:602
Counter info struct version 0.
Definition fwd.h:758
Multi-dimensional struct of data used to describe GPU workgroup and grid sizes.
Definition fwd.h:619
ROCProfiler kernel dispatch information.
Definition fwd.h:706
Profile Configurations.
Definition fwd.h:611
ROCProfiler Profile Counting Counter Record per instance.
Definition fwd.h:736
Details for the dimension, including its size, for a counter record.
Definition fwd.h:723
Generic record with type identifier(s) and a pointer to data. This data type is used with buffered da...
Definition fwd.h:670
ROCProfiler SPM Record.
Definition fwd.h:773
Stores memory address for profiling.
Definition fwd.h:530
User-assignable data type.
Definition fwd.h:520
Stores UUID for devices.
Definition fwd.h:540