triton-windows 3.3.0.post19__cp311-cp311-win_amd64.whl → 3.3.1.post21__cp311-cp311-win_amd64.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of triton-windows might be problematic. Click here for more details.
- triton/_C/libtriton.pyd +0 -0
- triton/__init__.py +1 -1
- triton/backends/amd/driver.py +6 -1
- triton/backends/nvidia/compiler.py +1 -3
- triton/backends/nvidia/driver.py +7 -3
- triton/runtime/autotuner.py +2 -2
- triton/runtime/build.py +5 -5
- triton/runtime/tcc/lib/python310.def +1610 -0
- triton/runtime/tcc/lib/python311.def +1633 -0
- triton/runtime/tcc/lib/python312.def +1703 -0
- triton/runtime/tcc/lib/python313.def +1651 -0
- triton/runtime/tcc/lib/python313t.def +1656 -0
- triton/runtime/tcc/lib/python39.def +1644 -0
- triton/runtime/tcc/lib/python3t.def +905 -0
- triton/windows_utils.py +11 -4
- {triton_windows-3.3.0.post19.dist-info → triton_windows-3.3.1.post21.dist-info}/METADATA +1 -1
- {triton_windows-3.3.0.post19.dist-info → triton_windows-3.3.1.post21.dist-info}/RECORD +19 -109
- {triton_windows-3.3.0.post19.dist-info → triton_windows-3.3.1.post21.dist-info}/WHEEL +1 -1
- triton/backends/amd/include/hip/amd_detail/amd_channel_descriptor.h +0 -358
- triton/backends/amd/include/hip/amd_detail/amd_device_functions.h +0 -1010
- triton/backends/amd/include/hip/amd_detail/amd_hip_atomic.h +0 -1638
- triton/backends/amd/include/hip/amd_detail/amd_hip_bf16.h +0 -1814
- triton/backends/amd/include/hip/amd_detail/amd_hip_bfloat16.h +0 -293
- triton/backends/amd/include/hip/amd_detail/amd_hip_common.h +0 -32
- triton/backends/amd/include/hip/amd_detail/amd_hip_complex.h +0 -174
- triton/backends/amd/include/hip/amd_detail/amd_hip_cooperative_groups.h +0 -835
- triton/backends/amd/include/hip/amd_detail/amd_hip_fp16.h +0 -1809
- triton/backends/amd/include/hip/amd_detail/amd_hip_fp8.h +0 -1391
- triton/backends/amd/include/hip/amd_detail/amd_hip_gl_interop.h +0 -108
- triton/backends/amd/include/hip/amd_detail/amd_hip_math_constants.h +0 -124
- triton/backends/amd/include/hip/amd_detail/amd_hip_runtime.h +0 -405
- triton/backends/amd/include/hip/amd_detail/amd_hip_runtime_pt_api.h +0 -196
- triton/backends/amd/include/hip/amd_detail/amd_hip_unsafe_atomics.h +0 -565
- triton/backends/amd/include/hip/amd_detail/amd_hip_vector_types.h +0 -2226
- triton/backends/amd/include/hip/amd_detail/amd_math_functions.h +0 -104
- triton/backends/amd/include/hip/amd_detail/amd_surface_functions.h +0 -244
- triton/backends/amd/include/hip/amd_detail/amd_warp_functions.h +0 -538
- triton/backends/amd/include/hip/amd_detail/amd_warp_sync_functions.h +0 -288
- triton/backends/amd/include/hip/amd_detail/concepts.hpp +0 -30
- triton/backends/amd/include/hip/amd_detail/device_library_decls.h +0 -133
- triton/backends/amd/include/hip/amd_detail/functional_grid_launch.hpp +0 -218
- triton/backends/amd/include/hip/amd_detail/grid_launch.h +0 -67
- triton/backends/amd/include/hip/amd_detail/grid_launch.hpp +0 -50
- triton/backends/amd/include/hip/amd_detail/grid_launch_GGL.hpp +0 -26
- triton/backends/amd/include/hip/amd_detail/helpers.hpp +0 -137
- triton/backends/amd/include/hip/amd_detail/hip_api_trace.hpp +0 -1446
- triton/backends/amd/include/hip/amd_detail/hip_assert.h +0 -101
- triton/backends/amd/include/hip/amd_detail/hip_cooperative_groups_helper.h +0 -242
- triton/backends/amd/include/hip/amd_detail/hip_fp16_gcc.h +0 -254
- triton/backends/amd/include/hip/amd_detail/hip_fp16_math_fwd.h +0 -96
- triton/backends/amd/include/hip/amd_detail/hip_ldg.h +0 -100
- triton/backends/amd/include/hip/amd_detail/hip_prof_str.h +0 -10570
- triton/backends/amd/include/hip/amd_detail/hip_runtime_prof.h +0 -78
- triton/backends/amd/include/hip/amd_detail/host_defines.h +0 -184
- triton/backends/amd/include/hip/amd_detail/hsa_helpers.hpp +0 -102
- triton/backends/amd/include/hip/amd_detail/macro_based_grid_launch.hpp +0 -798
- triton/backends/amd/include/hip/amd_detail/math_fwd.h +0 -698
- triton/backends/amd/include/hip/amd_detail/ockl_image.h +0 -177
- triton/backends/amd/include/hip/amd_detail/program_state.hpp +0 -107
- triton/backends/amd/include/hip/amd_detail/texture_fetch_functions.h +0 -491
- triton/backends/amd/include/hip/amd_detail/texture_indirect_functions.h +0 -478
- triton/backends/amd/include/hip/channel_descriptor.h +0 -39
- triton/backends/amd/include/hip/device_functions.h +0 -38
- triton/backends/amd/include/hip/driver_types.h +0 -468
- triton/backends/amd/include/hip/hip_bf16.h +0 -36
- triton/backends/amd/include/hip/hip_bfloat16.h +0 -44
- triton/backends/amd/include/hip/hip_common.h +0 -100
- triton/backends/amd/include/hip/hip_complex.h +0 -38
- triton/backends/amd/include/hip/hip_cooperative_groups.h +0 -46
- triton/backends/amd/include/hip/hip_deprecated.h +0 -95
- triton/backends/amd/include/hip/hip_ext.h +0 -161
- triton/backends/amd/include/hip/hip_fp16.h +0 -36
- triton/backends/amd/include/hip/hip_fp8.h +0 -33
- triton/backends/amd/include/hip/hip_gl_interop.h +0 -32
- triton/backends/amd/include/hip/hip_hcc.h +0 -24
- triton/backends/amd/include/hip/hip_math_constants.h +0 -36
- triton/backends/amd/include/hip/hip_profile.h +0 -27
- triton/backends/amd/include/hip/hip_runtime.h +0 -75
- triton/backends/amd/include/hip/hip_runtime_api.h +0 -9261
- triton/backends/amd/include/hip/hip_texture_types.h +0 -29
- triton/backends/amd/include/hip/hip_vector_types.h +0 -41
- triton/backends/amd/include/hip/hip_version.h +0 -17
- triton/backends/amd/include/hip/hiprtc.h +0 -421
- triton/backends/amd/include/hip/library_types.h +0 -78
- triton/backends/amd/include/hip/math_functions.h +0 -42
- triton/backends/amd/include/hip/surface_types.h +0 -63
- triton/backends/amd/include/hip/texture_types.h +0 -194
- triton/backends/amd/include/hsa/Brig.h +0 -1131
- triton/backends/amd/include/hsa/amd_hsa_common.h +0 -91
- triton/backends/amd/include/hsa/amd_hsa_elf.h +0 -462
- triton/backends/amd/include/hsa/amd_hsa_kernel_code.h +0 -269
- triton/backends/amd/include/hsa/amd_hsa_queue.h +0 -109
- triton/backends/amd/include/hsa/amd_hsa_signal.h +0 -80
- triton/backends/amd/include/hsa/hsa.h +0 -5738
- triton/backends/amd/include/hsa/hsa_amd_tool.h +0 -91
- triton/backends/amd/include/hsa/hsa_api_trace.h +0 -579
- triton/backends/amd/include/hsa/hsa_api_trace_version.h +0 -68
- triton/backends/amd/include/hsa/hsa_ext_amd.h +0 -3146
- triton/backends/amd/include/hsa/hsa_ext_finalize.h +0 -531
- triton/backends/amd/include/hsa/hsa_ext_image.h +0 -1454
- triton/backends/amd/include/hsa/hsa_ven_amd_aqlprofile.h +0 -488
- triton/backends/amd/include/hsa/hsa_ven_amd_loader.h +0 -667
- triton/backends/amd/include/hsa/hsa_ven_amd_pc_sampling.h +0 -416
- triton/backends/amd/include/roctracer/ext/prof_protocol.h +0 -107
- triton/backends/amd/include/roctracer/hip_ostream_ops.h +0 -4515
- triton/backends/amd/include/roctracer/hsa_ostream_ops.h +0 -1727
- triton/backends/amd/include/roctracer/hsa_prof_str.h +0 -3059
- triton/backends/amd/include/roctracer/roctracer.h +0 -779
- triton/backends/amd/include/roctracer/roctracer_ext.h +0 -81
- triton/backends/amd/include/roctracer/roctracer_hcc.h +0 -24
- triton/backends/amd/include/roctracer/roctracer_hip.h +0 -37
- triton/backends/amd/include/roctracer/roctracer_hsa.h +0 -112
- triton/backends/amd/include/roctracer/roctracer_plugin.h +0 -137
- triton/backends/amd/include/roctracer/roctracer_roctx.h +0 -67
- triton/backends/amd/include/roctracer/roctx.h +0 -229
- {triton_windows-3.3.0.post19.dist-info → triton_windows-3.3.1.post21.dist-info}/top_level.txt +0 -0
|
@@ -1,269 +0,0 @@
|
|
|
1
|
-
////////////////////////////////////////////////////////////////////////////////
|
|
2
|
-
//
|
|
3
|
-
// The University of Illinois/NCSA
|
|
4
|
-
// Open Source License (NCSA)
|
|
5
|
-
//
|
|
6
|
-
// Copyright (c) 2014-2020, Advanced Micro Devices, Inc. All rights reserved.
|
|
7
|
-
//
|
|
8
|
-
// Developed by:
|
|
9
|
-
//
|
|
10
|
-
// AMD Research and AMD HSA Software Development
|
|
11
|
-
//
|
|
12
|
-
// Advanced Micro Devices, Inc.
|
|
13
|
-
//
|
|
14
|
-
// www.amd.com
|
|
15
|
-
//
|
|
16
|
-
// Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
17
|
-
// of this software and associated documentation files (the "Software"), to
|
|
18
|
-
// deal with the Software without restriction, including without limitation
|
|
19
|
-
// the rights to use, copy, modify, merge, publish, distribute, sublicense,
|
|
20
|
-
// and/or sell copies of the Software, and to permit persons to whom the
|
|
21
|
-
// Software is furnished to do so, subject to the following conditions:
|
|
22
|
-
//
|
|
23
|
-
// - Redistributions of source code must retain the above copyright notice,
|
|
24
|
-
// this list of conditions and the following disclaimers.
|
|
25
|
-
// - Redistributions in binary form must reproduce the above copyright
|
|
26
|
-
// notice, this list of conditions and the following disclaimers in
|
|
27
|
-
// the documentation and/or other materials provided with the distribution.
|
|
28
|
-
// - Neither the names of Advanced Micro Devices, Inc,
|
|
29
|
-
// nor the names of its contributors may be used to endorse or promote
|
|
30
|
-
// products derived from this Software without specific prior written
|
|
31
|
-
// permission.
|
|
32
|
-
//
|
|
33
|
-
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
34
|
-
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
35
|
-
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
|
|
36
|
-
// THE CONTRIBUTORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
|
|
37
|
-
// OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
|
|
38
|
-
// ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
|
|
39
|
-
// DEALINGS WITH THE SOFTWARE.
|
|
40
|
-
//
|
|
41
|
-
////////////////////////////////////////////////////////////////////////////////
|
|
42
|
-
|
|
43
|
-
#ifndef AMD_HSA_KERNEL_CODE_H
|
|
44
|
-
#define AMD_HSA_KERNEL_CODE_H
|
|
45
|
-
|
|
46
|
-
#include "amd_hsa_common.h"
|
|
47
|
-
#include "hsa.h"
|
|
48
|
-
|
|
49
|
-
// AMD Kernel Code Version Enumeration Values.
|
|
50
|
-
typedef uint32_t amd_kernel_code_version32_t;
|
|
51
|
-
enum amd_kernel_code_version_t {
|
|
52
|
-
AMD_KERNEL_CODE_VERSION_MAJOR = 1,
|
|
53
|
-
AMD_KERNEL_CODE_VERSION_MINOR = 1
|
|
54
|
-
};
|
|
55
|
-
|
|
56
|
-
// AMD Machine Kind Enumeration Values.
|
|
57
|
-
typedef uint16_t amd_machine_kind16_t;
|
|
58
|
-
enum amd_machine_kind_t {
|
|
59
|
-
AMD_MACHINE_KIND_UNDEFINED = 0,
|
|
60
|
-
AMD_MACHINE_KIND_AMDGPU = 1
|
|
61
|
-
};
|
|
62
|
-
|
|
63
|
-
// AMD Machine Version.
|
|
64
|
-
typedef uint16_t amd_machine_version16_t;
|
|
65
|
-
|
|
66
|
-
// AMD Float Round Mode Enumeration Values.
|
|
67
|
-
enum amd_float_round_mode_t {
|
|
68
|
-
AMD_FLOAT_ROUND_MODE_NEAREST_EVEN = 0,
|
|
69
|
-
AMD_FLOAT_ROUND_MODE_PLUS_INFINITY = 1,
|
|
70
|
-
AMD_FLOAT_ROUND_MODE_MINUS_INFINITY = 2,
|
|
71
|
-
AMD_FLOAT_ROUND_MODE_ZERO = 3
|
|
72
|
-
};
|
|
73
|
-
|
|
74
|
-
// AMD Float Denorm Mode Enumeration Values.
|
|
75
|
-
enum amd_float_denorm_mode_t {
|
|
76
|
-
AMD_FLOAT_DENORM_MODE_FLUSH_SOURCE_OUTPUT = 0,
|
|
77
|
-
AMD_FLOAT_DENORM_MODE_FLUSH_OUTPUT = 1,
|
|
78
|
-
AMD_FLOAT_DENORM_MODE_FLUSH_SOURCE = 2,
|
|
79
|
-
AMD_FLOAT_DENORM_MODE_NO_FLUSH = 3
|
|
80
|
-
};
|
|
81
|
-
|
|
82
|
-
// AMD Compute Program Resource Register One.
|
|
83
|
-
typedef uint32_t amd_compute_pgm_rsrc_one32_t;
|
|
84
|
-
enum amd_compute_pgm_rsrc_one_t {
|
|
85
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_COMPUTE_PGM_RSRC_ONE_GRANULATED_WORKITEM_VGPR_COUNT, 0, 6),
|
|
86
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_COMPUTE_PGM_RSRC_ONE_GRANULATED_WAVEFRONT_SGPR_COUNT, 6, 4),
|
|
87
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_COMPUTE_PGM_RSRC_ONE_PRIORITY, 10, 2),
|
|
88
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_COMPUTE_PGM_RSRC_ONE_FLOAT_ROUND_MODE_32, 12, 2),
|
|
89
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_COMPUTE_PGM_RSRC_ONE_FLOAT_ROUND_MODE_16_64, 14, 2),
|
|
90
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_COMPUTE_PGM_RSRC_ONE_FLOAT_DENORM_MODE_32, 16, 2),
|
|
91
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_COMPUTE_PGM_RSRC_ONE_FLOAT_DENORM_MODE_16_64, 18, 2),
|
|
92
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_COMPUTE_PGM_RSRC_ONE_PRIV, 20, 1),
|
|
93
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_COMPUTE_PGM_RSRC_ONE_ENABLE_DX10_CLAMP, 21, 1),
|
|
94
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_COMPUTE_PGM_RSRC_ONE_DEBUG_MODE, 22, 1),
|
|
95
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_COMPUTE_PGM_RSRC_ONE_ENABLE_IEEE_MODE, 23, 1),
|
|
96
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_COMPUTE_PGM_RSRC_ONE_BULKY, 24, 1),
|
|
97
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_COMPUTE_PGM_RSRC_ONE_CDBG_USER, 25, 1),
|
|
98
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_COMPUTE_PGM_RSRC_ONE_RESERVED1, 26, 6)
|
|
99
|
-
};
|
|
100
|
-
|
|
101
|
-
// AMD System VGPR Workitem ID Enumeration Values.
|
|
102
|
-
enum amd_system_vgpr_workitem_id_t {
|
|
103
|
-
AMD_SYSTEM_VGPR_WORKITEM_ID_X = 0,
|
|
104
|
-
AMD_SYSTEM_VGPR_WORKITEM_ID_X_Y = 1,
|
|
105
|
-
AMD_SYSTEM_VGPR_WORKITEM_ID_X_Y_Z = 2,
|
|
106
|
-
AMD_SYSTEM_VGPR_WORKITEM_ID_UNDEFINED = 3
|
|
107
|
-
};
|
|
108
|
-
|
|
109
|
-
// AMD Compute Program Resource Register Two.
|
|
110
|
-
typedef uint32_t amd_compute_pgm_rsrc_two32_t;
|
|
111
|
-
enum amd_compute_pgm_rsrc_two_t {
|
|
112
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_COMPUTE_PGM_RSRC_TWO_ENABLE_SGPR_PRIVATE_SEGMENT_WAVE_BYTE_OFFSET, 0, 1),
|
|
113
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_COMPUTE_PGM_RSRC_TWO_USER_SGPR_COUNT, 1, 5),
|
|
114
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_COMPUTE_PGM_RSRC_TWO_ENABLE_TRAP_HANDLER, 6, 1),
|
|
115
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_COMPUTE_PGM_RSRC_TWO_ENABLE_SGPR_WORKGROUP_ID_X, 7, 1),
|
|
116
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_COMPUTE_PGM_RSRC_TWO_ENABLE_SGPR_WORKGROUP_ID_Y, 8, 1),
|
|
117
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_COMPUTE_PGM_RSRC_TWO_ENABLE_SGPR_WORKGROUP_ID_Z, 9, 1),
|
|
118
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_COMPUTE_PGM_RSRC_TWO_ENABLE_SGPR_WORKGROUP_INFO, 10, 1),
|
|
119
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_COMPUTE_PGM_RSRC_TWO_ENABLE_VGPR_WORKITEM_ID, 11, 2),
|
|
120
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_COMPUTE_PGM_RSRC_TWO_ENABLE_EXCEPTION_ADDRESS_WATCH, 13, 1),
|
|
121
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_COMPUTE_PGM_RSRC_TWO_ENABLE_EXCEPTION_MEMORY_VIOLATION, 14, 1),
|
|
122
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_COMPUTE_PGM_RSRC_TWO_GRANULATED_LDS_SIZE, 15, 9),
|
|
123
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_COMPUTE_PGM_RSRC_TWO_ENABLE_EXCEPTION_IEEE_754_FP_INVALID_OPERATION, 24, 1),
|
|
124
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_COMPUTE_PGM_RSRC_TWO_ENABLE_EXCEPTION_FP_DENORMAL_SOURCE, 25, 1),
|
|
125
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_COMPUTE_PGM_RSRC_TWO_ENABLE_EXCEPTION_IEEE_754_FP_DIVISION_BY_ZERO, 26, 1),
|
|
126
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_COMPUTE_PGM_RSRC_TWO_ENABLE_EXCEPTION_IEEE_754_FP_OVERFLOW, 27, 1),
|
|
127
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_COMPUTE_PGM_RSRC_TWO_ENABLE_EXCEPTION_IEEE_754_FP_UNDERFLOW, 28, 1),
|
|
128
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_COMPUTE_PGM_RSRC_TWO_ENABLE_EXCEPTION_IEEE_754_FP_INEXACT, 29, 1),
|
|
129
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_COMPUTE_PGM_RSRC_TWO_ENABLE_EXCEPTION_INT_DIVISION_BY_ZERO, 30, 1),
|
|
130
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_COMPUTE_PGM_RSRC_TWO_RESERVED1, 31, 1)
|
|
131
|
-
};
|
|
132
|
-
|
|
133
|
-
// AMD Element Byte Size Enumeration Values.
|
|
134
|
-
enum amd_element_byte_size_t {
|
|
135
|
-
AMD_ELEMENT_BYTE_SIZE_2 = 0,
|
|
136
|
-
AMD_ELEMENT_BYTE_SIZE_4 = 1,
|
|
137
|
-
AMD_ELEMENT_BYTE_SIZE_8 = 2,
|
|
138
|
-
AMD_ELEMENT_BYTE_SIZE_16 = 3
|
|
139
|
-
};
|
|
140
|
-
|
|
141
|
-
// AMD Kernel Code Properties.
|
|
142
|
-
typedef uint32_t amd_kernel_code_properties32_t;
|
|
143
|
-
enum amd_kernel_code_properties_t {
|
|
144
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_KERNEL_CODE_PROPERTIES_ENABLE_SGPR_PRIVATE_SEGMENT_BUFFER, 0, 1),
|
|
145
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_KERNEL_CODE_PROPERTIES_ENABLE_SGPR_DISPATCH_PTR, 1, 1),
|
|
146
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_KERNEL_CODE_PROPERTIES_ENABLE_SGPR_QUEUE_PTR, 2, 1),
|
|
147
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_KERNEL_CODE_PROPERTIES_ENABLE_SGPR_KERNARG_SEGMENT_PTR, 3, 1),
|
|
148
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_KERNEL_CODE_PROPERTIES_ENABLE_SGPR_DISPATCH_ID, 4, 1),
|
|
149
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_KERNEL_CODE_PROPERTIES_ENABLE_SGPR_FLAT_SCRATCH_INIT, 5, 1),
|
|
150
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_KERNEL_CODE_PROPERTIES_ENABLE_SGPR_PRIVATE_SEGMENT_SIZE, 6, 1),
|
|
151
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_KERNEL_CODE_PROPERTIES_ENABLE_SGPR_GRID_WORKGROUP_COUNT_X, 7, 1),
|
|
152
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_KERNEL_CODE_PROPERTIES_ENABLE_SGPR_GRID_WORKGROUP_COUNT_Y, 8, 1),
|
|
153
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_KERNEL_CODE_PROPERTIES_ENABLE_SGPR_GRID_WORKGROUP_COUNT_Z, 9, 1),
|
|
154
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_KERNEL_CODE_PROPERTIES_RESERVED1, 10, 6),
|
|
155
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_KERNEL_CODE_PROPERTIES_ENABLE_ORDERED_APPEND_GDS, 16, 1),
|
|
156
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_KERNEL_CODE_PROPERTIES_PRIVATE_ELEMENT_SIZE, 17, 2),
|
|
157
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_KERNEL_CODE_PROPERTIES_IS_PTR64, 19, 1),
|
|
158
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_KERNEL_CODE_PROPERTIES_IS_DYNAMIC_CALLSTACK, 20, 1),
|
|
159
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_KERNEL_CODE_PROPERTIES_IS_DEBUG_ENABLED, 21, 1),
|
|
160
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_KERNEL_CODE_PROPERTIES_IS_XNACK_ENABLED, 22, 1),
|
|
161
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_KERNEL_CODE_PROPERTIES_RESERVED2, 23, 9)
|
|
162
|
-
};
|
|
163
|
-
|
|
164
|
-
// AMD Power Of Two Enumeration Values.
|
|
165
|
-
typedef uint8_t amd_powertwo8_t;
|
|
166
|
-
enum amd_powertwo_t {
|
|
167
|
-
AMD_POWERTWO_1 = 0,
|
|
168
|
-
AMD_POWERTWO_2 = 1,
|
|
169
|
-
AMD_POWERTWO_4 = 2,
|
|
170
|
-
AMD_POWERTWO_8 = 3,
|
|
171
|
-
AMD_POWERTWO_16 = 4,
|
|
172
|
-
AMD_POWERTWO_32 = 5,
|
|
173
|
-
AMD_POWERTWO_64 = 6,
|
|
174
|
-
AMD_POWERTWO_128 = 7,
|
|
175
|
-
AMD_POWERTWO_256 = 8
|
|
176
|
-
};
|
|
177
|
-
|
|
178
|
-
// AMD Enabled Control Directive Enumeration Values.
|
|
179
|
-
typedef uint64_t amd_enabled_control_directive64_t;
|
|
180
|
-
enum amd_enabled_control_directive_t {
|
|
181
|
-
AMD_ENABLED_CONTROL_DIRECTIVE_ENABLE_BREAK_EXCEPTIONS = 1,
|
|
182
|
-
AMD_ENABLED_CONTROL_DIRECTIVE_ENABLE_DETECT_EXCEPTIONS = 2,
|
|
183
|
-
AMD_ENABLED_CONTROL_DIRECTIVE_MAX_DYNAMIC_GROUP_SIZE = 4,
|
|
184
|
-
AMD_ENABLED_CONTROL_DIRECTIVE_MAX_FLAT_GRID_SIZE = 8,
|
|
185
|
-
AMD_ENABLED_CONTROL_DIRECTIVE_MAX_FLAT_WORKGROUP_SIZE = 16,
|
|
186
|
-
AMD_ENABLED_CONTROL_DIRECTIVE_REQUIRED_DIM = 32,
|
|
187
|
-
AMD_ENABLED_CONTROL_DIRECTIVE_REQUIRED_GRID_SIZE = 64,
|
|
188
|
-
AMD_ENABLED_CONTROL_DIRECTIVE_REQUIRED_WORKGROUP_SIZE = 128,
|
|
189
|
-
AMD_ENABLED_CONTROL_DIRECTIVE_REQUIRE_NO_PARTIAL_WORKGROUPS = 256
|
|
190
|
-
};
|
|
191
|
-
|
|
192
|
-
// AMD Exception Kind Enumeration Values.
|
|
193
|
-
typedef uint16_t amd_exception_kind16_t;
|
|
194
|
-
enum amd_exception_kind_t {
|
|
195
|
-
AMD_EXCEPTION_KIND_INVALID_OPERATION = 1,
|
|
196
|
-
AMD_EXCEPTION_KIND_DIVISION_BY_ZERO = 2,
|
|
197
|
-
AMD_EXCEPTION_KIND_OVERFLOW = 4,
|
|
198
|
-
AMD_EXCEPTION_KIND_UNDERFLOW = 8,
|
|
199
|
-
AMD_EXCEPTION_KIND_INEXACT = 16
|
|
200
|
-
};
|
|
201
|
-
|
|
202
|
-
// AMD Control Directives.
|
|
203
|
-
#define AMD_CONTROL_DIRECTIVES_ALIGN_BYTES 64
|
|
204
|
-
#define AMD_CONTROL_DIRECTIVES_ALIGN __ALIGNED__(AMD_CONTROL_DIRECTIVES_ALIGN_BYTES)
|
|
205
|
-
typedef AMD_CONTROL_DIRECTIVES_ALIGN struct amd_control_directives_s {
|
|
206
|
-
amd_enabled_control_directive64_t enabled_control_directives;
|
|
207
|
-
uint16_t enable_break_exceptions;
|
|
208
|
-
uint16_t enable_detect_exceptions;
|
|
209
|
-
uint32_t max_dynamic_group_size;
|
|
210
|
-
uint64_t max_flat_grid_size;
|
|
211
|
-
uint32_t max_flat_workgroup_size;
|
|
212
|
-
uint8_t required_dim;
|
|
213
|
-
uint8_t reserved1[3];
|
|
214
|
-
uint64_t required_grid_size[3];
|
|
215
|
-
uint32_t required_workgroup_size[3];
|
|
216
|
-
uint8_t reserved2[60];
|
|
217
|
-
} amd_control_directives_t;
|
|
218
|
-
|
|
219
|
-
// AMD Kernel Code.
|
|
220
|
-
#define AMD_ISA_ALIGN_BYTES 256
|
|
221
|
-
#define AMD_KERNEL_CODE_ALIGN_BYTES 64
|
|
222
|
-
#define AMD_KERNEL_CODE_ALIGN __ALIGNED__(AMD_KERNEL_CODE_ALIGN_BYTES)
|
|
223
|
-
typedef AMD_KERNEL_CODE_ALIGN struct amd_kernel_code_s {
|
|
224
|
-
amd_kernel_code_version32_t amd_kernel_code_version_major;
|
|
225
|
-
amd_kernel_code_version32_t amd_kernel_code_version_minor;
|
|
226
|
-
amd_machine_kind16_t amd_machine_kind;
|
|
227
|
-
amd_machine_version16_t amd_machine_version_major;
|
|
228
|
-
amd_machine_version16_t amd_machine_version_minor;
|
|
229
|
-
amd_machine_version16_t amd_machine_version_stepping;
|
|
230
|
-
int64_t kernel_code_entry_byte_offset;
|
|
231
|
-
int64_t kernel_code_prefetch_byte_offset;
|
|
232
|
-
uint64_t kernel_code_prefetch_byte_size;
|
|
233
|
-
uint64_t max_scratch_backing_memory_byte_size;
|
|
234
|
-
amd_compute_pgm_rsrc_one32_t compute_pgm_rsrc1;
|
|
235
|
-
amd_compute_pgm_rsrc_two32_t compute_pgm_rsrc2;
|
|
236
|
-
amd_kernel_code_properties32_t kernel_code_properties;
|
|
237
|
-
uint32_t workitem_private_segment_byte_size;
|
|
238
|
-
uint32_t workgroup_group_segment_byte_size;
|
|
239
|
-
uint32_t gds_segment_byte_size;
|
|
240
|
-
uint64_t kernarg_segment_byte_size;
|
|
241
|
-
uint32_t workgroup_fbarrier_count;
|
|
242
|
-
uint16_t wavefront_sgpr_count;
|
|
243
|
-
uint16_t workitem_vgpr_count;
|
|
244
|
-
uint16_t reserved_vgpr_first;
|
|
245
|
-
uint16_t reserved_vgpr_count;
|
|
246
|
-
uint16_t reserved_sgpr_first;
|
|
247
|
-
uint16_t reserved_sgpr_count;
|
|
248
|
-
uint16_t debug_wavefront_private_segment_offset_sgpr;
|
|
249
|
-
uint16_t debug_private_segment_buffer_sgpr;
|
|
250
|
-
amd_powertwo8_t kernarg_segment_alignment;
|
|
251
|
-
amd_powertwo8_t group_segment_alignment;
|
|
252
|
-
amd_powertwo8_t private_segment_alignment;
|
|
253
|
-
amd_powertwo8_t wavefront_size;
|
|
254
|
-
int32_t call_convention;
|
|
255
|
-
uint8_t reserved1[12];
|
|
256
|
-
uint64_t runtime_loader_kernel_symbol;
|
|
257
|
-
amd_control_directives_t control_directives;
|
|
258
|
-
} amd_kernel_code_t;
|
|
259
|
-
|
|
260
|
-
// TODO: this struct should be completely gone once debugger designs/implements
|
|
261
|
-
// Debugger APIs.
|
|
262
|
-
typedef struct amd_runtime_loader_debug_info_s {
|
|
263
|
-
const void* elf_raw;
|
|
264
|
-
size_t elf_size;
|
|
265
|
-
const char *kernel_name;
|
|
266
|
-
const void *owning_segment;
|
|
267
|
-
} amd_runtime_loader_debug_info_t;
|
|
268
|
-
|
|
269
|
-
#endif // AMD_HSA_KERNEL_CODE_H
|
|
@@ -1,109 +0,0 @@
|
|
|
1
|
-
////////////////////////////////////////////////////////////////////////////////
|
|
2
|
-
//
|
|
3
|
-
// The University of Illinois/NCSA
|
|
4
|
-
// Open Source License (NCSA)
|
|
5
|
-
//
|
|
6
|
-
// Copyright (c) 2014-2020, Advanced Micro Devices, Inc. All rights reserved.
|
|
7
|
-
//
|
|
8
|
-
// Developed by:
|
|
9
|
-
//
|
|
10
|
-
// AMD Research and AMD HSA Software Development
|
|
11
|
-
//
|
|
12
|
-
// Advanced Micro Devices, Inc.
|
|
13
|
-
//
|
|
14
|
-
// www.amd.com
|
|
15
|
-
//
|
|
16
|
-
// Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
17
|
-
// of this software and associated documentation files (the "Software"), to
|
|
18
|
-
// deal with the Software without restriction, including without limitation
|
|
19
|
-
// the rights to use, copy, modify, merge, publish, distribute, sublicense,
|
|
20
|
-
// and/or sell copies of the Software, and to permit persons to whom the
|
|
21
|
-
// Software is furnished to do so, subject to the following conditions:
|
|
22
|
-
//
|
|
23
|
-
// - Redistributions of source code must retain the above copyright notice,
|
|
24
|
-
// this list of conditions and the following disclaimers.
|
|
25
|
-
// - Redistributions in binary form must reproduce the above copyright
|
|
26
|
-
// notice, this list of conditions and the following disclaimers in
|
|
27
|
-
// the documentation and/or other materials provided with the distribution.
|
|
28
|
-
// - Neither the names of Advanced Micro Devices, Inc,
|
|
29
|
-
// nor the names of its contributors may be used to endorse or promote
|
|
30
|
-
// products derived from this Software without specific prior written
|
|
31
|
-
// permission.
|
|
32
|
-
//
|
|
33
|
-
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
34
|
-
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
35
|
-
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
|
|
36
|
-
// THE CONTRIBUTORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
|
|
37
|
-
// OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
|
|
38
|
-
// ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
|
|
39
|
-
// DEALINGS WITH THE SOFTWARE.
|
|
40
|
-
//
|
|
41
|
-
////////////////////////////////////////////////////////////////////////////////
|
|
42
|
-
|
|
43
|
-
#ifndef AMD_HSA_QUEUE_H
|
|
44
|
-
#define AMD_HSA_QUEUE_H
|
|
45
|
-
|
|
46
|
-
#include "amd_hsa_common.h"
|
|
47
|
-
#include "hsa.h"
|
|
48
|
-
|
|
49
|
-
// AMD Queue Properties.
|
|
50
|
-
typedef uint32_t amd_queue_properties32_t;
|
|
51
|
-
enum amd_queue_properties_t {
|
|
52
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_QUEUE_PROPERTIES_ENABLE_TRAP_HANDLER, 0, 1),
|
|
53
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_QUEUE_PROPERTIES_IS_PTR64, 1, 1),
|
|
54
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_QUEUE_PROPERTIES_ENABLE_TRAP_HANDLER_DEBUG_SGPRS, 2, 1),
|
|
55
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_QUEUE_PROPERTIES_ENABLE_PROFILING, 3, 1),
|
|
56
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_QUEUE_PROPERTIES_USE_SCRATCH_ONCE, 4, 1),
|
|
57
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_QUEUE_PROPERTIES_RESERVED1, 5, 27)
|
|
58
|
-
};
|
|
59
|
-
|
|
60
|
-
// AMD Queue.
|
|
61
|
-
#define AMD_QUEUE_ALIGN_BYTES 64
|
|
62
|
-
#define AMD_QUEUE_ALIGN __ALIGNED__(AMD_QUEUE_ALIGN_BYTES)
|
|
63
|
-
|
|
64
|
-
// AMD Queue Capabilities.
|
|
65
|
-
typedef uint32_t amd_queue_capabilities32_t;
|
|
66
|
-
enum amd_queue_capabilities_t {
|
|
67
|
-
/* Whether this CP queue supports dual-scratch and async-reclaim */
|
|
68
|
-
AMD_HSA_BITS_CREATE_ENUM_ENTRIES(AMD_QUEUE_CAPS_ASYNC_RECLAIM, 0, 1),
|
|
69
|
-
};
|
|
70
|
-
|
|
71
|
-
// Members tagged with "async-reclaim" are ignored by CP FW's that do not support
|
|
72
|
-
// AMD_QUEUE_CAPS_ASYNC_RECLAIM. CP FW's that support async-reclaim also support
|
|
73
|
-
// dual-scratch (alternate scratch).
|
|
74
|
-
|
|
75
|
-
typedef struct AMD_QUEUE_ALIGN amd_queue_s {
|
|
76
|
-
hsa_queue_t hsa_queue;
|
|
77
|
-
uint32_t caps;
|
|
78
|
-
uint32_t reserved1[3];
|
|
79
|
-
volatile uint64_t write_dispatch_id;
|
|
80
|
-
uint32_t group_segment_aperture_base_hi;
|
|
81
|
-
uint32_t private_segment_aperture_base_hi;
|
|
82
|
-
uint32_t max_cu_id;
|
|
83
|
-
uint32_t max_wave_id;
|
|
84
|
-
volatile uint64_t max_legacy_doorbell_dispatch_id_plus_1;
|
|
85
|
-
volatile uint32_t legacy_doorbell_lock;
|
|
86
|
-
uint32_t reserved2[9];
|
|
87
|
-
volatile uint64_t read_dispatch_id;
|
|
88
|
-
uint32_t read_dispatch_id_field_base_byte_offset;
|
|
89
|
-
uint32_t compute_tmpring_size;
|
|
90
|
-
uint32_t scratch_resource_descriptor[4];
|
|
91
|
-
uint64_t scratch_backing_memory_location;
|
|
92
|
-
uint64_t scratch_backing_memory_byte_size;
|
|
93
|
-
uint32_t scratch_wave64_lane_byte_size;
|
|
94
|
-
amd_queue_properties32_t queue_properties;
|
|
95
|
-
volatile uint64_t scratch_last_used_index; /* async-reclaim */
|
|
96
|
-
hsa_signal_t queue_inactive_signal;
|
|
97
|
-
uint32_t reserved4[2];
|
|
98
|
-
volatile uint64_t alt_scratch_last_used_index; /* async-reclaim */
|
|
99
|
-
uint64_t alt_scratch_backing_memory_location; /* async-reclaim */
|
|
100
|
-
uint64_t alt_scratch_backing_memory_byte_size; /* async-reclaim */
|
|
101
|
-
uint32_t alt_scratch_dispatch_limit_x; /* async-reclaim */
|
|
102
|
-
uint32_t alt_scratch_dispatch_limit_y; /* async-reclaim */
|
|
103
|
-
uint32_t alt_scratch_dispatch_limit_z; /* async-reclaim */
|
|
104
|
-
uint32_t alt_scratch_wave64_lane_byte_size; /* async-reclaim */
|
|
105
|
-
uint32_t alt_compute_tmpring_size; /* async-reclaim */
|
|
106
|
-
uint32_t reserved5;
|
|
107
|
-
} amd_queue_t;
|
|
108
|
-
|
|
109
|
-
#endif // AMD_HSA_QUEUE_H
|
|
@@ -1,80 +0,0 @@
|
|
|
1
|
-
////////////////////////////////////////////////////////////////////////////////
|
|
2
|
-
//
|
|
3
|
-
// The University of Illinois/NCSA
|
|
4
|
-
// Open Source License (NCSA)
|
|
5
|
-
//
|
|
6
|
-
// Copyright (c) 2014-2020, Advanced Micro Devices, Inc. All rights reserved.
|
|
7
|
-
//
|
|
8
|
-
// Developed by:
|
|
9
|
-
//
|
|
10
|
-
// AMD Research and AMD HSA Software Development
|
|
11
|
-
//
|
|
12
|
-
// Advanced Micro Devices, Inc.
|
|
13
|
-
//
|
|
14
|
-
// www.amd.com
|
|
15
|
-
//
|
|
16
|
-
// Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
17
|
-
// of this software and associated documentation files (the "Software"), to
|
|
18
|
-
// deal with the Software without restriction, including without limitation
|
|
19
|
-
// the rights to use, copy, modify, merge, publish, distribute, sublicense,
|
|
20
|
-
// and/or sell copies of the Software, and to permit persons to whom the
|
|
21
|
-
// Software is furnished to do so, subject to the following conditions:
|
|
22
|
-
//
|
|
23
|
-
// - Redistributions of source code must retain the above copyright notice,
|
|
24
|
-
// this list of conditions and the following disclaimers.
|
|
25
|
-
// - Redistributions in binary form must reproduce the above copyright
|
|
26
|
-
// notice, this list of conditions and the following disclaimers in
|
|
27
|
-
// the documentation and/or other materials provided with the distribution.
|
|
28
|
-
// - Neither the names of Advanced Micro Devices, Inc,
|
|
29
|
-
// nor the names of its contributors may be used to endorse or promote
|
|
30
|
-
// products derived from this Software without specific prior written
|
|
31
|
-
// permission.
|
|
32
|
-
//
|
|
33
|
-
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
34
|
-
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
35
|
-
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
|
|
36
|
-
// THE CONTRIBUTORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
|
|
37
|
-
// OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
|
|
38
|
-
// ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
|
|
39
|
-
// DEALINGS WITH THE SOFTWARE.
|
|
40
|
-
//
|
|
41
|
-
////////////////////////////////////////////////////////////////////////////////
|
|
42
|
-
|
|
43
|
-
#ifndef AMD_HSA_SIGNAL_H
|
|
44
|
-
#define AMD_HSA_SIGNAL_H
|
|
45
|
-
|
|
46
|
-
#include "amd_hsa_common.h"
|
|
47
|
-
#include "amd_hsa_queue.h"
|
|
48
|
-
|
|
49
|
-
// AMD Signal Kind Enumeration Values.
|
|
50
|
-
typedef int64_t amd_signal_kind64_t;
|
|
51
|
-
enum amd_signal_kind_t {
|
|
52
|
-
AMD_SIGNAL_KIND_INVALID = 0,
|
|
53
|
-
AMD_SIGNAL_KIND_USER = 1,
|
|
54
|
-
AMD_SIGNAL_KIND_DOORBELL = -1,
|
|
55
|
-
AMD_SIGNAL_KIND_LEGACY_DOORBELL = -2
|
|
56
|
-
};
|
|
57
|
-
|
|
58
|
-
// AMD Signal.
|
|
59
|
-
#define AMD_SIGNAL_ALIGN_BYTES 64
|
|
60
|
-
#define AMD_SIGNAL_ALIGN __ALIGNED__(AMD_SIGNAL_ALIGN_BYTES)
|
|
61
|
-
typedef struct AMD_SIGNAL_ALIGN amd_signal_s {
|
|
62
|
-
amd_signal_kind64_t kind;
|
|
63
|
-
union {
|
|
64
|
-
volatile int64_t value;
|
|
65
|
-
volatile uint32_t* legacy_hardware_doorbell_ptr;
|
|
66
|
-
volatile uint64_t* hardware_doorbell_ptr;
|
|
67
|
-
};
|
|
68
|
-
uint64_t event_mailbox_ptr;
|
|
69
|
-
uint32_t event_id;
|
|
70
|
-
uint32_t reserved1;
|
|
71
|
-
uint64_t start_ts;
|
|
72
|
-
uint64_t end_ts;
|
|
73
|
-
union {
|
|
74
|
-
amd_queue_t* queue_ptr;
|
|
75
|
-
uint64_t reserved2;
|
|
76
|
-
};
|
|
77
|
-
uint32_t reserved3[2];
|
|
78
|
-
} amd_signal_t;
|
|
79
|
-
|
|
80
|
-
#endif // AMD_HSA_SIGNAL_H
|