/Users/buildslave/jenkins/sharedspace/clang-stage2-coverage-R@2/llvm/lib/Target/AMDGPU/Utils/AMDKernelCodeTInfo.h
Line | Count | Source |
1 | 195k | //===--------------------- AMDKernelCodeTInfo.h ---------------------------===// |
2 | 195k | // |
3 | 195k | // The LLVM Compiler Infrastructure |
4 | 195k | // |
5 | 195k | // This file is distributed under the University of Illinois Open Source |
6 | 195k | // License. See LICENSE.TXT for details. |
7 | 195k | // |
8 | 195k | //===----------------------------------------------------------------------===// |
9 | 195k | // |
10 | 195k | //===----------------------------------------------------------------------===// |
11 | 195k | // |
12 | 195k | /// \file - specifies tables for amd_kernel_code_t structure parsing/printing |
13 | 195k | // |
14 | 195k | //===----------------------------------------------------------------------===// |
15 | 195k | // QNAME names a member of amd_kernel_code_t; FLD_T expands to two comma-separated items: decltype of that member, then &member. |
16 | 195k | #define QNAME(name) amd_kernel_code_t::name |
17 | 195k | #define FLD_T(name) decltype(QNAME(name)), &QNAME(name) |
18 | 195k | // FIELD2 emits one RECORD whose printer/parser are printField/parseField instantiated with FLD_T(name). |
19 | 195k | #define FIELD2(sname, aname, name) \ |
20 | 5.48M | RECORD(sname, aname, printField<FLD_T(name)>, parseField<FLD_T(name)>) |
21 | 195k | // FIELD is FIELD2 with the same identifier passed for all three arguments. |
22 | 4.30M | #define FIELD(name) FIELD2(name, name, name) |
23 | 195k | |
24 | 195k | // PRINTCODEPROP(X): printBitField over code_properties using AMD_CODE_PROPERTY_X_SHIFT and AMD_CODE_PROPERTY_X_WIDTH. |
25 | 195k | #define PRINTCODEPROP(name) \ |
26 | 195k | printBitField<FLD_T(code_properties),\ |
27 | 195k | AMD_CODE_PROPERTY_##name##_SHIFT,\ |
28 | 195k | AMD_CODE_PROPERTY_##name##_WIDTH> |
29 | 195k | // PARSECODEPROP(X): the parseBitField counterpart, built from the same two constants. |
30 | 195k | #define PARSECODEPROP(name) \ |
31 | 195k | parseBitField<FLD_T(code_properties),\ |
32 | 195k | AMD_CODE_PROPERTY_##name##_SHIFT,\ |
33 | 195k | AMD_CODE_PROPERTY_##name##_WIDTH> |
34 | 195k | // CODEPROP emits one RECORD using name for both names; shift is the constant infix handed to the two macros above. |
35 | 195k | #define CODEPROP(name, shift) \ |
36 | 3.13M | RECORD(name, name, PRINTCODEPROP(shift), PARSECODEPROP(shift)) |
37 | 195k | // PRINTCOMP prints GetMacro applied to compute_pgm_resource_registers >> Shift; PARSECOMP ORs SetMacro(Value) << Shift into it. |
38 | 195k | // These have to be lambdas because of Set/GetMacro. NOTE(review): PARSECOMP never clears the old field bits first - confirm intended. |
39 | 195k | #define PRINTCOMP(GetMacro, Shift) \ |
40 | 195k | [](StringRef Name, const amd_kernel_code_t &C, raw_ostream &OS) { \ |
41 | 195k | printName(OS, Name) << \ |
42 | 195k | (int)GetMacro(C.compute_pgm_resource_registers >> Shift); \ |
43 | 195k | } |
44 | 195k | #define PARSECOMP(SetMacro, Shift) \ |
45 | 195k | [](amd_kernel_code_t &C, MCAsmParser &MCParser, raw_ostream &Err) { \ |
46 | 195k | int64_t Value = 0; \ |
47 | 195k | if (!expectAbsExpression(MCParser, Value, Err)) \ |
48 | 195k | return false; \ |
49 | 195k | C.compute_pgm_resource_registers |= SetMacro(Value) << Shift; \ |
50 | 195k | return true; \ |
51 | 195k | } |
52 | 195k | // COMPPGM emits one RECORD whose callbacks are the PRINTCOMP/PARSECOMP lambdas for the given accessors and shift. |
53 | 195k | #define COMPPGM(name, aname, GetMacro, SetMacro, Shift) \ |
54 | 3.72M | RECORD(name, aname, PRINTCOMP(GetMacro, Shift), PARSECOMP(SetMacro, Shift)) |
55 | 195k | // COMPPGM1 pastes AccMacro onto the G_00B848_/S_00B848_ prefixes and uses shift 0. |
56 | 195k | #define COMPPGM1(name, aname, AccMacro) \ |
57 | 1.56M | COMPPGM(name, aname, G_00B848_##AccMacro, S_00B848_##AccMacro, 0) |
58 | 195k | // COMPPGM2 pastes AccMacro onto the G_00B84C_/S_00B84C_ prefixes and uses shift 32. |
59 | 195k | #define COMPPGM2(name, aname, AccMacro) \ |
60 | 2.15M | COMPPGM(name, aname, G_00B84C_##AccMacro, S_00B84C_##AccMacro, 32) |
61 | 195k | |
62 | 195k | /////////////////////////////////////////////////////////////////////////////// |
63 | 195k | // Begin of the table |
64 | 195k | // Define RECORD(name, aname, print, parse) in your code to get field definitions |
65 | 195k | // and include this file; every entry below expands to one four-argument RECORD. |
66 | 195k | |
67 | 195k | FIELD2(amd_code_version_major, kernel_code_version_major, amd_kernel_code_version_major), |
68 | 195k | FIELD2(amd_code_version_minor, kernel_code_version_minor, amd_kernel_code_version_minor), |
69 | 195k | FIELD2(amd_machine_kind, machine_kind, amd_machine_kind), |
70 | 195k | FIELD2(amd_machine_version_major, machine_version_major, amd_machine_version_major), |
71 | 195k | FIELD2(amd_machine_version_minor, machine_version_minor, amd_machine_version_minor), |
72 | 195k | FIELD2(amd_machine_version_stepping, machine_version_stepping, amd_machine_version_stepping), |
73 | 195k | // Members recorded under their own identifier (FIELD passes it for both names and for the member). |
74 | 195k | FIELD(kernel_code_entry_byte_offset), |
75 | 195k | FIELD(kernel_code_prefetch_byte_size), |
76 | 195k | FIELD(max_scratch_backing_memory_byte_size), |
77 | 195k | // Bit fields of compute_pgm_resource_registers; COMPPGM1 entries use shift 0 and COMPPGM2 entries use shift 32. |
78 | 195k | COMPPGM1(granulated_workitem_vgpr_count, compute_pgm_rsrc1_vgprs, VGPRS), |
79 | 195k | COMPPGM1(granulated_wavefront_sgpr_count, compute_pgm_rsrc1_sgprs, SGPRS), |
80 | 195k | COMPPGM1(priority, compute_pgm_rsrc1_priority, PRIORITY), |
81 | 195k | COMPPGM1(float_mode, compute_pgm_rsrc1_float_mode, FLOAT_MODE), // TODO: split float_mode |
82 | 195k | COMPPGM1(priv, compute_pgm_rsrc1_priv, PRIV), |
83 | 195k | COMPPGM1(enable_dx10_clamp, compute_pgm_rsrc1_dx10_clamp, DX10_CLAMP), |
84 | 195k | COMPPGM1(debug_mode, compute_pgm_rsrc1_debug_mode, DEBUG_MODE), |
85 | 195k | COMPPGM1(enable_ieee_mode, compute_pgm_rsrc1_ieee_mode, IEEE_MODE), |
86 | 195k | // TODO: bulky |
87 | 195k | // TODO: cdbg_user |
88 | 195k | COMPPGM2(enable_sgpr_private_segment_wave_byte_offset, compute_pgm_rsrc2_scratch_en, SCRATCH_EN), |
89 | 195k | COMPPGM2(user_sgpr_count, compute_pgm_rsrc2_user_sgpr, USER_SGPR), |
90 | 195k | COMPPGM2(enable_trap_handler, compute_pgm_rsrc2_trap_handler, TRAP_HANDLER), |
91 | 195k | COMPPGM2(enable_sgpr_workgroup_id_x, compute_pgm_rsrc2_tgid_x_en, TGID_X_EN), |
92 | 195k | COMPPGM2(enable_sgpr_workgroup_id_y, compute_pgm_rsrc2_tgid_y_en, TGID_Y_EN), |
93 | 195k | COMPPGM2(enable_sgpr_workgroup_id_z, compute_pgm_rsrc2_tgid_z_en, TGID_Z_EN), |
94 | 195k | COMPPGM2(enable_sgpr_workgroup_info, compute_pgm_rsrc2_tg_size_en, TG_SIZE_EN), |
95 | 195k | COMPPGM2(enable_vgpr_workitem_id, compute_pgm_rsrc2_tidig_comp_cnt, TIDIG_COMP_CNT), |
96 | 195k | COMPPGM2(enable_exception_msb, compute_pgm_rsrc2_excp_en_msb, EXCP_EN_MSB), // TODO: split enable_exception_msb |
97 | 195k | COMPPGM2(granulated_lds_size, compute_pgm_rsrc2_lds_size, LDS_SIZE), |
98 | 195k | COMPPGM2(enable_exception, compute_pgm_rsrc2_excp_en, EXCP_EN), // TODO: split enable_exception |
99 | 195k | // Bit fields of code_properties; the second argument selects the AMD_CODE_PROPERTY_<id>_SHIFT/_WIDTH pair. |
100 | 195k | CODEPROP(enable_sgpr_private_segment_buffer, ENABLE_SGPR_PRIVATE_SEGMENT_BUFFER), |
101 | 195k | CODEPROP(enable_sgpr_dispatch_ptr, ENABLE_SGPR_DISPATCH_PTR), |
102 | 195k | CODEPROP(enable_sgpr_queue_ptr, ENABLE_SGPR_QUEUE_PTR), |
103 | 195k | CODEPROP(enable_sgpr_kernarg_segment_ptr, ENABLE_SGPR_KERNARG_SEGMENT_PTR), |
104 | 195k | CODEPROP(enable_sgpr_dispatch_id, ENABLE_SGPR_DISPATCH_ID), |
105 | 195k | CODEPROP(enable_sgpr_flat_scratch_init, ENABLE_SGPR_FLAT_SCRATCH_INIT), |
106 | 195k | CODEPROP(enable_sgpr_private_segment_size, ENABLE_SGPR_PRIVATE_SEGMENT_SIZE), |
107 | 195k | CODEPROP(enable_sgpr_grid_workgroup_count_x, ENABLE_SGPR_GRID_WORKGROUP_COUNT_X), |
108 | 195k | CODEPROP(enable_sgpr_grid_workgroup_count_y, ENABLE_SGPR_GRID_WORKGROUP_COUNT_Y), |
109 | 195k | CODEPROP(enable_sgpr_grid_workgroup_count_z, ENABLE_SGPR_GRID_WORKGROUP_COUNT_Z), |
110 | 195k | CODEPROP(enable_ordered_append_gds, ENABLE_ORDERED_APPEND_GDS), |
111 | 195k | CODEPROP(private_element_size, PRIVATE_ELEMENT_SIZE), |
112 | 195k | CODEPROP(is_ptr64, IS_PTR64), |
113 | 195k | CODEPROP(is_dynamic_callstack, IS_DYNAMIC_CALLSTACK), |
114 | 195k | CODEPROP(is_debug_enabled, IS_DEBUG_SUPPORTED), |
115 | 195k | CODEPROP(is_xnack_enabled, IS_XNACK_SUPPORTED), |
116 | 195k | // More members recorded under their own identifier; the final entry has no trailing comma. |
117 | 195k | FIELD(workitem_private_segment_byte_size), |
118 | 195k | FIELD(workgroup_group_segment_byte_size), |
119 | 195k | FIELD(gds_segment_byte_size), |
120 | 195k | FIELD(kernarg_segment_byte_size), |
121 | 195k | FIELD(workgroup_fbarrier_count), |
122 | 195k | FIELD(wavefront_sgpr_count), |
123 | 195k | FIELD(workitem_vgpr_count), |
124 | 195k | FIELD(reserved_vgpr_first), |
125 | 195k | FIELD(reserved_vgpr_count), |
126 | 195k | FIELD(reserved_sgpr_first), |
127 | 195k | FIELD(reserved_sgpr_count), |
128 | 195k | FIELD(debug_wavefront_private_segment_offset_sgpr), |
129 | 195k | FIELD(debug_private_segment_buffer_sgpr), |
130 | 195k | FIELD(kernarg_segment_alignment), |
131 | 195k | FIELD(group_segment_alignment), |
132 | 195k | FIELD(private_segment_alignment), |
133 | 195k | FIELD(wavefront_size), |
134 | 195k | FIELD(call_convention), |
135 | 195k | FIELD(runtime_loader_kernel_symbol) |
136 | 195k | // TODO: control_directive |
137 | 195k | |
138 | 195k | // end of the table |
139 | 195k | /////////////////////////////////////////////////////////////////////////////// |
140 | 195k | // Undefine every helper macro defined above so that none of them leaks into the including file. |
141 | 195k | #undef QNAME |
142 | 195k | #undef FLD_T |
143 | 195k | #undef FIELD2 |
144 | 195k | #undef FIELD |
145 | 195k | #undef PRINTCODEPROP |
146 | 195k | #undef PARSECODEPROP |
147 | 195k | #undef CODEPROP |
148 | 195k | #undef PRINTCOMP |
149 | 195k | #undef PARSECOMP |
150 | 195k | #undef COMPPGM |
151 | 195k | #undef COMPPGM1 |
152 | 195k | #undef COMPPGM2 |