1 /* -*- mesa-c++  -*-
2  *
3  * Copyright (c) 2018 Collabora LTD
4  *
5  * Author: Gert Wollny <gert.wollny@collabora.com>
6  *
7  * Permission is hereby granted, free of charge, to any person obtaining a
8  * copy of this software and associated documentation files (the "Software"),
9  * to deal in the Software without restriction, including without limitation
10  * on the rights to use, copy, modify, merge, publish, distribute, sub
11  * license, and/or sell copies of the Software, and to permit persons to whom
12  * the Software is furnished to do so, subject to the following conditions:
13  *
14  * The above copyright notice and this permission notice (including the next
15  * paragraph) shall be included in all copies or substantial portions of the
16  * Software.
17  *
18  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
19  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
20  * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
21  * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
22  * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
23  * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
24  * USE OR OTHER DEALINGS IN THE SOFTWARE.
25  */
26 
27 #include "sfn_alu_defines.h"
28 
29 namespace r600 {
30 
31 const std::map<EAluOp, AluOp> alu_ops = {
32    {op0_nop                 ,AluOp(0, 0, AluOp::a,"NOP")},
33    {op0_group_barrier       ,AluOp(0, 0, AluOp::a,"GROUP_BARRIER")},
34    {op0_group_seq_begin     ,AluOp(0, 0, AluOp::a,"GROUP_SEQ_BEGIN")},
35    {op0_group_seq_end       ,AluOp(0, 0, AluOp::a,"GROUP_SEQ_END")},
36    {op0_pred_set_clr        ,AluOp(0, 1, AluOp::a,"PRED_SET_CLR")},
37    {op0_store_flags         ,AluOp(0, 0, AluOp::v,"STORE_FLAGS")},
38    {op0_lds_1a              ,AluOp(0, 0, AluOp::v,"LDS_1A")},
39    {op0_lds_1a1d            ,AluOp(0, 0, AluOp::v,"LDS_1A1D")},
40    {op0_lds_2a              ,AluOp(0, 0, AluOp::v,"LDS_2A")},
41 
42    {op1_bcnt_int            ,AluOp(1, 0, AluOp::v,"BCNT_INT")},
43    {op1_bcnt_accum_prev_int ,AluOp(1, 0, AluOp::v,"BCNT_ACCUM_PREV_INT")},
44    {op1_bfrev_int           ,AluOp(1, 0, AluOp::a,"BFREV_INT")},
45    {op1_ceil                ,AluOp(1, 1, AluOp::a,"CEIL")},
46    {op1_cos                 ,AluOp(1, 1, AluOp::t,"COS")},
47    {op1_exp_ieee            ,AluOp(1, 1, AluOp::t,"EXP_IEEE")},
48    {op1_floor               ,AluOp(1, 1, AluOp::a,"FLOOR")},
49    {op1_flt_to_int          ,AluOp(1, 0, AluOp::a,"FLT_TO_INT")},
50    {op1_flt_to_uint         ,AluOp(1, 1, AluOp::t,"FLT_TO_UINT")},
51    {op1_flt_to_int_rpi      ,AluOp(1, 1, AluOp::v,"FLT_TO_INT_RPI")},
52    {op1_flt_to_int_floor    ,AluOp(1, 1, AluOp::v,"FLT_TO_INT_FLOOR")},
53    {op1_flt16_to_flt32      ,AluOp(1, 1, AluOp::v,"FLT16_TO_FLT32")},
54    {op1_flt32_to_flt16      ,AluOp(1, 1, AluOp::v,"FLT32_TO_FLT16")},
55    {op1_flt32_to_flt64      ,AluOp(1, 1, AluOp::v,"FLT32_TO_FLT64")},
56    {op1_flt64_to_flt32      ,AluOp(1, 1, AluOp::a,"FLT64_TO_FLT32")},
57    {op1_fract               ,AluOp(1, 1, AluOp::a,"FRACT")},
58    {op1_fract_64            ,AluOp(1, 1, AluOp::v,"FRACT_64")},
59    {op1_frexp_64            ,AluOp(1, 1, AluOp::v,"FREXP_64")},
60    {op1_int_to_flt          ,AluOp(1, 0, AluOp::t,"INT_TO_FLT")},
61    {op1_ldexp_64            ,AluOp(1, 1, AluOp::v,"LDEXP_64")},
62    {op1_interp_load_p0      ,AluOp(1, 1, AluOp::v,"INTERP_LOAD_P0")},
63    {op1_interp_load_p10     ,AluOp(1, 1, AluOp::v,"INTERP_LOAD_P10")},
64    {op1_interp_load_p20     ,AluOp(1, 1, AluOp::v,"INTERP_LOAD_P20")},
65    {op1_load_store_flags    ,AluOp(1, 0, AluOp::v,"LOAD_STORE_FLAGS")},
66    {op1_log_clamped         ,AluOp(1, 1, AluOp::t,"LOG_CLAMPED")},
67    {op1_log_ieee            ,AluOp(1, 1, AluOp::t,"LOG_IEEE")},
68    {op1_max4                ,AluOp(1, 1, AluOp::v,"MAX4")},
69    {op1_mbcnt_32hi_int      ,AluOp(1, 0, AluOp::v,"MBCNT_32HI_INT")},
70    {op1_mbcnt_32lo_accum_prev_int ,AluOp(1, 0, AluOp::v,"MBCNT_32LO_ACCUM_PREV_INT")},
71    {op1_mov                 ,AluOp(1, 0, AluOp::a,"MOV")},
72    {op1_mova_int            ,AluOp(1, 0, AluOp::v,"MOVA_INT")},
73    {op1_not_int             ,AluOp(1, 0, AluOp::a,"NOT_INT")},
74    {op1_offset_to_flt       ,AluOp(1, 0, AluOp::v,"OFFSET_TO_FLT")},
75    {op1_pred_set_inv        ,AluOp(1, 1, AluOp::a,"PRED_SET_INV")},
76    {op1_pred_set_restore    ,AluOp(1, 1, AluOp::a,"PRED_SET_RESTORE")},
77    {op1_set_cf_idx0         ,AluOp(1, 0, AluOp::a,"SET_CF_IDX0")}, /* Reads from AR register? */
78    {op1_set_cf_idx1         ,AluOp(1, 0, AluOp::a,"SET_CF_IDX1")}, /* Reads from AR register? */
79    {op1_recip_clamped       ,AluOp(1, 1, AluOp::t,"RECIP_CLAMPED")},
80    {op1_recip_ff            ,AluOp(1, 1, AluOp::t,"RECIP_FF")},
81    {op1_recip_ieee          ,AluOp(1, 1, AluOp::t,"RECIP_IEEE")},
82    {op1_recipsqrt_clamped   ,AluOp(1, 1, AluOp::t,"RECIPSQRT_CLAMPED")},
83    {op1_recipsqrt_ff        ,AluOp(1, 1, AluOp::t,"RECIPSQRT_FF")},
84    {op1_recipsqrt_ieee1     ,AluOp(1, 1, AluOp::t,"RECIPSQRT_IEEE")},
85    {op1_recip_int           ,AluOp(1, 0, AluOp::t,"RECIP_INT")},
86    {op1_recip_uint          ,AluOp(1, 0, AluOp::t,"RECIP_UINT")},
87    {op1_recip_64            ,AluOp(1, 1, AluOp::t,"RECIP_64")},
88    {op1_recip_clamped_64    ,AluOp(1, 1, AluOp::t,"RECIP_CLAMPED_64")},
89    {op1_recipsqrt_64        ,AluOp(1, 1, AluOp::t,"RECIPSQRT_64")},
90    {op1_recipsqrt_clamped_64,AluOp(1, 1, AluOp::t,"RECIPSQRT_CLAMPED_64")},
91    {op1_rndne               ,AluOp(1, 1, AluOp::a,"RNDNE")},
92    {op1_sqrt_ieee           ,AluOp(1, 1, AluOp::t,"SQRT_IEEE")},
93    {op1_sin                 ,AluOp(1, 1, AluOp::t,"SIN")},
94    {op1_trunc               ,AluOp(1, 1, AluOp::a,"TRUNC")},
95    {op1_sqrt_64             ,AluOp(1, 1, AluOp::t,"SQRT_64")},
96    {op1_ubyte0_flt          ,AluOp(1, 1, AluOp::v,"UBYTE0_FLT")},
97    {op1_ubyte1_flt          ,AluOp(1, 1, AluOp::v,"UBYTE1_FLT")},
98    {op1_ubyte2_flt          ,AluOp(1, 1, AluOp::v,"UBYTE2_FLT")},
99    {op1_ubyte3_flt          ,AluOp(1, 1, AluOp::v,"UBYTE3_FLT")},
100    {op1_uint_to_flt         ,AluOp(1, 0, AluOp::t,"UINT_TO_FLT")},
101    {op1_ffbh_uint           ,AluOp(1, 0, AluOp::v,"FFBH_UINT")},
102    {op1_ffbl_int            ,AluOp(1, 0, AluOp::v,"FFBL_INT")},
103    {op1_ffbh_int            ,AluOp(1, 0, AluOp::v,"FFBH_INT")},
104    {op1_flt_to_uint4        ,AluOp(1, 1, AluOp::v,"FLT_TO_UINT4")},
105    {op1v_flt32_to_flt64     ,AluOp(1, 1, AluOp::a,"FLT32_TO_FLT64")},
106    {op1v_flt64_to_flt32     ,AluOp(1, 1, AluOp::v,"FLT64_TO_FLT32")},
107 
108    {op2_add                 ,AluOp(2, 1, AluOp::a,"ADD")},
109    {op2_bfm_int             ,AluOp(2, 0, AluOp::v,"BFM_INT")},
110    {op2_mul                 ,AluOp(2, 1, AluOp::a,"MUL")},
111    {op2_mul_ieee            ,AluOp(2, 1, AluOp::a,"MUL_IEEE")},
112    {op2_max                 ,AluOp(2, 1, AluOp::a,"MAX")},
113    {op2_min                 ,AluOp(2, 1, AluOp::a,"MIN")},
114    {op2_max_dx10            ,AluOp(2, 1, AluOp::a,"MAX_DX10")},
115    {op2_min_dx10            ,AluOp(2, 1, AluOp::a,"MIN_DX10")},
116    {op2_sete                ,AluOp(2, 1, AluOp::a,"SETE")},
117    {op2_setgt               ,AluOp(2, 1, AluOp::a,"SETGT")},
118    {op2_setge               ,AluOp(2, 1, AluOp::a,"SETGE")},
119    {op2_setne               ,AluOp(2, 1, AluOp::a,"SETNE")},
120    {op2_sete_dx10           ,AluOp(2, 1, AluOp::a,"SETE_DX10")},
121    {op2_setgt_dx10          ,AluOp(2, 1, AluOp::a,"SETGT_DX10")},
122    {op2_setge_dx10          ,AluOp(2, 1, AluOp::a,"SETGE_DX10")},
123    {op2_setne_dx10          ,AluOp(2, 1, AluOp::a,"SETNE_DX10")},
124    {op2_ashr_int            ,AluOp(2, 0, AluOp::a,"ASHR_INT")},
125    {op2_lshr_int            ,AluOp(2, 0, AluOp::a,"LSHR_INT")},
126    {op2_lshl_int            ,AluOp(2, 0, AluOp::a,"LSHL_INT")},
127    {op2_mul_64              ,AluOp(2, 1, AluOp::a,"MUL_64")},
128    {op2_pred_setgt_uint     ,AluOp(2, 0, AluOp::a,"PRED_SETGT_UINT")},
129    {op2_pred_setge_uint     ,AluOp(2, 0, AluOp::a,"PRED_SETGE_UINT")},
130    {op2_pred_sete           ,AluOp(2, 1, AluOp::a,"PRED_SETE")},
131    {op2_pred_setgt          ,AluOp(2, 1, AluOp::a,"PRED_SETGT")},
132    {op2_pred_setge          ,AluOp(2, 1, AluOp::a,"PRED_SETGE")},
133    {op2_pred_setne          ,AluOp(2, 1, AluOp::a,"PRED_SETNE")},
134    {op2_pred_set_pop        ,AluOp(2, 1, AluOp::a,"PRED_SET_POP")},
135    {op2_pred_sete_push      ,AluOp(2, 1, AluOp::a,"PRED_SETE_PUSH")},
136    {op2_pred_setgt_push     ,AluOp(2, 1, AluOp::a,"PRED_SETGT_PUSH")},
137    {op2_pred_setge_push     ,AluOp(2, 1, AluOp::a,"PRED_SETGE_PUSH")},
138    {op2_pred_setne_push     ,AluOp(2, 1, AluOp::a,"PRED_SETNE_PUSH")},
139    {op2_kille               ,AluOp(2, 1, AluOp::a,"KILLE")},
140    {op2_killgt              ,AluOp(2, 1, AluOp::a,"KILLGT")},
141    {op2_killge              ,AluOp(2, 1, AluOp::a,"KILLGE")},
142    {op2_killne              ,AluOp(2, 1, AluOp::a,"KILLNE")},
143    {op2_and_int             ,AluOp(2, 0, AluOp::a,"AND_INT")},
144    {op2_or_int              ,AluOp(2, 0, AluOp::a,"OR_INT")},
145    {op2_xor_int             ,AluOp(2, 0, AluOp::a,"XOR_INT")},
146    {op2_add_int             ,AluOp(2, 0, AluOp::a,"ADD_INT")},
147    {op2_sub_int             ,AluOp(2, 0, AluOp::a,"SUB_INT")},
148    {op2_max_int             ,AluOp(2, 0, AluOp::a,"MAX_INT")},
149    {op2_min_int             ,AluOp(2, 0, AluOp::a,"MIN_INT")},
150    {op2_max_uint            ,AluOp(2, 0, AluOp::a,"MAX_UINT")},
151    {op2_min_uint            ,AluOp(2, 0, AluOp::a,"MIN_UINT")},
152    {op2_sete_int            ,AluOp(2, 0, AluOp::a,"SETE_INT")},
153    {op2_setgt_int           ,AluOp(2, 0, AluOp::a,"SETGT_INT")},
154    {op2_setge_int           ,AluOp(2, 0, AluOp::a,"SETGE_INT")},
155    {op2_setne_int           ,AluOp(2, 0, AluOp::a,"SETNE_INT")},
156    {op2_setgt_uint          ,AluOp(2, 0, AluOp::a,"SETGT_UINT")},
157    {op2_setge_uint          ,AluOp(2, 0, AluOp::a,"SETGE_UINT")},
158    {op2_killgt_uint         ,AluOp(2, 0, AluOp::a,"KILLGT_UINT")},
159    {op2_killge_uint         ,AluOp(2, 0, AluOp::a,"KILLGE_UINT")},
160    {op2_prede_int           ,AluOp(2, 0, AluOp::a,"PREDE_INT")},
161    {op2_pred_setgt_int      ,AluOp(2, 0, AluOp::a,"PRED_SETGT_INT")},
162    {op2_pred_setge_int      ,AluOp(2, 0, AluOp::a,"PRED_SETGE_INT")},
163    {op2_pred_setne_int      ,AluOp(2, 0, AluOp::a,"PRED_SETNE_INT")},
164    {op2_kille_int           ,AluOp(2, 0, AluOp::a,"KILLE_INT")},
165    {op2_killgt_int          ,AluOp(2, 0, AluOp::a,"KILLGT_INT")},
166    {op2_killge_int          ,AluOp(2, 0, AluOp::a,"KILLGE_INT")},
167    {op2_killne_int          ,AluOp(2, 0, AluOp::a,"KILLNE_INT")},
168    {op2_pred_sete_push_int  ,AluOp(2, 0, AluOp::a,"PRED_SETE_PUSH_INT")},
169    {op2_pred_setgt_push_int ,AluOp(2, 0, AluOp::a,"PRED_SETGT_PUSH_INT")},
170    {op2_pred_setge_push_int ,AluOp(2, 0, AluOp::a,"PRED_SETGE_PUSH_INT")},
171    {op2_pred_setne_push_int ,AluOp(2, 0, AluOp::a,"PRED_SETNE_PUSH_INT")},
172    {op2_pred_setlt_push_int ,AluOp(2, 0, AluOp::a,"PRED_SETLT_PUSH_INT")},
173    {op2_pred_setle_push_int ,AluOp(2, 0, AluOp::a,"PRED_SETLE_PUSH_INT")},
174    {op2_addc_uint           ,AluOp(2, 0, AluOp::a,"ADDC_UINT")},
175    {op2_subb_uint           ,AluOp(2, 0, AluOp::a,"SUBB_UINT")},
176    {op2_set_mode            ,AluOp(2, 0, AluOp::a,"SET_MODE")},
177    {op2_set_lds_size        ,AluOp(2, 0, AluOp::a,"SET_LDS_SIZE")},
178    {op2_mullo_int           ,AluOp(2, 0, AluOp::t,"MULLO_INT")},
179    {op2_mulhi_int           ,AluOp(2, 0, AluOp::t,"MULHI_INT")},
180    {op2_mullo_uint          ,AluOp(2, 0, AluOp::t,"MULLO_UINT")},
181    {op2_mulhi_uint          ,AluOp(2, 0, AluOp::t,"MULHI_UINT")},
182    {op2_dot_ieee            ,AluOp(2, 1, AluOp::v,"DOT_IEEE")},
183    {op2_mulhi_uint24        ,AluOp(2, 0, AluOp::v,"MULHI_UINT24")},
184    {op2_mul_uint24          ,AluOp(2, 0, AluOp::v,"MUL_UINT24")},
185    {op2_sete_64             ,AluOp(2, 1, AluOp::v,"SETE_64")},
186    {op2_setne_64            ,AluOp(2, 1, AluOp::v,"SETNE_64")},
187    {op2_setgt_64            ,AluOp(2, 1, AluOp::v,"SETGT_64")},
188    {op2_setge_64            ,AluOp(2, 1, AluOp::v,"SETGE_64")},
189    {op2_min_64              ,AluOp(2, 1, AluOp::v,"MIN_64")},
190    {op2_max_64              ,AluOp(2, 1, AluOp::v,"MAX_64")},
191    {op2_dot4                ,AluOp(2, 1, AluOp::v,"DOT4")},
192    {op2_dot4_ieee           ,AluOp(2, 1, AluOp::v,"DOT4_IEEE")},
193    {op2_cube                ,AluOp(2, 1, AluOp::v,"CUBE")},
194    {op2_pred_setgt_64       ,AluOp(2, 1, AluOp::v,"PRED_SETGT_64")},
195    {op2_pred_sete_64        ,AluOp(2, 1, AluOp::v,"PRED_SETE_64")},
196    {op2_pred_setge_64       ,AluOp(2, 1, AluOp::v,"PRED_SETGE_64")},
197    {OP2V_MUL_64             ,AluOp(2, 1, AluOp::v,"MUL_64")},
198    {op2_add_64              ,AluOp(2, 1, AluOp::v,"ADD_64")},
199    {op2_sad_accum_prev_uint ,AluOp(2, 0, AluOp::v,"SAD_ACCUM_PREV_UINT")},
200    {op2_dot                 ,AluOp(2, 1, AluOp::v,"DOT")},
201    {op2_mul_prev            ,AluOp(2, 1, AluOp::v,"MUL_PREV")},
202    {op2_mul_ieee_prev       ,AluOp(2, 1, AluOp::v,"MUL_IEEE_PREV")},
203    {op2_add_prev            ,AluOp(2, 1, AluOp::v,"ADD_PREV")},
204    {op2_muladd_prev         ,AluOp(2, 1, AluOp::v,"MULADD_PREV")},
205    {op2_muladd_ieee_prev    ,AluOp(2, 1, AluOp::v,"MULADD_IEEE_PREV")},
206    {op2_interp_xy           ,AluOp(2, 1, AluOp::v,"INTERP_XY")},
207    {op2_interp_zw           ,AluOp(2, 1, AluOp::v,"INTERP_ZW")},
208    {op2_interp_x            ,AluOp(2, 1, AluOp::v,"INTERP_X")},
209    {op2_interp_z            ,AluOp(2, 1, AluOp::v,"INTERP_Z")},
210 
211    {op3_bfe_uint            ,AluOp(3, 0, AluOp::v,"BFE_UINT")},
212    {op3_bfe_int             ,AluOp(3, 0, AluOp::v,"BFE_INT")},
213    {op3_bfi_int             ,AluOp(3, 0, AluOp::v,"BFI_INT")},
214    {op3_fma                 ,AluOp(3, 1, AluOp::v,"FMA")},
215    {op3_cndne_64            ,AluOp(3, 1, AluOp::v,"CNDNE_64")},
216    {op3_fma_64              ,AluOp(3, 1, AluOp::v,"FMA_64")},
217    {op3_lerp_uint           ,AluOp(3, 0, AluOp::v,"LERP_UINT")},
218    {op3_bit_align_int       ,AluOp(3, 0, AluOp::v,"BIT_ALIGN_INT")},
219    {op3_byte_align_int      ,AluOp(3, 0, AluOp::v,"BYTE_ALIGN_INT")},
220    {op3_sad_accum_uint      ,AluOp(3, 0, AluOp::v,"SAD_ACCUM_UINT")},
221    {op3_sad_accum_hi_uint   ,AluOp(3, 0, AluOp::v,"SAD_ACCUM_HI_UINT")},
222    {op3_muladd_uint24       ,AluOp(3, 0, AluOp::v,"MULADD_UINT24")},
223    {op3_lds_idx_op          ,AluOp(3, 0, AluOp::x,"LDS_IDX_OP")},
224    {op3_muladd              ,AluOp(3, 1, AluOp::a,"MULADD")},
225    {op3_muladd_m2           ,AluOp(3, 1, AluOp::a,"MULADD_M2")},
226    {op3_muladd_m4           ,AluOp(3, 1, AluOp::a,"MULADD_M4")},
227    {op3_muladd_d2           ,AluOp(3, 1, AluOp::a,"MULADD_D2")},
228    {op3_muladd_ieee         ,AluOp(3, 1, AluOp::a,"MULADD_IEEE")},
229    {op3_cnde                ,AluOp(3, 1, AluOp::a,"CNDE")},
230    {op3_cndgt               ,AluOp(3, 1, AluOp::a,"CNDGT")},
231    {op3_cndge               ,AluOp(3, 1, AluOp::a,"CNDGE")},
232    {op3_cnde_int            ,AluOp(3, 0, AluOp::a,"CNDE_INT")},
233    {op3_cndgt_int           ,AluOp(3, 0, AluOp::a,"CNDGT_INT")},
234    {op3_cndge_int           ,AluOp(3, 0, AluOp::a,"CNDGE_INT")},
235    {op3_mul_lit             ,AluOp(3, 1, AluOp::t,"MUL_LIT")}
236 };
237 
238 const std::map<AluInlineConstants, AluInlineConstantDescr> alu_src_const = {
239    {ALU_SRC_LDS_OQ_A, {false, "LDS_OQ_A"}},
240    {ALU_SRC_LDS_OQ_B, {false, "LDS_OQ_B"}},
241    {ALU_SRC_LDS_OQ_A_POP, {false, "LDS_OQ_A_POP"}},
242    {ALU_SRC_LDS_OQ_B_POP, {false, "LDS_OQ_B_POP"}},
243    {ALU_SRC_LDS_DIRECT_A, {false, "LDS_DIRECT_A"}},
244    {ALU_SRC_LDS_DIRECT_B, {false, "LDS_DIRECT_B"}},
245    {ALU_SRC_TIME_HI, {false, "TIME_HI"}},
246    {ALU_SRC_TIME_LO, {false, "TIME_LO"}},
247    {ALU_SRC_MASK_HI, {false, "MASK_HI"}},
248    {ALU_SRC_MASK_LO, {false, "MASK_LO"}},
249    {ALU_SRC_HW_WAVE_ID, {false, "HW_WAVE_ID"}},
250    {ALU_SRC_SIMD_ID, {false, "SIMD_ID"}},
251    {ALU_SRC_SE_ID, {false, "SE_ID"}},
252    {ALU_SRC_HW_THREADGRP_ID, {false, "HW_THREADGRP_ID"}},
253    {ALU_SRC_WAVE_ID_IN_GRP, {false, "WAVE_ID_IN_GRP"}},
254    {ALU_SRC_NUM_THREADGRP_WAVES, {false, "NUM_THREADGRP_WAVES"}},
255    {ALU_SRC_HW_ALU_ODD, {false, "HW_ALU_ODD"}},
256    {ALU_SRC_LOOP_IDX, {false, "LOOP_IDX"}},
257    {ALU_SRC_PARAM_BASE_ADDR, {false, "PARAM_BASE_ADDR"}},
258    {ALU_SRC_NEW_PRIM_MASK, {false, "NEW_PRIM_MASK"}},
259    {ALU_SRC_PRIM_MASK_HI, {false, "PRIM_MASK_HI"}},
260    {ALU_SRC_PRIM_MASK_LO, {false, "PRIM_MASK_LO"}},
261    {ALU_SRC_1_DBL_L, {false, "1.0L"}},
262    {ALU_SRC_1_DBL_M, {false, "1.0H"}},
263    {ALU_SRC_0_5_DBL_L, {false, "0.5L"}},
264    {ALU_SRC_0_5_DBL_M, {false, "0.5H"}},
265    {ALU_SRC_0, {false, "0"}},
266    {ALU_SRC_1, {false, "1.0"}},
267    {ALU_SRC_1_INT, {false, "1"}},
268    {ALU_SRC_M_1_INT, {false, "-1"}},
269    {ALU_SRC_0_5, {false, "0.5"}},
270    {ALU_SRC_LITERAL, {true, "ALU_SRC_LITERAL"}},
271    {ALU_SRC_PV, {true, "PV"}},
272    {ALU_SRC_PS, {false, "PS"}}
273 };
274 
275 const std::map<ESDOp, LDSOp> lds_ops = {
276    {DS_OP_ADD           , {2, "DS_ADD"}},
277    {DS_OP_SUB           , {2, "DS_SUB"}},
278    {DS_OP_RSUB          , {2, "DS_RSUB"}},
279    {DS_OP_INC           , {2, "DS_INC"}},
280    {DS_OP_DEC           , {2, "DS_DEC"}},
281    {DS_OP_MIN_INT       , {2, "DS_MIN_INT"}},
282    {DS_OP_MAX_INT       , {2, "DS_MAX_INT"}},
283    {DS_OP_MIN_UINT      , {2, "DS_MIN_UINT"}},
284    {DS_OP_MAX_UINT      , {2, "DS_MAX_UINT"}},
285    {DS_OP_AND           , {2, "DS_AND"}},
286    {DS_OP_OR            , {2, "DS_OR"}},
287    {DS_OP_XOR           , {2, "DS_XOR"}},
288    {DS_OP_MSKOR         , {3, "DS_MSKOR"}},
289    {DS_OP_WRITE         , {2, "DS_WRITE"}},
290    {DS_OP_WRITE_REL     , {3, "DS_WRITE_REL"}},
291    {DS_OP_WRITE2        , {3, "DS_WRITE2"}},
292    {DS_OP_CMP_STORE     , {3, "DS_CMP_STORE"}},
293    {DS_OP_CMP_STORE_SPF , {3, "DS_CMP_STORE_SPF"}},
294    {DS_OP_BYTE_WRITE    , {2, "DS_BYTE_WRITE"}},
295    {DS_OP_SHORT_WRITE   , {2, "DS_SHORT_WRITE"}},
296    {DS_OP_ADD_RET       , {2, "DS_ADD_RET"}},
297    {DS_OP_SUB_RET       , {2, "DS_SUB_RET"}},
298    {DS_OP_RSUB_RET      , {2, "DS_RSUB_RET"}},
299    {DS_OP_INC_RET       , {2, "DS_INC_RET"}},
300    {DS_OP_DEC_RET       , {2, "DS_DEC_RET"}},
301    {DS_OP_MIN_INT_RET   , {2, "DS_MIN_INT_RET"}},
302    {DS_OP_MAX_INT_RET   , {2, "DS_MAX_INT_RET"}},
303    {DS_OP_MIN_UINT_RET  , {2, "DS_MIN_UINT_RET"}},
304    {DS_OP_MAX_UINT_RET  , {2, "DS_MAX_UINT_RET"}},
305    {DS_OP_AND_RET       , {2, "DS_AND_RET"}},
306    {DS_OP_OR_RET        , {2, "DS_OR_RET"}},
307    {DS_OP_XOR_RET       , {2, "DS_XOR_RET"}},
308    {DS_OP_MSKOR_RET     , {3, "DS_MSKOR_RET"}},
309    {DS_OP_XCHG_RET      , {2, "DS_XCHG_RET"}},
310    {DS_OP_XCHG_REL_RET  , {3, "DS_XCHG_REL_RET"}},
311    {DS_OP_XCHG2_RET     , {3, "DS_XCHG2_RET"}},
312    {DS_OP_CMP_XCHG_RET  , {3, "DS_CMP_XCHG_RET"}},
313    {DS_OP_CMP_XCHG_SPF_RET, {3, "DS_CMP_XCHG_SPF_RET"}},
314    {DS_OP_READ_RET      , {1, "DS_READ_RET"}},
315    {DS_OP_READ_REL_RET  , {1, "DS_READ_REL_RET"}},
316    {DS_OP_READ2_RET     , {2, "DS_READ2_RET"}},
317    {DS_OP_READWRITE_RET , {3, "DS_READWRITE_RET"}},
318    {DS_OP_BYTE_READ_RET , {1, "DS_BYTE_READ_RET"}},
319    {DS_OP_UBYTE_READ_RET, {1, "DS_UBYTE_READ_RET"}},
320    {DS_OP_SHORT_READ_RET, {1, "DS_SHORT_READ_RET"}},
321    {DS_OP_USHORT_READ_RET, {1, "DS_USHORT_READ_RET"}},
322    {DS_OP_ATOMIC_ORDERED_ALLOC_RET , {3, "DS_ATOMIC_ORDERED_ALLOC_RET"}}
323 };
324 
325 }
326