Lines Matching refs:GFX6

4 …e=amdgcn-amd-amdpal -mcpu=tahiti -verify-machineinstrs < %s | FileCheck -check-prefixes=GCN,GFX6 %s
34 ; GFX6-LABEL: store_lds_v4i32:
35 ; GFX6: ; %bb.0:
36 ; GFX6-NEXT: s_load_dword s4, s[0:1], 0x9
37 ; GFX6-NEXT: s_load_dwordx4 s[0:3], s[0:1], 0xd
38 ; GFX6-NEXT: s_mov_b32 m0, -1
39 ; GFX6-NEXT: s_waitcnt lgkmcnt(0)
40 ; GFX6-NEXT: v_mov_b32_e32 v4, s4
41 ; GFX6-NEXT: v_mov_b32_e32 v0, s2
42 ; GFX6-NEXT: v_mov_b32_e32 v1, s3
43 ; GFX6-NEXT: v_mov_b32_e32 v2, s0
44 ; GFX6-NEXT: v_mov_b32_e32 v3, s1
45 ; GFX6-NEXT: ds_write2_b64 v4, v[2:3], v[0:1] offset1:1
46 ; GFX6-NEXT: s_endpgm
149 ; GFX6-LABEL: store_lds_v4i32_align1:
150 ; GFX6: ; %bb.0:
151 ; GFX6-NEXT: s_load_dword s4, s[0:1], 0x9
152 ; GFX6-NEXT: s_load_dwordx4 s[0:3], s[0:1], 0xd
153 ; GFX6-NEXT: s_mov_b32 m0, -1
154 ; GFX6-NEXT: s_waitcnt lgkmcnt(0)
155 ; GFX6-NEXT: v_mov_b32_e32 v0, s4
156 ; GFX6-NEXT: v_mov_b32_e32 v1, s3
157 ; GFX6-NEXT: v_mov_b32_e32 v2, s2
158 ; GFX6-NEXT: ds_write_b8 v0, v1 offset:12
159 ; GFX6-NEXT: ds_write_b8 v0, v2 offset:8
160 ; GFX6-NEXT: v_mov_b32_e32 v1, s1
161 ; GFX6-NEXT: ds_write_b8 v0, v1 offset:4
162 ; GFX6-NEXT: v_mov_b32_e32 v1, s0
163 ; GFX6-NEXT: s_lshr_b32 s4, s3, 8
164 ; GFX6-NEXT: ds_write_b8 v0, v1
165 ; GFX6-NEXT: v_mov_b32_e32 v1, s4
166 ; GFX6-NEXT: s_lshr_b32 s4, s3, 24
167 ; GFX6-NEXT: ds_write_b8 v0, v1 offset:13
168 ; GFX6-NEXT: v_mov_b32_e32 v1, s4
169 ; GFX6-NEXT: s_lshr_b32 s3, s3, 16
170 ; GFX6-NEXT: ds_write_b8 v0, v1 offset:15
171 ; GFX6-NEXT: v_mov_b32_e32 v1, s3
172 ; GFX6-NEXT: s_lshr_b32 s3, s2, 8
173 ; GFX6-NEXT: ds_write_b8 v0, v1 offset:14
174 ; GFX6-NEXT: v_mov_b32_e32 v1, s3
175 ; GFX6-NEXT: s_lshr_b32 s3, s2, 24
176 ; GFX6-NEXT: ds_write_b8 v0, v1 offset:9
177 ; GFX6-NEXT: v_mov_b32_e32 v1, s3
178 ; GFX6-NEXT: s_lshr_b32 s2, s2, 16
179 ; GFX6-NEXT: ds_write_b8 v0, v1 offset:11
180 ; GFX6-NEXT: v_mov_b32_e32 v1, s2
181 ; GFX6-NEXT: s_lshr_b32 s2, s1, 8
182 ; GFX6-NEXT: ds_write_b8 v0, v1 offset:10
183 ; GFX6-NEXT: v_mov_b32_e32 v1, s2
184 ; GFX6-NEXT: s_lshr_b32 s2, s1, 24
185 ; GFX6-NEXT: ds_write_b8 v0, v1 offset:5
186 ; GFX6-NEXT: v_mov_b32_e32 v1, s2
187 ; GFX6-NEXT: s_lshr_b32 s1, s1, 16
188 ; GFX6-NEXT: ds_write_b8 v0, v1 offset:7
189 ; GFX6-NEXT: v_mov_b32_e32 v1, s1
190 ; GFX6-NEXT: s_lshr_b32 s1, s0, 8
191 ; GFX6-NEXT: ds_write_b8 v0, v1 offset:6
192 ; GFX6-NEXT: v_mov_b32_e32 v1, s1
193 ; GFX6-NEXT: s_lshr_b32 s1, s0, 24
194 ; GFX6-NEXT: ds_write_b8 v0, v1 offset:1
195 ; GFX6-NEXT: v_mov_b32_e32 v1, s1
196 ; GFX6-NEXT: s_lshr_b32 s0, s0, 16
197 ; GFX6-NEXT: ds_write_b8 v0, v1 offset:3
198 ; GFX6-NEXT: v_mov_b32_e32 v1, s0
199 ; GFX6-NEXT: ds_write_b8 v0, v1 offset:2
200 ; GFX6-NEXT: s_endpgm
255 ; GFX6-LABEL: store_lds_v4i32_align2:
256 ; GFX6: ; %bb.0:
257 ; GFX6-NEXT: s_load_dword s4, s[0:1], 0x9
258 ; GFX6-NEXT: s_load_dwordx4 s[0:3], s[0:1], 0xd
259 ; GFX6-NEXT: s_mov_b32 m0, -1
260 ; GFX6-NEXT: s_waitcnt lgkmcnt(0)
261 ; GFX6-NEXT: v_mov_b32_e32 v0, s4
262 ; GFX6-NEXT: v_mov_b32_e32 v1, s3
263 ; GFX6-NEXT: v_mov_b32_e32 v2, s2
264 ; GFX6-NEXT: ds_write_b16 v0, v1 offset:12
265 ; GFX6-NEXT: ds_write_b16 v0, v2 offset:8
266 ; GFX6-NEXT: v_mov_b32_e32 v1, s1
267 ; GFX6-NEXT: ds_write_b16 v0, v1 offset:4
268 ; GFX6-NEXT: v_mov_b32_e32 v1, s0
269 ; GFX6-NEXT: s_lshr_b32 s3, s3, 16
270 ; GFX6-NEXT: ds_write_b16 v0, v1
271 ; GFX6-NEXT: v_mov_b32_e32 v1, s3
272 ; GFX6-NEXT: s_lshr_b32 s2, s2, 16
273 ; GFX6-NEXT: ds_write_b16 v0, v1 offset:14
274 ; GFX6-NEXT: v_mov_b32_e32 v1, s2
275 ; GFX6-NEXT: s_lshr_b32 s1, s1, 16
276 ; GFX6-NEXT: ds_write_b16 v0, v1 offset:10
277 ; GFX6-NEXT: v_mov_b32_e32 v1, s1
278 ; GFX6-NEXT: s_lshr_b32 s0, s0, 16
279 ; GFX6-NEXT: ds_write_b16 v0, v1 offset:6
280 ; GFX6-NEXT: v_mov_b32_e32 v1, s0
281 ; GFX6-NEXT: ds_write_b16 v0, v1 offset:2
282 ; GFX6-NEXT: s_endpgm
317 ; GFX6-LABEL: store_lds_v4i32_align4:
318 ; GFX6: ; %bb.0:
319 ; GFX6-NEXT: s_load_dword s4, s[0:1], 0x9
320 ; GFX6-NEXT: s_load_dwordx4 s[0:3], s[0:1], 0xd
321 ; GFX6-NEXT: s_mov_b32 m0, -1
322 ; GFX6-NEXT: s_waitcnt lgkmcnt(0)
323 ; GFX6-NEXT: v_mov_b32_e32 v0, s4
324 ; GFX6-NEXT: v_mov_b32_e32 v1, s1
325 ; GFX6-NEXT: v_mov_b32_e32 v2, s0
326 ; GFX6-NEXT: ds_write2_b32 v0, v2, v1 offset1:1
327 ; GFX6-NEXT: v_mov_b32_e32 v1, s3
328 ; GFX6-NEXT: v_mov_b32_e32 v2, s2
329 ; GFX6-NEXT: ds_write2_b32 v0, v2, v1 offset0:2 offset1:3
330 ; GFX6-NEXT: s_endpgm
363 ; GFX6-LABEL: store_lds_v4i32_align8:
364 ; GFX6: ; %bb.0:
365 ; GFX6-NEXT: s_load_dword s4, s[0:1], 0x9
366 ; GFX6-NEXT: s_load_dwordx4 s[0:3], s[0:1], 0xd
367 ; GFX6-NEXT: s_mov_b32 m0, -1
368 ; GFX6-NEXT: s_waitcnt lgkmcnt(0)
369 ; GFX6-NEXT: v_mov_b32_e32 v4, s4
370 ; GFX6-NEXT: v_mov_b32_e32 v0, s2
371 ; GFX6-NEXT: v_mov_b32_e32 v1, s3
372 ; GFX6-NEXT: v_mov_b32_e32 v2, s0
373 ; GFX6-NEXT: v_mov_b32_e32 v3, s1
374 ; GFX6-NEXT: ds_write2_b64 v4, v[2:3], v[0:1] offset1:1
375 ; GFX6-NEXT: s_endpgm
408 ; GFX6-LABEL: store_lds_v4i32_align16:
409 ; GFX6: ; %bb.0:
410 ; GFX6-NEXT: s_load_dword s4, s[0:1], 0x9
411 ; GFX6-NEXT: s_load_dwordx4 s[0:3], s[0:1], 0xd
412 ; GFX6-NEXT: s_mov_b32 m0, -1
413 ; GFX6-NEXT: s_waitcnt lgkmcnt(0)
414 ; GFX6-NEXT: v_mov_b32_e32 v4, s4
415 ; GFX6-NEXT: v_mov_b32_e32 v0, s2
416 ; GFX6-NEXT: v_mov_b32_e32 v1, s3
417 ; GFX6-NEXT: v_mov_b32_e32 v2, s0
418 ; GFX6-NEXT: v_mov_b32_e32 v3, s1
419 ; GFX6-NEXT: ds_write2_b64 v4, v[2:3], v[0:1] offset1:1
420 ; GFX6-NEXT: s_endpgm