xref: /qemu/tests/tcg/hexagon/mem_noshuf.c (revision d7a84021)
1 /*
2  *  Copyright(c) 2019-2021 Qualcomm Innovation Center, Inc. All Rights Reserved.
3  *
4  *  This program is free software; you can redistribute it and/or modify
5  *  it under the terms of the GNU General Public License as published by
6  *  the Free Software Foundation; either version 2 of the License, or
7  *  (at your option) any later version.
8  *
9  *  This program is distributed in the hope that it will be useful,
10  *  but WITHOUT ANY WARRANTY; without even the implied warranty of
11  *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
12  *  GNU General Public License for more details.
13  *
14  *  You should have received a copy of the GNU General Public License
15  *  along with this program; if not, see <http://www.gnu.org/licenses/>.
16  */
17 
18 #include <stdio.h>
19 
20 /*
21  *  Make sure that the :mem_noshuf packet attribute is honored.
22  *  This is important when the addresses overlap.
23  *  The store instruction in slot 1 effectively executes first,
24  *  followed by the load instruction in slot 0.
25  */
26 
27 #define MEM_NOSHUF32(NAME, ST_TYPE, LD_TYPE, ST_OP, LD_OP) \
28 static inline unsigned int NAME(ST_TYPE * p, LD_TYPE * q, ST_TYPE x) \
29 { \
30     unsigned int ret; \
31     asm volatile("{\n\t" \
32                  "    " #ST_OP "(%1) = %3\n\t" \
33                  "    %0 = " #LD_OP "(%2)\n\t" \
34                  "}:mem_noshuf\n" \
35                  : "=r"(ret) \
36                  : "r"(p), "r"(q), "r"(x) \
37                  : "memory"); \
38     return ret; \
39 }
40 
41 #define MEM_NOSHUF64(NAME, ST_TYPE, LD_TYPE, ST_OP, LD_OP) \
42 static inline unsigned long long NAME(ST_TYPE * p, LD_TYPE * q, ST_TYPE x) \
43 { \
44     unsigned long long ret; \
45     asm volatile("{\n\t" \
46                  "    " #ST_OP "(%1) = %3\n\t" \
47                  "    %0 = " #LD_OP "(%2)\n\t" \
48                  "}:mem_noshuf\n" \
49                  : "=r"(ret) \
50                  : "r"(p), "r"(q), "r"(x) \
51                  : "memory"); \
52     return ret; \
53 }
54 
55 /* Store byte combinations */
56 MEM_NOSHUF32(mem_noshuf_sb_lb,  signed char,  signed char,      memb, memb)
57 MEM_NOSHUF32(mem_noshuf_sb_lub, signed char,  unsigned char,    memb, memub)
58 MEM_NOSHUF32(mem_noshuf_sb_lh,  signed char,  signed short,     memb, memh)
59 MEM_NOSHUF32(mem_noshuf_sb_luh, signed char,  unsigned short,   memb, memuh)
60 MEM_NOSHUF32(mem_noshuf_sb_lw,  signed char,  signed int,       memb, memw)
61 MEM_NOSHUF64(mem_noshuf_sb_ld,  signed char,  signed long long, memb, memd)
62 
63 /* Store half combinations */
64 MEM_NOSHUF32(mem_noshuf_sh_lb,  signed short, signed char,      memh, memb)
65 MEM_NOSHUF32(mem_noshuf_sh_lub, signed short, unsigned char,    memh, memub)
66 MEM_NOSHUF32(mem_noshuf_sh_lh,  signed short, signed short,     memh, memh)
67 MEM_NOSHUF32(mem_noshuf_sh_luh, signed short, unsigned short,   memh, memuh)
68 MEM_NOSHUF32(mem_noshuf_sh_lw,  signed short, signed int,       memh, memw)
69 MEM_NOSHUF64(mem_noshuf_sh_ld,  signed short, signed long long, memh, memd)
70 
71 /* Store word combinations */
72 MEM_NOSHUF32(mem_noshuf_sw_lb,  signed int,   signed char,      memw, memb)
73 MEM_NOSHUF32(mem_noshuf_sw_lub, signed int,   unsigned char,    memw, memub)
74 MEM_NOSHUF32(mem_noshuf_sw_lh,  signed int,   signed short,     memw, memh)
75 MEM_NOSHUF32(mem_noshuf_sw_luh, signed int,   unsigned short,   memw, memuh)
76 MEM_NOSHUF32(mem_noshuf_sw_lw,  signed int,   signed int,       memw, memw)
77 MEM_NOSHUF64(mem_noshuf_sw_ld,  signed int,   signed long long, memw, memd)
78 
79 /* Store double combinations */
80 MEM_NOSHUF32(mem_noshuf_sd_lb,  long long,    signed char,      memd, memb)
81 MEM_NOSHUF32(mem_noshuf_sd_lub, long long,    unsigned char,    memd, memub)
82 MEM_NOSHUF32(mem_noshuf_sd_lh,  long long,    signed short,     memd, memh)
83 MEM_NOSHUF32(mem_noshuf_sd_luh, long long,    unsigned short,   memd, memuh)
84 MEM_NOSHUF32(mem_noshuf_sd_lw,  long long,    signed int,       memd, memw)
85 MEM_NOSHUF64(mem_noshuf_sd_ld,  long long,    signed long long, memd, memd)
86 
87 static inline unsigned int cancel_sw_lb(int pred, int *p, signed char *q, int x)
88 {
89     unsigned int ret;
90     asm volatile("p0 = cmp.eq(%4, #0)\n\t"
91                  "{\n\t"
92                  "    if (!p0) memw(%1) = %3\n\t"
93                  "    %0 = memb(%2)\n\t"
94                  "}:mem_noshuf\n"
95                  : "=r"(ret)
96                  : "r"(p), "r"(q), "r"(x), "r"(pred)
97                  : "p0", "memory");
98     return ret;
99 }
100 
101 static inline
102 unsigned long long cancel_sw_ld(int pred, int *p, long long *q, int x)
103 {
104     long long ret;
105     asm volatile("p0 = cmp.eq(%4, #0)\n\t"
106                  "{\n\t"
107                  "    if (!p0) memw(%1) = %3\n\t"
108                  "    %0 = memd(%2)\n\t"
109                  "}:mem_noshuf\n"
110                  : "=r"(ret)
111                  : "r"(p), "r"(q), "r"(x), "r"(pred)
112                  : "p0", "memory");
113     return ret;
114 }
115 
116 typedef union {
117     signed long long d[2];
118     unsigned long long ud[2];
119     signed int w[4];
120     unsigned int uw[4];
121     signed short h[8];
122     unsigned short uh[8];
123     signed char b[16];
124     unsigned char ub[16];
125 } Memory;
126 
127 int err;
128 
129 static void check32(int n, int expect)
130 {
131     if (n != expect) {
132         printf("ERROR: 0x%08x != 0x%08x\n", n, expect);
133         err++;
134     }
135 }
136 
137 static void check64(long long n, long long expect)
138 {
139     if (n != expect) {
140         printf("ERROR: 0x%08llx != 0x%08llx\n", n, expect);
141         err++;
142     }
143 }
144 
145 int main()
146 {
147     Memory n;
148     unsigned int res32;
149     unsigned long long res64;
150 
151     /*
152      * Store byte combinations
153      */
154     n.w[0] = ~0;
155     res32 = mem_noshuf_sb_lb(&n.b[0], &n.b[0], 0x87);
156     check32(res32, 0xffffff87);
157 
158     n.w[0] = ~0;
159     res32 = mem_noshuf_sb_lub(&n.b[0], &n.ub[0], 0x87);
160     check32(res32, 0x00000087);
161 
162     n.w[0] = ~0;
163     res32 = mem_noshuf_sb_lh(&n.b[0], &n.h[0], 0x87);
164     check32(res32, 0xffffff87);
165 
166     n.w[0] = ~0;
167     res32 = mem_noshuf_sb_luh(&n.b[0], &n.uh[0], 0x87);
168     check32(res32, 0x0000ff87);
169 
170     n.w[0] = ~0;
171     res32 = mem_noshuf_sb_lw(&n.b[0], &n.w[0], 0x87);
172     check32(res32, 0xffffff87);
173 
174     n.d[0] = ~0LL;
175     res64 = mem_noshuf_sb_ld(&n.b[0], &n.d[0], 0x87);
176     check64(res64, 0xffffffffffffff87LL);
177 
178     /*
179      * Store half combinations
180      */
181     n.w[0] = ~0;
182     res32 = mem_noshuf_sh_lb(&n.h[0], &n.b[0], 0x8787);
183     check32(res32, 0xffffff87);
184 
185     n.w[0] = ~0;
186     res32 = mem_noshuf_sh_lub(&n.h[0], &n.ub[1], 0x8f87);
187     check32(res32, 0x0000008f);
188 
189     n.w[0] = ~0;
190     res32 = mem_noshuf_sh_lh(&n.h[0], &n.h[0], 0x8a87);
191     check32(res32, 0xffff8a87);
192 
193     n.w[0] = ~0;
194     res32 = mem_noshuf_sh_luh(&n.h[0], &n.uh[0], 0x8a87);
195     check32(res32, 0x8a87);
196 
197     n.w[0] = ~0;
198     res32 = mem_noshuf_sh_lw(&n.h[1], &n.w[0], 0x8a87);
199     check32(res32, 0x8a87ffff);
200 
201     n.w[0] = ~0;
202     res64 = mem_noshuf_sh_ld(&n.h[1], &n.d[0], 0x8a87);
203     check64(res64, 0xffffffff8a87ffffLL);
204 
205     /*
206      * Store word combinations
207      */
208     n.w[0] = ~0;
209     res32 = mem_noshuf_sw_lb(&n.w[0], &n.b[0], 0x12345687);
210     check32(res32, 0xffffff87);
211 
212     n.w[0] = ~0;
213     res32 = mem_noshuf_sw_lub(&n.w[0], &n.ub[0], 0x12345687);
214     check32(res32, 0x00000087);
215 
216     n.w[0] = ~0;
217     res32 = mem_noshuf_sw_lh(&n.w[0], &n.h[0], 0x1234f678);
218     check32(res32, 0xfffff678);
219 
220     n.w[0] = ~0;
221     res32 = mem_noshuf_sw_luh(&n.w[0], &n.uh[0], 0x12345678);
222     check32(res32, 0x00005678);
223 
224     n.w[0] = ~0;
225     res32 = mem_noshuf_sw_lw(&n.w[0], &n.w[0], 0x12345678);
226     check32(res32, 0x12345678);
227 
228     n.d[0] = ~0LL;
229     res64 = mem_noshuf_sw_ld(&n.w[0], &n.d[0], 0x12345678);
230     check64(res64, 0xffffffff12345678LL);
231 
232     /*
233      * Store double combinations
234      */
235     n.d[0] = ~0LL;
236     res32 = mem_noshuf_sd_lb(&n.d[0], &n.b[1], 0x123456789abcdef0);
237     check32(res32, 0xffffffde);
238 
239     n.d[0] = ~0LL;
240     res32 = mem_noshuf_sd_lub(&n.d[0], &n.ub[1], 0x123456789abcdef0);
241     check32(res32, 0x000000de);
242 
243     n.d[0] = ~0LL;
244     res32 = mem_noshuf_sd_lh(&n.d[0], &n.h[1], 0x123456789abcdef0);
245     check32(res32, 0xffff9abc);
246 
247     n.d[0] = ~0LL;
248     res32 = mem_noshuf_sd_luh(&n.d[0], &n.uh[1], 0x123456789abcdef0);
249     check32(res32, 0x00009abc);
250 
251     n.d[0] = ~0LL;
252     res32 = mem_noshuf_sd_lw(&n.d[0], &n.w[1], 0x123456789abcdef0);
253     check32(res32, 0x12345678);
254 
255     n.d[0] = ~0LL;
256     res64 = mem_noshuf_sd_ld(&n.d[0], &n.d[0], 0x123456789abcdef0);
257     check64(res64, 0x123456789abcdef0LL);
258 
259     /*
260      * Predicated word stores
261      */
262     n.w[0] = ~0;
263     res32 = cancel_sw_lb(0, &n.w[0], &n.b[0], 0x12345678);
264     check32(res32, 0xffffffff);
265 
266     n.w[0] = ~0;
267     res32 = cancel_sw_lb(1, &n.w[0], &n.b[0], 0x12345687);
268     check32(res32, 0xffffff87);
269 
270     /*
271      * Predicated double stores
272      */
273     n.d[0] = ~0LL;
274     res64 = cancel_sw_ld(0, &n.w[0], &n.d[0], 0x12345678);
275     check64(res64, 0xffffffffffffffffLL);
276 
277     n.d[0] = ~0LL;
278     res64 = cancel_sw_ld(1, &n.w[0], &n.d[0], 0x12345678);
279     check64(res64, 0xffffffff12345678LL);
280 
281     n.d[0] = ~0LL;
282     res64 = cancel_sw_ld(0, &n.w[1], &n.d[0], 0x12345678);
283     check64(res64, 0xffffffffffffffffLL);
284 
285     n.d[0] = ~0LL;
286     res64 = cancel_sw_ld(1, &n.w[1], &n.d[0], 0x12345678);
287     check64(res64, 0x12345678ffffffffLL);
288 
289     /*
290      * No overlap tests
291      */
292     n.w[0] = ~0;
293     res32 = mem_noshuf_sb_lb(&n.b[1], &n.b[0], 0x87);
294     check32(res32, 0xffffffff);
295 
296     n.w[0] = ~0;
297     res32 = mem_noshuf_sb_lb(&n.b[0], &n.b[1], 0x87);
298     check32(res32, 0xffffffff);
299 
300     n.w[0] = ~0;
301     res32 = mem_noshuf_sh_lh(&n.h[1], &n.h[0], 0x8787);
302     check32(res32, 0xffffffff);
303 
304     n.w[0] = ~0;
305     res32 = mem_noshuf_sh_lh(&n.h[0], &n.h[1], 0x8787);
306     check32(res32, 0xffffffff);
307 
308     n.d[0] = ~0LL;
309     res32 = mem_noshuf_sw_lw(&n.w[0], &n.w[1], 0x12345678);
310     check32(res32, 0xffffffff);
311 
312     n.d[0] = ~0LL;
313     res32 = mem_noshuf_sw_lw(&n.w[1], &n.w[0], 0x12345678);
314     check32(res32, 0xffffffff);
315 
316     n.d[0] = ~0LL;
317     n.d[1] = ~0LL;
318     res64 = mem_noshuf_sd_ld(&n.d[1], &n.d[0], 0x123456789abcdef0LL);
319     check64(res64, 0xffffffffffffffffLL);
320 
321     n.d[0] = ~0LL;
322     n.d[1] = ~0LL;
323     res64 = mem_noshuf_sd_ld(&n.d[0], &n.d[1], 0x123456789abcdef0LL);
324     check64(res64, 0xffffffffffffffffLL);
325 
326     puts(err ? "FAIL" : "PASS");
327     return err;
328 }
329