Lines Matching refs:BO

37 #define BO	%rsi  macro
90 movapd -16 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm1 ;\
93 movapd -14 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm3 ;\
96 mulpd -10 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm0 ;\
98 movapd -12 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm5 ;\
105 movapd 0 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm1 ;\
108 movapd -6 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm3 ;\
110 mulpd -10 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm2 ;\
112 movapd -4 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm5 ;\
119 movapd -8 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm7 ;\
122 movapd -6 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm3 ;\
124 mulpd -2 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm4 ;\
126 movapd -4 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm5 ;\
133 movapd 8 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm7 ;\
136 movapd 2 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm3 ;\
138 mulpd -2 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm6 ;\
140 movapd 4 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm5 ;\
148 movapd 0 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm1 ;\
151 movapd 2 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm3 ;\
153 mulpd 6 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm0 ;\
155 movapd 4 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm5 ;\
162 movapd 16 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm1 ;\
165 movapd 10 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm3 ;\
167 mulpd 6 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm2 ;\
169 movapd 12 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm5 ;\
176 movapd 8 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm7 ;\
179 movapd 10 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm3 ;\
181 mulpd 14 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm4 ;\
183 movapd 12 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm5 ;\
190 movapd 24 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm7 ;\
193 movapd 18 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm3 ;\
195 mulpd 14 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm6 ;\
197 movapd 20 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm5 ;\
205 movapd -16 * SIZE + 2 * (xx) * SIZE(BO), %xmm1 ;\
208 movapd -14 * SIZE + 2 * (xx) * SIZE(BO), %xmm3 ;\
211 mulpd -10 * SIZE + 2 * (xx) * SIZE(BO), %xmm0 ;\
213 movapd -12 * SIZE + 2 * (xx) * SIZE(BO), %xmm5 ;\
220 movapd 0 * SIZE + 2 * (xx) * SIZE(BO), %xmm1 ;\
223 movapd -6 * SIZE + 2 * (xx) * SIZE(BO), %xmm3 ;\
225 mulpd -10 * SIZE + 2 * (xx) * SIZE(BO), %xmm2 ;\
227 movapd -4 * SIZE + 2 * (xx) * SIZE(BO), %xmm5 ;\
234 movapd -8 * SIZE + 2 * (xx) * SIZE(BO), %xmm7 ;\
237 movapd -6 * SIZE + 2 * (xx) * SIZE(BO), %xmm3 ;\
239 mulpd -2 * SIZE + 2 * (xx) * SIZE(BO), %xmm4 ;\
241 movapd -4 * SIZE + 2 * (xx) * SIZE(BO), %xmm5 ;\
248 movapd 8 * SIZE + 2 * (xx) * SIZE(BO), %xmm7 ;\
251 movapd 2 * SIZE + 2 * (xx) * SIZE(BO), %xmm3 ;\
253 mulpd -2 * SIZE + 2 * (xx) * SIZE(BO), %xmm6 ;\
255 movapd 4 * SIZE + 2 * (xx) * SIZE(BO), %xmm5 ;\
263 movapd 0 * SIZE + 2 * (xx) * SIZE(BO), %xmm1 ;\
266 movapd 2 * SIZE + 2 * (xx) * SIZE(BO), %xmm3 ;\
268 mulpd 6 * SIZE + 2 * (xx) * SIZE(BO), %xmm0 ;\
270 movapd 4 * SIZE + 2 * (xx) * SIZE(BO), %xmm5 ;\
277 movapd 16 * SIZE + 2 * (xx) * SIZE(BO), %xmm1 ;\
280 movapd 10 * SIZE + 2 * (xx) * SIZE(BO), %xmm3 ;\
282 mulpd 6 * SIZE + 2 * (xx) * SIZE(BO), %xmm2 ;\
284 movapd 12 * SIZE + 2 * (xx) * SIZE(BO), %xmm5 ;\
291 movapd 8 * SIZE + 2 * (xx) * SIZE(BO), %xmm7 ;\
294 movapd 10 * SIZE + 2 * (xx) * SIZE(BO), %xmm3 ;\
296 mulpd 14 * SIZE + 2 * (xx) * SIZE(BO), %xmm4 ;\
298 movapd 12 * SIZE + 2 * (xx) * SIZE(BO), %xmm5 ;\
305 movapd 24 * SIZE + 2 * (xx) * SIZE(BO), %xmm7 ;\
308 movapd 18 * SIZE + 2 * (xx) * SIZE(BO), %xmm3 ;\
310 mulpd 14 * SIZE + 2 * (xx) * SIZE(BO), %xmm6 ;\
312 movapd 20 * SIZE + 2 * (xx) * SIZE(BO), %xmm5 ;\
415 leaq 16 * SIZE + BUFFER, BO
426 movq %mm0, -16 * SIZE(BO)
427 movq %mm0, -15 * SIZE(BO)
429 movq %mm1, -14 * SIZE(BO)
430 movq %mm1, -13 * SIZE(BO)
433 movq %mm2, -12 * SIZE(BO)
434 movq %mm2, -11 * SIZE(BO)
436 movq %mm3, -10 * SIZE(BO)
437 movq %mm3, -9 * SIZE(BO)
439 PREFETCHW (WPREFETCHSIZE + 0) * SIZE(BO)
442 movq %mm4, -8 * SIZE(BO)
443 movq %mm4, -7 * SIZE(BO)
445 movq %mm5, -6 * SIZE(BO)
446 movq %mm5, -5 * SIZE(BO)
448 PREFETCHW (WPREFETCHSIZE + 8) * SIZE(BO)
451 movq %mm6, -4 * SIZE(BO)
452 movq %mm6, -3 * SIZE(BO)
454 movq %mm7, -2 * SIZE(BO)
455 movq %mm7, -1 * SIZE(BO)
460 movq %mm0, 0 * SIZE(BO)
461 movq %mm0, 1 * SIZE(BO)
463 movq %mm1, 2 * SIZE(BO)
464 movq %mm1, 3 * SIZE(BO)
467 movq %mm2, 4 * SIZE(BO)
468 movq %mm2, 5 * SIZE(BO)
470 movq %mm3, 6 * SIZE(BO)
471 movq %mm3, 7 * SIZE(BO)
473 PREFETCHW (WPREFETCHSIZE + 16) * SIZE(BO)
476 movq %mm4, 8 * SIZE(BO)
477 movq %mm4, 9 * SIZE(BO)
479 movq %mm5, 10 * SIZE(BO)
480 movq %mm5, 11 * SIZE(BO)
482 PREFETCHW (WPREFETCHSIZE + 24) * SIZE(BO)
485 movq %mm6, 12 * SIZE(BO)
486 movq %mm6, 13 * SIZE(BO)
488 movq %mm7, 14 * SIZE(BO)
489 movq %mm7, 15 * SIZE(BO)
491 addq $ 32 * SIZE, BO
506 movq %mm0, -16 * SIZE(BO)
507 movq %mm0, -15 * SIZE(BO)
509 movq %mm1, -14 * SIZE(BO)
510 movq %mm1, -13 * SIZE(BO)
513 movq %mm2, -12 * SIZE(BO)
514 movq %mm2, -11 * SIZE(BO)
516 movq %mm3, -10 * SIZE(BO)
517 movq %mm3, -9 * SIZE(BO)
520 addq $ 8 * SIZE, BO
541 leaq 16 * SIZE + BUFFER, BO
543 leaq 16 * SIZE + BUFFER, BO
547 leaq (BO, %rax, 8), BO
551 movapd -16 * SIZE(BO), %xmm1
555 movapd -14 * SIZE(BO), %xmm3
558 movapd -12 * SIZE(BO), %xmm5
561 movapd -8 * SIZE(BO), %xmm7
591 leaq (BO, %rax, 8), BO
791 addq $32 * SIZE, BO
810 addq $ 32 * SIZE, BO
832 leaq (BO, %rax, 8), BO
839 movapd -14 * SIZE(BO, %rax, 8), %xmm1
842 movapd -12 * SIZE(BO, %rax, 8), %xmm1
844 mulpd -10 * SIZE(BO, %rax, 8), %xmm0
846 movapd -16 * SIZE(BO, %rax, 8), %xmm1
851 movapd -14 * SIZE(BO, %rax, 8), %xmm1
854 movapd -12 * SIZE(BO, %rax, 8), %xmm1
856 mulpd -10 * SIZE(BO, %rax, 8), %xmm2
858 movapd -8 * SIZE(BO, %rax, 8), %xmm1
953 leaq (BO, %rax, 8), BO
974 leaq 16 * SIZE + BUFFER, BO
976 leaq 16 * SIZE + BUFFER, BO
980 leaq (BO, %rax, 8), BO
987 movapd -16 * SIZE(BO), %xmm1
989 movapd -8 * SIZE(BO), %xmm3
1014 movapd -14 * SIZE(BO), %xmm1
1018 movapd -12 * SIZE(BO), %xmm1
1020 mulpd -10 * SIZE(BO), %xmm0
1022 movapd 0 * SIZE(BO), %xmm1
1027 movapd -6 * SIZE(BO), %xmm3
1030 movapd -4 * SIZE(BO), %xmm3
1032 mulpd -2 * SIZE(BO), %xmm0
1034 movapd 8 * SIZE(BO), %xmm3
1039 movapd 2 * SIZE(BO), %xmm1
1043 movapd 4 * SIZE(BO), %xmm1
1045 mulpd 6 * SIZE(BO), %xmm0
1047 movapd 16 * SIZE(BO), %xmm1
1052 movapd 10 * SIZE(BO), %xmm3
1055 movapd 12 * SIZE(BO), %xmm3
1057 mulpd 14 * SIZE(BO), %xmm0
1059 movapd 24 * SIZE(BO), %xmm3
1064 movapd 18 * SIZE(BO), %xmm1
1067 movapd 20 * SIZE(BO), %xmm1
1069 mulpd 22 * SIZE(BO), %xmm2
1071 movapd 32 * SIZE(BO), %xmm1
1076 movapd 26 * SIZE(BO), %xmm3
1079 movapd 28 * SIZE(BO), %xmm3
1081 mulpd 30 * SIZE(BO), %xmm2
1083 movapd 40 * SIZE(BO), %xmm3
1088 movapd 34 * SIZE(BO), %xmm1
1091 movapd 36 * SIZE(BO), %xmm1
1093 mulpd 38 * SIZE(BO), %xmm2
1095 movapd 48 * SIZE(BO), %xmm1
1100 movapd 42 * SIZE(BO), %xmm3
1103 movapd 44 * SIZE(BO), %xmm3
1105 mulpd 46 * SIZE(BO), %xmm2
1107 movapd 56 * SIZE(BO), %xmm3
1112 addq $64 * SIZE, BO
1129 movapd -14 * SIZE(BO), %xmm1
1132 movapd -12 * SIZE(BO), %xmm1
1134 mulpd -10 * SIZE(BO), %xmm0
1136 movapd 0 * SIZE(BO), %xmm1
1141 movapd -6 * SIZE(BO), %xmm3
1144 movapd -4 * SIZE(BO), %xmm3
1146 mulpd -2 * SIZE(BO), %xmm0
1148 movapd 8 * SIZE(BO), %xmm3
1153 movapd 2 * SIZE(BO), %xmm1
1156 movapd 4 * SIZE(BO), %xmm1
1158 mulpd 6 * SIZE(BO), %xmm0
1160 movapd 16 * SIZE(BO), %xmm1
1165 movapd 10 * SIZE(BO), %xmm3
1168 movapd 12 * SIZE(BO), %xmm3
1170 mulpd 14 * SIZE(BO), %xmm0
1172 movapd 24 * SIZE(BO), %xmm3
1177 addq $32 * SIZE, BO
1197 movapd -14 * SIZE(BO), %xmm1
1200 movapd -12 * SIZE(BO), %xmm1
1202 mulpd -10 * SIZE(BO), %xmm0
1204 movapd -8 * SIZE(BO), %xmm1
1209 addq $8 * SIZE, BO
1271 leaq (BO, %rax, 8), BO
1299 leaq BUFFER, BO
1316 movlpd %xmm8, 0 * SIZE(BO)
1317 movlpd %xmm8, 1 * SIZE(BO)
1318 movlpd %xmm9, 2 * SIZE(BO)
1319 movlpd %xmm9, 3 * SIZE(BO)
1320 movlpd %xmm10, 4 * SIZE(BO)
1321 movlpd %xmm10, 5 * SIZE(BO)
1322 movlpd %xmm11, 6 * SIZE(BO)
1323 movlpd %xmm11, 7 * SIZE(BO)
1324 movlpd %xmm12, 8 * SIZE(BO)
1325 movlpd %xmm12, 9 * SIZE(BO)
1326 movlpd %xmm13, 10 * SIZE(BO)
1327 movlpd %xmm13, 11 * SIZE(BO)
1328 movlpd %xmm14, 12 * SIZE(BO)
1329 movlpd %xmm14, 13 * SIZE(BO)
1330 movlpd %xmm15, 14 * SIZE(BO)
1331 movlpd %xmm15, 15 * SIZE(BO)
1333 subq $-16 * SIZE, BO
1350 movlpd %xmm8, 0 * SIZE(BO)
1351 movlpd %xmm8, 1 * SIZE(BO)
1352 movlpd %xmm9, 2 * SIZE(BO)
1353 movlpd %xmm9, 3 * SIZE(BO)
1355 addq $4 * SIZE, BO
1375 leaq 16 * SIZE + BUFFER, BO
1377 leaq 16 * SIZE + BUFFER, BO
1381 leaq (BO, %rax, 4), BO
1386 movapd -16 * SIZE(BO), %xmm1
1390 movapd -8 * SIZE(BO), %xmm3
1415 mulpd -14 * SIZE(BO), %xmm0
1417 movapd -16 * SIZE(BO), %xmm1
1421 mulpd -14 * SIZE(BO), %xmm0
1423 movapd -12 * SIZE(BO), %xmm1
1427 mulpd -10 * SIZE(BO), %xmm0
1429 movapd -12 * SIZE(BO), %xmm1
1433 mulpd -10 * SIZE(BO), %xmm0
1435 movapd 0 * SIZE(BO), %xmm1
1440 mulpd -6 * SIZE(BO), %xmm2
1442 movapd -8 * SIZE(BO), %xmm3
1446 mulpd -6 * SIZE(BO), %xmm2
1448 movapd -4 * SIZE(BO), %xmm3
1452 mulpd -2 * SIZE(BO), %xmm2
1454 movapd -4 * SIZE(BO), %xmm3
1458 mulpd -2 * SIZE(BO), %xmm2
1460 movapd 8 * SIZE(BO), %xmm3
1465 subq $-16 * SIZE, BO
1485 mulpd -14 * SIZE(BO), %xmm0
1487 movapd -16 * SIZE(BO), %xmm1
1491 mulpd -14 * SIZE(BO), %xmm0
1493 movapd -12 * SIZE(BO), %xmm1
1498 addq $4 * SIZE, BO # boffset1 += 8
1559 leaq (BO, %rax, 4), BO
1579 leaq 16 * SIZE + BUFFER, BO
1581 leaq 16 * SIZE + BUFFER, BO
1585 leaq (BO, %rax, 4), BO
1589 movapd -16 * SIZE(BO), %xmm1
1591 movapd -8 * SIZE(BO), %xmm3
1620 mulpd -14 * SIZE(BO), %xmm0
1622 movapd -12 * SIZE(BO), %xmm1
1626 mulpd -10 * SIZE(BO), %xmm0
1628 movapd 0 * SIZE(BO), %xmm1
1632 mulpd -6 * SIZE(BO), %xmm0
1634 movapd -4 * SIZE(BO), %xmm3
1638 mulpd -2 * SIZE(BO), %xmm0
1640 movapd 8 * SIZE(BO), %xmm3
1645 mulpd 2 * SIZE(BO), %xmm2
1647 movapd 4 * SIZE(BO), %xmm1
1651 mulpd 6 * SIZE(BO), %xmm2
1653 movapd 16 * SIZE(BO), %xmm1
1657 mulpd 10 * SIZE(BO), %xmm2
1659 movapd 12 * SIZE(BO), %xmm3
1663 mulpd 14 * SIZE(BO), %xmm2
1665 movapd 24 * SIZE(BO), %xmm3
1670 subq $-32 * SIZE, BO
1687 mulpd -14 * SIZE(BO), %xmm0
1689 movapd -12 * SIZE(BO), %xmm1
1693 mulpd -10 * SIZE(BO), %xmm0
1695 movapd 0 * SIZE(BO), %xmm1
1699 mulpd -6 * SIZE(BO), %xmm0
1701 movapd -4 * SIZE(BO), %xmm3
1705 mulpd -2 * SIZE(BO), %xmm0
1711 subq $-16 * SIZE, BO
1731 mulpd -14 * SIZE(BO), %xmm0
1733 movapd -12 * SIZE(BO), %xmm1
1738 addq $4 * SIZE, BO # boffset1 += 8