Lines Matching refs:BO

55 #define BO	%rsi  macro
109 movaps -32 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm1 ;\
112 movaps -28 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm3 ;\
115 mulps -20 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm0 ;\
117 movaps -24 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm5 ;\
124 movaps 0 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm1 ;\
127 movaps -12 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm3 ;\
129 mulps -20 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm2 ;\
131 movaps -8 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm5 ;\
138 movaps -16 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm7 ;\
141 movaps -12 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm3 ;\
143 mulps -4 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm4 ;\
145 movaps -8 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm5 ;\
152 movaps 16 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm7 ;\
155 movaps 4 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm3 ;\
157 mulps -4 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm6 ;\
159 movaps 8 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm5 ;\
167 movaps 0 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm1 ;\
170 movaps 4 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm3 ;\
172 mulps 12 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm0 ;\
174 movaps 8 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm5 ;\
181 movaps 32 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm1 ;\
184 movaps 20 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm3 ;\
186 mulps 12 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm2 ;\
188 movaps 24 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm5 ;\
195 movaps 16 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm7 ;\
198 movaps 20 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm3 ;\
200 mulps 28 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm4 ;\
202 movaps 24 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm5 ;\
209 movaps 48 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm7 ;\
212 movaps 36 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm3 ;\
214 mulps 28 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm6 ;\
216 movaps 40 * SIZE + 2 * (xx) * SIZE(BO, %rax, 8), %xmm5 ;\
224 movaps -32 * SIZE + 2 * (xx) * SIZE(BO), %xmm1 ;\
227 movaps -28 * SIZE + 2 * (xx) * SIZE(BO), %xmm3 ;\
230 mulps -20 * SIZE + 2 * (xx) * SIZE(BO), %xmm0 ;\
232 movaps -24 * SIZE + 2 * (xx) * SIZE(BO), %xmm5 ;\
239 movaps 0 * SIZE + 2 * (xx) * SIZE(BO), %xmm1 ;\
242 movaps -12 * SIZE + 2 * (xx) * SIZE(BO), %xmm3 ;\
244 mulps -20 * SIZE + 2 * (xx) * SIZE(BO), %xmm2 ;\
246 movaps -8 * SIZE + 2 * (xx) * SIZE(BO), %xmm5 ;\
253 movaps -16 * SIZE + 2 * (xx) * SIZE(BO), %xmm7 ;\
256 movaps -12 * SIZE + 2 * (xx) * SIZE(BO), %xmm3 ;\
258 mulps -4 * SIZE + 2 * (xx) * SIZE(BO), %xmm4 ;\
260 movaps -8 * SIZE + 2 * (xx) * SIZE(BO), %xmm5 ;\
267 movaps 16 * SIZE + 2 * (xx) * SIZE(BO), %xmm7 ;\
270 movaps 4 * SIZE + 2 * (xx) * SIZE(BO), %xmm3 ;\
272 mulps -4 * SIZE + 2 * (xx) * SIZE(BO), %xmm6 ;\
274 movaps 8 * SIZE + 2 * (xx) * SIZE(BO), %xmm5 ;\
282 movaps 0 * SIZE + 2 * (xx) * SIZE(BO), %xmm1 ;\
285 movaps 4 * SIZE + 2 * (xx) * SIZE(BO), %xmm3 ;\
287 mulps 12 * SIZE + 2 * (xx) * SIZE(BO), %xmm0 ;\
289 movaps 8 * SIZE + 2 * (xx) * SIZE(BO), %xmm5 ;\
296 movaps 32 * SIZE + 2 * (xx) * SIZE(BO), %xmm1 ;\
299 movaps 20 * SIZE + 2 * (xx) * SIZE(BO), %xmm3 ;\
301 mulps 12 * SIZE + 2 * (xx) * SIZE(BO), %xmm2 ;\
303 movaps 24 * SIZE + 2 * (xx) * SIZE(BO), %xmm5 ;\
310 movaps 16 * SIZE + 2 * (xx) * SIZE(BO), %xmm7 ;\
313 movaps 20 * SIZE + 2 * (xx) * SIZE(BO), %xmm3 ;\
315 mulps 28 * SIZE + 2 * (xx) * SIZE(BO), %xmm4 ;\
317 movaps 24 * SIZE + 2 * (xx) * SIZE(BO), %xmm5 ;\
324 movaps 48 * SIZE + 2 * (xx) * SIZE(BO), %xmm7 ;\
327 movaps 36 * SIZE + 2 * (xx) * SIZE(BO), %xmm3 ;\
329 mulps 28 * SIZE + 2 * (xx) * SIZE(BO), %xmm6 ;\
331 movaps 40 * SIZE + 2 * (xx) * SIZE(BO), %xmm5 ;\
420 leaq BUFFER, BO
442 PREFETCHW (WPREFETCHSIZE + 0) * SIZE(BO)
445 movq %mm0, 0 * SIZE(BO)
446 movq %mm0, 2 * SIZE(BO)
449 movq %mm1, 4 * SIZE(BO)
450 movq %mm1, 6 * SIZE(BO)
452 movq %mm2, 8 * SIZE(BO)
453 movq %mm2, 10 * SIZE(BO)
455 movq %mm3, 12 * SIZE(BO)
456 movq %mm3, 14 * SIZE(BO)
458 PREFETCHW (WPREFETCHSIZE + 16) * SIZE(BO)
461 movq %mm4, 16 * SIZE(BO)
462 movq %mm4, 18 * SIZE(BO)
464 movq %mm5, 20 * SIZE(BO)
465 movq %mm5, 22 * SIZE(BO)
467 movq %mm6, 24 * SIZE(BO)
468 movq %mm6, 26 * SIZE(BO)
470 movq %mm7, 28 * SIZE(BO)
471 movq %mm7, 30 * SIZE(BO)
475 addq $32 * SIZE, BO
499 movq %mm0, 0 * SIZE(BO)
500 movq %mm0, 2 * SIZE(BO)
501 movq %mm1, 4 * SIZE(BO)
502 movq %mm1, 6 * SIZE(BO)
503 movq %mm2, 8 * SIZE(BO)
504 movq %mm2, 10 * SIZE(BO)
505 movq %mm3, 12 * SIZE(BO)
506 movq %mm3, 14 * SIZE(BO)
509 addq $16 * SIZE, BO
531 leaq 32 * SIZE + BUFFER, BO
533 leaq 32 * SIZE + BUFFER, BO
537 leaq (BO, %rax, 8), BO
541 movaps -32 * SIZE(BO), %xmm1
544 movaps -28 * SIZE(BO), %xmm3
547 movaps -24 * SIZE(BO), %xmm5
550 movaps -16 * SIZE(BO), %xmm7
583 leaq (BO, %rax, 8), BO
783 addq $64 * SIZE, BO
802 addq $ 64 * SIZE, BO
822 leaq (BO, %rax, 8), BO
829 movaps -28 * SIZE(BO, %rax, 8), %xmm1
832 movaps -24 * SIZE(BO, %rax, 8), %xmm1
834 mulps -20 * SIZE(BO, %rax, 8), %xmm0
836 movaps -32 * SIZE(BO, %rax, 8), %xmm1
841 movaps -28 * SIZE(BO, %rax, 8), %xmm1
844 movaps -24 * SIZE(BO, %rax, 8), %xmm1
846 mulps -20 * SIZE(BO, %rax, 8), %xmm2
848 movaps -16 * SIZE(BO, %rax, 8), %xmm1
929 leaq (BO, %rax, 8), BO
950 leaq BUFFER, BO
952 leaq BUFFER, BO
956 leaq (BO, %rax, 8), BO
962 movaps 0 * SIZE(BO), %xmm9
963 movaps 16 * SIZE(BO), %xmm11
964 movaps 32 * SIZE(BO), %xmm13
965 movaps 48 * SIZE(BO), %xmm15
997 movaps 4 * SIZE(BO), %xmm9
1000 movaps 8 * SIZE(BO), %xmm9
1002 mulps 12 * SIZE(BO), %xmm8
1004 movaps 64 * SIZE(BO), %xmm9
1010 movaps 20 * SIZE(BO), %xmm11
1013 movaps 24 * SIZE(BO), %xmm11
1015 mulps 28 * SIZE(BO), %xmm8
1017 movaps 80 * SIZE(BO), %xmm11
1023 movaps 36 * SIZE(BO), %xmm13
1026 movaps 40 * SIZE(BO), %xmm13
1028 mulps 44 * SIZE(BO), %xmm8
1030 movaps 96 * SIZE(BO), %xmm13
1036 movaps 52 * SIZE(BO), %xmm15
1039 movaps 56 * SIZE(BO), %xmm15
1041 mulps 60 * SIZE(BO), %xmm8
1043 movaps 112 * SIZE(BO), %xmm15
1052 movaps 68 * SIZE(BO), %xmm9
1055 movaps 72 * SIZE(BO), %xmm9
1057 mulps 76 * SIZE(BO), %xmm10
1059 movaps 128 * SIZE(BO), %xmm9
1065 movaps 84 * SIZE(BO), %xmm11
1068 movaps 88 * SIZE(BO), %xmm11
1070 mulps 92 * SIZE(BO), %xmm10
1072 movaps 144 * SIZE(BO), %xmm11
1078 movaps 100 * SIZE(BO), %xmm13
1081 movaps 104 * SIZE(BO), %xmm13
1083 mulps 108 * SIZE(BO), %xmm10
1085 movaps 160 * SIZE(BO), %xmm13
1091 movaps 116 * SIZE(BO), %xmm15
1094 movaps 120 * SIZE(BO), %xmm15
1096 mulps 124 * SIZE(BO), %xmm10
1098 movaps 176 * SIZE(BO), %xmm15
1103 addq $128 * SIZE, BO
1123 movaps 4 * SIZE(BO), %xmm9
1126 movaps 8 * SIZE(BO), %xmm9
1128 mulps 12 * SIZE(BO), %xmm8
1130 movaps 16 * SIZE(BO), %xmm9
1135 addq $16 * SIZE, BO # boffset1 += 8
1179 leaq (BO, %rax, 8), BO
1198 leaq BUFFER, BO
1200 leaq BUFFER, BO
1204 leaq (BO, %rax, 8), BO
1210 movaps 0 * SIZE(BO), %xmm9
1211 movaps 16 * SIZE(BO), %xmm11
1212 movaps 32 * SIZE(BO), %xmm13
1213 movaps 48 * SIZE(BO), %xmm15
1245 movaps 4 * SIZE(BO), %xmm9
1248 movaps 8 * SIZE(BO), %xmm9
1251 movaps 12 * SIZE(BO), %xmm9
1255 movaps 64 * SIZE(BO), %xmm9
1259 movaps 20 * SIZE(BO), %xmm11
1262 movaps 24 * SIZE(BO), %xmm11
1265 movaps 28 * SIZE(BO), %xmm11
1269 movaps 80 * SIZE(BO), %xmm11
1273 movaps 36 * SIZE(BO), %xmm13
1276 movaps 40 * SIZE(BO), %xmm13
1279 movaps 44 * SIZE(BO), %xmm13
1283 movaps 96 * SIZE(BO), %xmm13
1287 movaps 52 * SIZE(BO), %xmm15
1290 movaps 56 * SIZE(BO), %xmm15
1293 movaps 60 * SIZE(BO), %xmm15
1297 movaps 112 * SIZE(BO), %xmm15
1301 movaps 68 * SIZE(BO), %xmm9
1304 movaps 72 * SIZE(BO), %xmm9
1307 movaps 76 * SIZE(BO), %xmm9
1311 movaps 128 * SIZE(BO), %xmm9
1315 movaps 84 * SIZE(BO), %xmm11
1318 movaps 88 * SIZE(BO), %xmm11
1321 movaps 92 * SIZE(BO), %xmm11
1325 movaps 144 * SIZE(BO), %xmm11
1329 movaps 100 * SIZE(BO), %xmm13
1332 movaps 104 * SIZE(BO), %xmm13
1335 movaps 108 * SIZE(BO), %xmm13
1339 movaps 160 * SIZE(BO), %xmm13
1343 movaps 116 * SIZE(BO), %xmm15
1346 movaps 120 * SIZE(BO), %xmm15
1349 movaps 124 * SIZE(BO), %xmm15
1353 movaps 176 * SIZE(BO), %xmm15
1356 addq $128 * SIZE, BO
1376 movaps 4 * SIZE(BO), %xmm9
1379 movaps 8 * SIZE(BO), %xmm9
1382 movaps 12 * SIZE(BO), %xmm9
1386 movaps 16 * SIZE(BO), %xmm9
1389 addq $16 * SIZE, BO # boffset1 += 8
1435 leaq (BO, %rax, 8), BO
1454 leaq BUFFER, BO
1456 leaq BUFFER, BO
1460 leaq (BO, %rax, 8), BO
1461 leaq (BO, %rax, 8), BO
1467 movss 0 * SIZE(BO), %xmm9
1468 movss 16 * SIZE(BO), %xmm11
1469 movss 32 * SIZE(BO), %xmm13
1470 movss 48 * SIZE(BO), %xmm15
1502 movss 4 * SIZE(BO), %xmm9
1505 movss 8 * SIZE(BO), %xmm9
1508 movss 12 * SIZE(BO), %xmm9
1512 movss 64 * SIZE(BO), %xmm9
1516 movss 20 * SIZE(BO), %xmm11
1519 movss 24 * SIZE(BO), %xmm11
1522 movss 28 * SIZE(BO), %xmm11
1526 movss 80 * SIZE(BO), %xmm11
1530 movss 36 * SIZE(BO), %xmm13
1533 movss 40 * SIZE(BO), %xmm13
1536 movss 44 * SIZE(BO), %xmm13
1540 movss 96 * SIZE(BO), %xmm13
1544 movss 52 * SIZE(BO), %xmm15
1547 movss 56 * SIZE(BO), %xmm15
1550 movss 60 * SIZE(BO), %xmm15
1554 movss 112 * SIZE(BO), %xmm15
1558 movss 68 * SIZE(BO), %xmm9
1561 movss 72 * SIZE(BO), %xmm9
1564 movss 76 * SIZE(BO), %xmm9
1568 movss 128 * SIZE(BO), %xmm9
1572 movss 84 * SIZE(BO), %xmm11
1575 movss 88 * SIZE(BO), %xmm11
1578 movss 92 * SIZE(BO), %xmm11
1582 movss 144 * SIZE(BO), %xmm11
1586 movss 100 * SIZE(BO), %xmm13
1589 movss 104 * SIZE(BO), %xmm13
1592 movss 108 * SIZE(BO), %xmm13
1596 movss 160 * SIZE(BO), %xmm13
1600 movss 116 * SIZE(BO), %xmm15
1603 movss 120 * SIZE(BO), %xmm15
1606 movss 124 * SIZE(BO), %xmm15
1610 movss 176 * SIZE(BO), %xmm15
1613 addq $128 * SIZE, BO
1633 movss 4 * SIZE(BO), %xmm9
1636 movss 8 * SIZE(BO), %xmm9
1639 movss 12 * SIZE(BO), %xmm9
1643 movss 16 * SIZE(BO), %xmm9
1646 addq $16 * SIZE, BO # boffset1 += 8
1680 leaq (BO, %rax, 8), BO
1681 leaq (BO, %rax, 8), BO
1708 leaq BUFFER, BO
1737 movaps %xmm0, 0 * SIZE(BO)
1738 movaps %xmm1, 4 * SIZE(BO)
1739 movaps %xmm2, 8 * SIZE(BO)
1740 movaps %xmm3, 12 * SIZE(BO)
1741 movaps %xmm4, 16 * SIZE(BO)
1742 movaps %xmm5, 20 * SIZE(BO)
1743 movaps %xmm6, 24 * SIZE(BO)
1744 movaps %xmm7, 28 * SIZE(BO)
1747 addq $32 * SIZE, BO
1771 movq %mm0, 0 * SIZE(BO)
1772 movq %mm0, 2 * SIZE(BO)
1773 movq %mm1, 4 * SIZE(BO)
1774 movq %mm1, 6 * SIZE(BO)
1775 movq %mm2, 8 * SIZE(BO)
1776 movq %mm2, 10 * SIZE(BO)
1777 movq %mm3, 12 * SIZE(BO)
1778 movq %mm3, 14 * SIZE(BO)
1779 movq %mm4, 16 * SIZE(BO)
1780 movq %mm4, 18 * SIZE(BO)
1781 movq %mm5, 20 * SIZE(BO)
1782 movq %mm5, 22 * SIZE(BO)
1783 movq %mm6, 24 * SIZE(BO)
1784 movq %mm6, 26 * SIZE(BO)
1785 movq %mm7, 28 * SIZE(BO)
1786 movq %mm7, 30 * SIZE(BO)
1789 addq $32 * SIZE, BO
1811 movaps %xmm0, 0 * SIZE(BO)
1812 movaps %xmm1, 4 * SIZE(BO)
1822 movq %mm0, 0 * SIZE(BO)
1823 movq %mm0, 2 * SIZE(BO)
1824 movq %mm1, 4 * SIZE(BO)
1825 movq %mm1, 6 * SIZE(BO)
1829 addq $ 8 * SIZE, BO
1849 leaq BUFFER, BO
1851 leaq BUFFER, BO
1855 leaq (BO, %rax, 4), BO
1863 movaps 0 * SIZE(BO), %xmm9
1864 movaps 16 * SIZE(BO), %xmm11
1865 movaps 32 * SIZE(BO), %xmm13
1866 movaps 48 * SIZE(BO), %xmm15
1900 mulps 4 * SIZE(BO), %xmm8
1902 movaps 0 * SIZE(BO), %xmm9
1906 mulps 4 * SIZE(BO), %xmm8
1908 movaps 8 * SIZE(BO), %xmm9
1913 mulps 12 * SIZE(BO), %xmm8
1915 movaps 8 * SIZE(BO), %xmm9
1919 mulps 12 * SIZE(BO), %xmm8
1921 movaps 64 * SIZE(BO), %xmm9
1929 mulps 20 * SIZE(BO), %xmm10
1931 movaps 16 * SIZE(BO), %xmm11
1935 mulps 20 * SIZE(BO), %xmm10
1937 movaps 24 * SIZE(BO), %xmm11
1942 mulps 28 * SIZE(BO), %xmm10
1944 movaps 24 * SIZE(BO), %xmm11
1948 mulps 28 * SIZE(BO), %xmm10
1950 movaps 80 * SIZE(BO), %xmm11
1958 mulps 36 * SIZE(BO), %xmm12
1960 movaps 32 * SIZE(BO), %xmm13
1964 mulps 36 * SIZE(BO), %xmm12
1966 movaps 40 * SIZE(BO), %xmm13
1971 mulps 44 * SIZE(BO), %xmm12
1973 movaps 40 * SIZE(BO), %xmm13
1977 mulps 44 * SIZE(BO), %xmm12
1979 movaps 96 * SIZE(BO), %xmm13
1987 mulps 52 * SIZE(BO), %xmm14
1989 movaps 48 * SIZE(BO), %xmm15
1993 mulps 52 * SIZE(BO), %xmm14
1995 movaps 56 * SIZE(BO), %xmm15
2000 mulps 60 * SIZE(BO), %xmm14
2002 movaps 56 * SIZE(BO), %xmm15
2006 mulps 60 * SIZE(BO), %xmm14
2008 movaps 112 * SIZE(BO), %xmm15
2013 addq $64 * SIZE, BO
2032 mulps 4 * SIZE(BO), %xmm8
2034 movaps 0 * SIZE(BO), %xmm9
2038 mulps 4 * SIZE(BO), %xmm8
2040 movaps 8 * SIZE(BO), %xmm9
2045 addq $8 * SIZE, BO # boffset1 += 8
2091 leaq (BO, %rax, 4), BO
2113 leaq BUFFER, BO
2115 leaq BUFFER, BO
2119 leaq (BO, %rax, 4), BO
2125 movaps 0 * SIZE(BO), %xmm9
2126 movaps 16 * SIZE(BO), %xmm11
2127 movaps 32 * SIZE(BO), %xmm13
2128 movaps 48 * SIZE(BO), %xmm15
2160 mulps 4 * SIZE(BO), %xmm8
2162 movaps 8 * SIZE(BO), %xmm9
2167 mulps 12 * SIZE(BO), %xmm8
2169 movaps 64 * SIZE(BO), %xmm9
2174 mulps 20 * SIZE(BO), %xmm8
2176 movaps 24 * SIZE(BO), %xmm11
2181 mulps 28 * SIZE(BO), %xmm8
2183 movaps 80 * SIZE(BO), %xmm11
2188 mulps 36 * SIZE(BO), %xmm10
2190 movaps 40 * SIZE(BO), %xmm13
2195 mulps 44 * SIZE(BO), %xmm10
2197 movaps 96 * SIZE(BO), %xmm13
2202 mulps 52 * SIZE(BO), %xmm10
2204 movaps 56 * SIZE(BO), %xmm15
2209 mulps 60 * SIZE(BO), %xmm10
2211 movaps 112 * SIZE(BO), %xmm15
2216 addq $64 * SIZE, BO
2235 mulps 4 * SIZE(BO), %xmm8
2237 movaps 8 * SIZE(BO), %xmm9
2242 addq $8 * SIZE, BO # boffset1 += 8
2277 leaq (BO, %rax, 4), BO
2296 leaq BUFFER, BO
2298 leaq BUFFER, BO
2302 leaq (BO, %rax, 4), BO
2308 movaps 0 * SIZE(BO), %xmm9
2309 movaps 16 * SIZE(BO), %xmm11
2310 movaps 32 * SIZE(BO), %xmm13
2311 movaps 48 * SIZE(BO), %xmm15
2343 movaps 4 * SIZE(BO), %xmm9
2347 movaps 8 * SIZE(BO), %xmm9
2351 movaps 12 * SIZE(BO), %xmm9
2355 movaps 64 * SIZE(BO), %xmm9
2359 movaps 20 * SIZE(BO), %xmm11
2363 movaps 24 * SIZE(BO), %xmm11
2367 movaps 28 * SIZE(BO), %xmm11
2371 movaps 80 * SIZE(BO), %xmm11
2375 movaps 36 * SIZE(BO), %xmm13
2379 movaps 40 * SIZE(BO), %xmm13
2383 movaps 44 * SIZE(BO), %xmm13
2387 movaps 96 * SIZE(BO), %xmm13
2391 movaps 52 * SIZE(BO), %xmm15
2395 movaps 56 * SIZE(BO), %xmm15
2399 movaps 60 * SIZE(BO), %xmm15
2403 movaps 112 * SIZE(BO), %xmm15
2406 addq $64 * SIZE, BO
2426 movaps 4 * SIZE(BO), %xmm9
2430 movaps 8 * SIZE(BO), %xmm9
2433 addq $8 * SIZE, BO # boffset1 += 8
2470 leaq (BO, %rax, 4), BO
2489 leaq BUFFER, BO
2491 leaq BUFFER, BO
2495 leaq (BO, %rax, 8), BO
2501 movss 0 * SIZE(BO), %xmm9
2502 movss 16 * SIZE(BO), %xmm11
2503 movss 32 * SIZE(BO), %xmm13
2504 movss 48 * SIZE(BO), %xmm15
2536 movss 4 * SIZE(BO), %xmm9
2540 movss 8 * SIZE(BO), %xmm9
2544 movss 12 * SIZE(BO), %xmm9
2548 movss 64 * SIZE(BO), %xmm9
2552 movss 20 * SIZE(BO), %xmm11
2556 movss 24 * SIZE(BO), %xmm11
2560 movss 28 * SIZE(BO), %xmm11
2564 movss 80 * SIZE(BO), %xmm11
2568 movss 36 * SIZE(BO), %xmm13
2572 movss 40 * SIZE(BO), %xmm13
2576 movss 44 * SIZE(BO), %xmm13
2580 movss 96 * SIZE(BO), %xmm13
2584 movss 52 * SIZE(BO), %xmm15
2588 movss 56 * SIZE(BO), %xmm15
2592 movss 60 * SIZE(BO), %xmm15
2596 movss 112 * SIZE(BO), %xmm15
2599 addq $64 * SIZE, BO
2619 movss 4 * SIZE(BO), %xmm9
2623 movss 8 * SIZE(BO), %xmm9
2626 addq $8 * SIZE, BO # boffset1 += 8
2656 leaq (BO, %rax, 8), BO
2683 leaq BUFFER, BO
2713 movaps %xmm0, 0 * SIZE(BO)
2714 movaps %xmm1, 4 * SIZE(BO)
2715 movaps %xmm2, 8 * SIZE(BO)
2716 movaps %xmm3, 12 * SIZE(BO)
2717 movaps %xmm4, 16 * SIZE(BO)
2718 movaps %xmm5, 20 * SIZE(BO)
2719 movaps %xmm6, 24 * SIZE(BO)
2720 movaps %xmm7, 28 * SIZE(BO)
2723 addq $32 * SIZE, BO
2747 movq %mm0, 0 * SIZE(BO)
2748 movq %mm0, 2 * SIZE(BO)
2749 movq %mm1, 4 * SIZE(BO)
2750 movq %mm1, 6 * SIZE(BO)
2751 movq %mm2, 8 * SIZE(BO)
2752 movq %mm2, 10 * SIZE(BO)
2753 movq %mm3, 12 * SIZE(BO)
2754 movq %mm3, 14 * SIZE(BO)
2755 movq %mm4, 16 * SIZE(BO)
2756 movq %mm4, 18 * SIZE(BO)
2757 movq %mm5, 20 * SIZE(BO)
2758 movq %mm5, 22 * SIZE(BO)
2759 movq %mm6, 24 * SIZE(BO)
2760 movq %mm6, 26 * SIZE(BO)
2761 movq %mm7, 28 * SIZE(BO)
2762 movq %mm7, 30 * SIZE(BO)
2765 addq $32 * SIZE, BO
2783 movaps %xmm0, 0 * SIZE(BO)
2789 movq %mm0, 0 * SIZE(BO)
2790 movq %mm0, 2 * SIZE(BO)
2794 addq $ 4 * SIZE, BO
2813 leaq BUFFER, BO
2815 leaq BUFFER, BO
2819 leaq (BO, %rax, 2), BO
2827 movaps 0 * SIZE(BO), %xmm9
2828 movaps 16 * SIZE(BO), %xmm11
2829 movaps 32 * SIZE(BO), %xmm13
2830 movaps 48 * SIZE(BO), %xmm15
2868 movaps 4 * SIZE(BO), %xmm9
2875 movaps 8 * SIZE(BO), %xmm9
2885 movaps 12 * SIZE(BO), %xmm9
2892 movaps 32 * SIZE(BO), %xmm9
2902 movaps 20 * SIZE(BO), %xmm11
2909 movaps 24 * SIZE(BO), %xmm11
2919 movaps 28 * SIZE(BO), %xmm11
2926 movaps 48 * SIZE(BO), %xmm11
2929 addq $32 * SIZE, BO
2952 movaps 4 * SIZE(BO), %xmm9
2955 addq $4 * SIZE, BO # boffset1 += 8
2986 leaq (BO, %rax, 2), BO
3006 leaq BUFFER, BO
3008 leaq BUFFER, BO
3012 leaq (BO, %rax, 2), BO
3018 movaps 0 * SIZE(BO), %xmm9
3019 movaps 16 * SIZE(BO), %xmm11
3051 mulps 4 * SIZE(BO), %xmm8
3053 movaps 32 * SIZE(BO), %xmm9
3056 mulps 8 * SIZE(BO), %xmm8
3059 mulps 12 * SIZE(BO), %xmm8
3068 mulps 20 * SIZE(BO), %xmm10
3070 movaps 48 * SIZE(BO), %xmm11
3073 mulps 24 * SIZE(BO), %xmm10
3076 mulps 28 * SIZE(BO), %xmm10
3081 addq $32 * SIZE, BO
3102 movaps 4 * SIZE(BO), %xmm9
3105 addq $4 * SIZE, BO # boffset1 += 8
3134 leaq (BO, %rax, 2), BO
3152 leaq BUFFER, BO
3154 leaq BUFFER, BO
3158 leaq (BO, %rax, 2), BO
3164 movaps 0 * SIZE(BO), %xmm9
3165 movaps 16 * SIZE(BO), %xmm11
3198 movaps 4 * SIZE(BO), %xmm9
3202 movaps 8 * SIZE(BO), %xmm9
3207 movaps 12 * SIZE(BO), %xmm9
3212 movaps 32 * SIZE(BO), %xmm9
3217 movaps 20 * SIZE(BO), %xmm11
3222 movaps 24 * SIZE(BO), %xmm11
3227 movaps 28 * SIZE(BO), %xmm11
3232 movaps 48 * SIZE(BO), %xmm11
3235 addq $32 * SIZE, BO
3256 movaps 4 * SIZE(BO), %xmm9
3259 addq $4 * SIZE, BO # boffset1 += 8
3284 leaq (BO, %rax, 2), BO
3302 leaq BUFFER, BO
3304 leaq BUFFER, BO
3308 leaq (BO, %rax, 4), BO
3314 movss 0 * SIZE(BO), %xmm9
3315 movss 16 * SIZE(BO), %xmm11
3347 mulss 4 * SIZE(BO), %xmm8
3349 movss 32 * SIZE(BO), %xmm9
3352 mulss 8 * SIZE(BO), %xmm8
3355 mulss 12 * SIZE(BO), %xmm8
3360 mulss 20 * SIZE(BO), %xmm10
3362 movss 48 * SIZE(BO), %xmm11
3365 mulss 24 * SIZE(BO), %xmm10
3368 mulss 28 * SIZE(BO), %xmm10
3373 addq $32 * SIZE, BO
3394 movss 4 * SIZE(BO), %xmm9
3397 addq $4 * SIZE, BO