Lines Matching refs:D4

342 my ($H0,$H1,$H2,$H3,$H4, $T0,$T1,$T2,$T3,$T4, $D0,$D1,$D2,$D3,$D4, $MASK) =
803 vmovdqu `16*3`($ctx),$D4 # preload r0^2
834 vpshufd \$0xEE,$D4,$D3 # 34xx -> 3434
835 vpshufd \$0x44,$D4,$D0 # xx12 -> 1212
838 vpshufd \$0xEE,$D1,$D4
841 vmovdqa $D4,-0x80(%r11)
848 vpshufd \$0xEE,$D0,$D4
851 vmovdqa $D4,-0x60(%r11)
858 vpshufd \$0xEE,$D2,$D4
861 vmovdqa $D4,-0x40(%r11)
868 vpshufd \$0xEE,$D1,$D4
870 vmovdqa $D4,-0x20(%r11)
873 vmovdqa 0x00(%rsp),$D4 # preload r0^2
900 # and $D4 is preloaded with r0^2...
902 vpmuludq $T0,$D4,$D0 # d0 = h0*r0
903 vpmuludq $T1,$D4,$D1 # d1 = h1*r0
905 vpmuludq $T2,$D4,$D2 # d2 = h2*r0
907 vpmuludq $T3,$D4,$D3 # d3 = h3*r0
908 vpmuludq $T4,$D4,$D4 # d4 = h4*r0
915 vpaddq $H1,$D4,$D4 # d4 += h3*r1
928 vpaddq $H0,$D4,$D4 # d4 += h2*r2
943 vpaddq $H1,$D4,$D4 # d4 += h1*r3
965 vpaddq $T4,$D4,$D4 # d4 += h0*r4
1015 vpaddq $T4,$D4,$D4
1022 vpaddq $T0,$D4,$D4 # d4 += h3*r1
1031 vpaddq $T0,$D4,$D4 # d4 += h2*r2
1044 vpaddq $T1,$D4,$D4 # d4 += h1*r3
1067 vpaddq $H4,$D4,$H4 # h4 = d4 + h0*r4
1076 vmovdqa 0x00(%rsp),$D4 # preload r0^2
1127 vpshufd \$0x10,$D4,$D4 # r0^n, xx12 -> x1x2
1150 vpmuludq $T2,$D4,$D2 # d2 = h2*r0
1151 vpmuludq $T0,$D4,$D0 # d0 = h0*r0
1153 vpmuludq $T1,$D4,$D1 # d1 = h1*r0
1154 vpmuludq $T3,$D4,$D3 # d3 = h3*r0
1155 vpmuludq $T4,$D4,$D4 # d4 = h4*r0
1158 vpaddq $H0,$D4,$D4 # d4 += h3*r1
1172 vpaddq $H1,$D4,$D4 # d4 += h2*r2
1185 vpaddq $H0,$D4,$D4 # d4 += h1*r3
1198 vpaddq $H2,$D4,$D4 # d4 += h0*r4
1249 vpaddq $T4,$D4,$D4 # d4 += h4*r0
1252 vpaddq $T0,$D4,$D4 # d4 += h3*r1
1266 vpaddq $T1,$D4,$D4 # d4 += h2*r2
1279 vpaddq $T0,$D4,$D4 # d4 += h1*r3
1292 vpaddq $T2,$D4,$D4 # d4 += h0*r4
1306 vpsrldq \$8,$D4,$T4
1312 vpaddq $T4,$D4,$D4
1322 vpaddq $H3,$D4,$D4 # h3 -> h4
1328 vpsrlq \$26,$D4,$H4
1329 vpand $MASK,$D4,$D4
1349 vpaddq $H3,$D4,$D4 # h3 -> h4
1355 vmovd $D4,`4*4-48-64`($ctx)
1440 my ($H0,$H1,$H2,$H3,$H4, $MASK, $T4,$T0,$T1,$T2,$T3, $D0,$D1,$D2,$D3,$D4) =
1760 vmovdqu `16*7-64`($ctx),%x#$D4
1773 vpermd $D4,$T0,$D4
1777 vmovdqa $D4,0xe0-0x90(%rax)
1847 vpmuludq $H2,$T2,$D4 # d4 = h2*r2
1857 vpaddq $T4,$D4,$D4 # d4 += h3*r1
1869 vpaddq $H2,$D4,$D4 # d4 += h4*r0
1888 vpaddq $T4,$D4,$D4 # d4 += h1*r3
1906 vpaddq $H4,$D4,$H4 # h4 = d4 + h0*r4
1920 vpsrlq \$26,$H4,$D4
1929 vpaddq $D4,$H0,$H0
1930 vpsllq \$2,$D4,$D4
1931 vpaddq $D4,$H0,$H0 # h4 -> h0
1982 vpmuludq $H2,$T2,$D4 # d4 = h2*r2
1992 vpaddq $T4,$D4,$D4 # d4 += h3*r1
2003 vpaddq $H2,$D4,$D4 # d4 += h4*r0
2017 vpaddq $T4,$D4,$D4 # d4 += h1*r3
2031 vpaddq $H4,$D4,$H4 # h4 = d4 + h0*r4
2070 vpsrlq \$26,$H4,$D4
2077 vpaddq $D4,$H0,$H0
2078 vpsllq \$2,$D4,$D4
2079 vpaddq $D4,$H0,$H0 # h4 -> h0
2136 map(s/%y/%z/,($D0,$D1,$D2,$D3,$D4));
2184 vmovdqu `16*7-64`($ctx),%x#$D4 # ... ${R4}
2199 vpermd $D4,$T2,$R4
2221 vpmuludq $T0,$R4,$D4 # d4 = r0'*r4
2234 vpaddq $M4,$D4,$D4 # d4 += r1'*r3
2245 vpaddq $M4,$D4,$D4 # d4 += r2'*r2
2255 vpaddq $M4,$D4,$D4 # d4 += r3'*r1
2265 vpaddq $M4,$D4,$D4 # d4 += r4'*r0
2281 vpaddq $M3,$D4,$D4 # d3 -> d4
2287 vpsrlq \$26,$D4,$M4
2288 vpandq $MASK,$D4,$D4
2308 vpaddq $M3,$D4,$D4 # d3 -> d4
2312 # $D0-$D4, ...
2336 vpermd $D4,$M0,${R4}{%k1}
2398 vpmuludq $H2,$R2,$D4 # d4 = h2*r2
2417 vpaddq $M4,$D4,$D4 # d4 += h0*r4
2426 vpaddq $M4,$D4,$D4 # d4 += h1*r3
2438 vpaddq $M4,$D4,$D4 # d4 += h3*r1
2448 vpaddq $M4,$D4,$D4 # d4 += h4*r0
2468 vpaddq $H3,$D4,$H4 # h3 -> h4
2478 vpsrlq \$26,$H4,$D4
2485 vpaddq $D4,$H0,$H0
2486 vpsllq \$2,$D4,$D4
2487 vpaddq $D4,$H0,$H0 # h4 -> h0
2540 vpmuludq $H2,$R2,$D4 # d4 = h2*r2
2557 vpaddq $M4,$D4,$D4 # d4 += h0*r4
2567 vpaddq $M4,$D4,$D4 # d4 += h1*r3
2577 vpaddq $M4,$D4,$D4 # d4 += h3*r1
2588 vpaddq $M4,$D4,$D4 # d4 += h4*r0
2605 vpermq \$0xb1,$D4,$H4
2610 vpaddq $D4,$H4,$H4
2617 vpermq \$0x2,$H4,$D4
2622 vpaddq $D4,$H4,$H4
2628 vextracti64x4 \$0x1,$H4,%y#$D4
2633 vpaddq $D4,$H4,${H4}{%k3}{z} # it's passed to .Ltail_avx2
2639 map(s/%z/%y/,($H0,$H1,$H2,$H3,$H4, $D0,$D1,$D2,$D3,$D4, $MASK));
2657 vpsrlq \$26,$H4,$D4
2666 vpaddq $D4,$H0,$H0
2667 vpsllq \$2,$D4,$D4
2670 vpaddq $D4,$H0,$H0 # h4 -> h0