Lines Matching full:h3
420 my ($H0,$H1,$H2,$H3,$H4, $T0,$T1,$T2,$T3,$T4, $D0,$D1,$D2,$D3,$D4, $MASK) =
716 vmovd $h1#d,$H3
818 vmovd $h1#d,$H3
848 vmovd 4*3($ctx),$H3
971 # d4 = h4*r0 + h3*r1 + h2*r2 + h1*r3 + h0*r4
972 # d3 = h3*r0 + h2*r1 + h1*r2 + h0*r3 + h4*5*r4
973 # d2 = h2*r0 + h1*r1 + h0*r2 + h4*5*r3 + h3*5*r4
974 # d1 = h1*r0 + h0*r1 + h4*5*r2 + h3*5*r3 + h2*5*r4
975 # d0 = h0*r0 + h4*5*r1 + h3*5*r2 + h2*5*r3 + h1*5*r4
985 vpmuludq $T3,$D4,$D3 # d3 = h3*r0
991 vpmuludq $T3,$H2,$H1 # h3*r1
993 vpaddq $H1,$D4,$D4 # d4 += h3*r1
994 vmovdqa $H3,0x30(%r11) #
998 vmovdqa 0x30(%rsp),$H3 # r2^2
1002 vpmuludq $T2,$H3,$H0 # h2*r2
1007 vpmuludq $T1,$H3,$H1 # h1*r2
1008 vpmuludq $T0,$H3,$H3 # h0*r2
1011 vpaddq $H3,$D2,$D2 # d2 += h0*r2
1013 vpmuludq $T3,$H4,$H4 # h3*s2
1015 vmovdqa 0x60(%rsp),$H3 # s3^2
1016 vpaddq $H4,$D0,$D0 # d0 += h3*s2
1023 vpmuludq $T4,$H3,$H0 # h4*s3
1024 vpmuludq $T3,$H3,$H1 # h3*s3
1027 vpaddq $H1,$D1,$D1 # d1 += h3*s3
1028 vpmuludq $T2,$H3,$H3 # h2*s3
1030 vpaddq $H3,$D0,$D0 # d0 += h2*s3
1034 vpmuludq $T3,$H4,$T3 # h3*s4
1037 vpaddq $T3,$D2,$D2 # d2 += h3*s4
1039 vpsrldq \$6,$H1,$H3 #
1048 vpunpcklqdq $H3,$H2,$H3 # 2:3
1054 vpsrlq \$4,$H3,$H2
1057 vpsrlq \$30,$H3,$H3
1059 vpand $MASK,$H3,$H3 # 3
1065 vpaddq 0x30(%r11),$H3,$H3
1076 # d4 = h4*r0 + h3*r1 + h2*r2 + h1*r3 + h0*r4
1077 # d3 = h3*r0 + h2*r1 + h1*r2 + h0*r3 + h4*5*r4
1078 # d2 = h2*r0 + h1*r1 + h0*r2 + h4*5*r3 + h3*5*r4
1079 # d1 = h1*r0 + h0*r1 + h4*5*r2 + h3*5*r3 + h2*5*r4
1080 # d0 = h0*r0 + h4*5*r1 + h3*5*r2 + h2*5*r3 + h1*5*r4
1088 vpmuludq $H3,$T4,$T1 # h3*r0
1097 vpmuludq $H3,$T2,$T0 # h3*r1
1100 vpaddq $T0,$D4,$D4 # d4 += h3*r1
1117 vpmuludq $H3,$T4,$T4 # h3*s2
1119 vpaddq $T4,$D0,$D0 # d0 += h3*s2
1128 vpmuludq $H3,$T3,$T2 # h3*s3
1130 vpaddq $T2,$D1,$D1 # d1 += h3*s3
1135 vpmuludq $H3,$T4,$H3 # h3*s4
1140 vpaddq $H3,$D2,$H2 # h2 = d2 + h3*s4
1141 vpaddq $H4,$D3,$H3 # h3 = d3 + h4*s4
1168 vpsrlq \$26,$H3,$D3
1169 vpand $MASK,$H3,$H3
1170 vpaddq $D3,$H4,$H4 # h3 -> h4
1189 vpaddq $D2,$H3,$H3 # h2 -> h3
1195 vpsrlq \$26,$H3,$D3
1196 vpand $MASK,$H3,$H3
1197 vpaddq $D3,$H4,$H4 # h3 -> h4
1212 vpaddq $H3,$T3,$T3
1219 vmovdqa $H3,0x30(%r11)
1222 # d4 = h4*r0 + h3*r1 + h2*r2 + h1*r3 + h0*r4
1223 # d3 = h3*r0 + h2*r1 + h1*r2 + h0*r3 + h4*5*r4
1224 # d2 = h2*r0 + h1*r1 + h0*r2 + h4*5*r3 + h3*5*r4
1225 # d1 = h1*r0 + h0*r1 + h4*5*r2 + h3*5*r3 + h2*5*r4
1226 # d0 = h0*r0 + h4*5*r1 + h3*5*r2 + h2*5*r3 + h1*5*r4
1232 vpmuludq $T3,$D4,$D3 # d3 = h3*r0
1235 vpmuludq $T3,$H2,$H0 # h3*r1
1236 vpaddq $H0,$D4,$D4 # d4 += h3*r1
1237 vpshufd \$0x10,`16*2-64`($ctx),$H3 # s1^n
1245 vpmuludq $T4,$H3,$H3 # h4*s1
1246 vpaddq $H3,$D0,$D0 # d0 += h4*s1
1253 vpshufd \$0x10,`16*5-64`($ctx),$H3 # r3^n
1259 vpmuludq $T3,$H2,$H2 # h3*s2
1260 vpaddq $H2,$D0,$D0 # d0 += h3*s2
1262 vpmuludq $T1,$H3,$H0 # h1*r3
1264 vpmuludq $T0,$H3,$H3 # h0*r3
1265 vpaddq $H3,$D3,$D3 # d3 += h0*r3
1269 vpshufd \$0x10,`16*8-64`($ctx),$H3 # s4^n
1270 vpmuludq $T3,$H4,$H0 # h3*s3
1271 vpaddq $H0,$D1,$D1 # d1 += h3*s3
1277 vpmuludq $T4,$H3,$H1 # h4*s4
1278 vpaddq $H1,$D3,$D3 # h3 = d3 + h4*s4
1279 vpmuludq $T3,$H3,$H0 # h3*s4
1280 vpaddq $H0,$D2,$D2 # h2 = d2 + h3*s4
1281 vpmuludq $T2,$H3,$H1 # h2*s4
1283 vpmuludq $T1,$H3,$H3 # h1*s4
1284 vpaddq $H3,$D0,$D0 # h0 = d0 + h1*s4
1292 vpsrldq \$6,$H1,$H3
1295 vpunpcklqdq $H3,$H2,$H3 # 2:3
1300 vpsrlq \$4,$H3,$H2
1302 vpsrlq \$30,$H3,$H3
1304 vpand $MASK,$H3,$H3 # 3
1311 vpaddq 0x30(%r11),$H3,$H3
1324 vpmuludq $H3,$T4,$T1 # h3*r0
1325 vpaddq $T1,$D3,$D3 # d3 += h3*r0
1329 vpmuludq $H3,$T2,$T0 # h3*r1
1330 vpaddq $T0,$D4,$D4 # d4 += h3*r1
1353 vpmuludq $H3,$T2,$T2 # h3*s2
1354 vpaddq $T2,$D0,$D0 # d0 += h3*s2
1364 vpmuludq $H3,$T4,$T0 # h3*s3
1365 vpaddq $T0,$D1,$D1 # d1 += h3*s3
1373 vpmuludq $H3,$T3,$T0 # h3*s4
1374 vpaddq $T0,$D2,$D2 # d2 += h3*s4
1398 vpsrlq \$26,$D3,$H3
1400 vpaddq $H3,$D4,$D4 # h3 -> h4
1419 vpaddq $H2,$D3,$D3 # h2 -> h3
1425 vpsrlq \$26,$D3,$H3
1427 vpaddq $H3,$D4,$D4 # h3 -> h4
1517 my ($H0,$H1,$H2,$H3,$H4, $MASK, $T4,$T0,$T1,$T2,$T3, $D0,$D1,$D2,$D3,$D4) =
1644 vmovd $h1#d,%x#$H3
1751 vmovd $h1#d,%x#$H3
1792 vmovd 4*3($ctx),%x#$H3
1909 vpaddq $H3,$T3,$H3
1915 # d4 = h4*r0 + h3*r1 + h2*r2 + h1*r3 + h0*r4
1916 # d3 = h3*r0 + h2*r1 + h1*r2 + h0*r3 + h4*5*r4
1917 # d2 = h2*r0 + h1*r1 + h0*r2 + h4*5*r3 + h3*5*r4
1918 # d1 = h1*r0 + h0*r1 + h4*5*r2 + h3*5*r3 + h2*5*r4
1919 # d0 = h0*r0 + h4*5*r1 + h3*5*r2 + h2*5*r3 + h1*5*r4
1924 # d4 = h2*r2 + h4*r0 + h3*r1 + h1*r3 + h0*r4
1925 # d3 = h2*r1 + h3*r0 + h1*r2 + h0*r3 + h4*5*r4
1926 # d2 = h2*r0 + h1*r1 + h0*r2 + h4*5*r3 + h3*5*r4
1927 # d1 = h2*5*r4 + h1*r0 + h0*r1 + h4*5*r2 + h3*5*r3
1928 # d0 = h2*5*r3 + h0*r0 + h4*5*r1 + h3*5*r2 + h1*5*r4
1940 vpmuludq $H3,$T1,$T4 # h3*r1
1942 vpaddq $T4,$D4,$D4 # d4 += h3*r1
1950 vpmuludq $H3,$T0,$T4 # h3*r0
1953 vpaddq $T4,$D3,$D3 # d3 += h3*r0
1957 vpmuludq $H3,$T1,$T4 # h3*s2
1960 vpaddq $T4,$D0,$D0 # d0 += h3*s2
1975 vpmuludq $H3,$T3,$T4 # h3*s3
1978 vpaddq $T4,$D1,$D1 # d1 += h3*s3
1982 vpmuludq $H3,$S4,$H3 # h3*s4
1985 vpaddq $H3,$D2,$H2 # h2 = d2 + h3*s4
1986 vpaddq $H4,$D3,$H3 # h3 = d3 + h4*s4
1997 vpsrlq \$26,$H3,$D3
1998 vpand $MASK,$H3,$H3
1999 vpaddq $D3,$H4,$H4 # h3 -> h4
2023 vpaddq $D2,$H3,$H3 # h2 -> h3
2034 vpsrlq \$26,$H3,$D3
2035 vpand $MASK,$H3,$H3
2036 vpaddq $D3,$H4,$H4 # h3 -> h4
2059 vpaddq $H3,$T3,$H3
2075 vpmuludq $H3,$T1,$T4 # h3*r1
2077 vpaddq $T4,$D4,$D4 # d4 += h3*r1
2085 vpmuludq $H3,$T0,$T4 # h3*r0
2087 vpaddq $T4,$D3,$D3 # d3 += h3*r0
2090 vpmuludq $H3,$T1,$T4 # h3*s2
2092 vpaddq $T4,$D0,$D0 # d0 += h3*s2
2104 vpmuludq $H3,$T3,$T4 # h3*s3
2106 vpaddq $T4,$D1,$D1 # d1 += h3*s3
2109 vpmuludq $H3,$S4,$H3 # h3*s4
2111 vpaddq $H3,$D2,$H2 # h2 = d2 + h3*s4
2112 vpaddq $H4,$D3,$H3 # h3 = d3 + h4*s4
2124 vpsrldq \$8,$H3,$T3
2129 vpaddq $T3,$H3,$H3
2133 vpermq \$0x2,$H3,$T3
2138 vpaddq $T3,$H3,$H3
2147 vpsrlq \$26,$H3,$D3
2148 vpand $MASK,$H3,$H3
2149 vpaddq $D3,$H4,$H4 # h3 -> h4
2168 vpaddq $D2,$H3,$H3 # h2 -> h3
2174 vpsrlq \$26,$H3,$D3
2175 vpand $MASK,$H3,$H3
2176 vpaddq $D3,$H4,$H4 # h3 -> h4
2181 vmovd %x#$H3,`4*3-48-64`($ctx)
2214 map(s/%y/%z/,($H0,$H1,$H2,$H3,$H4));
2455 # d4 = h4*r0 + h3*r1 + h2*r2 + h1*r3 + h0*r4
2456 # d3 = h3*r0 + h2*r1 + h1*r2 + h0*r3 + h4*5*r4
2457 # d2 = h2*r0 + h1*r1 + h0*r2 + h4*5*r3 + h3*5*r4
2458 # d1 = h1*r0 + h0*r1 + h4*5*r2 + h3*5*r3 + h2*5*r4
2459 # d0 = h0*r0 + h4*5*r1 + h3*5*r2 + h2*5*r3 + h1*5*r4
2464 # d3 = h2*r1 + h0*r3 + h1*r2 + h3*r0 + h4*5*r4
2465 # d4 = h2*r2 + h0*r4 + h1*r3 + h3*r1 + h4*r0
2466 # d0 = h2*5*r3 + h0*r0 + h1*5*r4 + h3*5*r2 + h4*5*r1
2467 # d1 = h2*5*r4 + h0*r1 + h1*r0 + h3*5*r3 + h4*5*r2
2468 # d2 = h2*r0 + h0*r2 + h1*r1 + h3*5*r4 + h4*5*r3
2480 vpaddq $H3,$T3,$H3
2507 vpmuludq $H3,$R0,$M3
2508 vpmuludq $H3,$R1,$M4
2511 vpaddq $M3,$D3,$D3 # d3 += h3*r0
2512 vpaddq $M4,$D4,$D4 # d4 += h3*r1
2518 vpmuludq $H3,$S2,$M0
2519 vpmuludq $H3,$S3,$M1
2521 vpmuludq $H3,$S4,$M2
2523 vpaddq $M0,$D0,$D0 # d0 += h3*s2
2524 vpaddq $M1,$D1,$D1 # d1 += h3*s3
2525 vpaddq $M2,$D2,$D2 # d2 += h3*s4
2540 vpsrlq \$26,$D3,$H3
2542 vpaddq $H3,$D4,$H4 # h3 -> h4
2568 vpaddq $D2,$D3,$H3 # h2 -> h3
2578 vpsrlq \$26,$H3,$D3
2579 vpandq $MASK,$H3,$H3
2580 vpaddq $D3,$H4,$H4 # h3 -> h4
2622 vpaddq $H3,$T3,$H3
2646 vpmuludq $H3,$R0,$M3
2647 vpmuludq $H3,$R1,$M4
2650 vpaddq $M3,$D3,$D3 # d3 += h3*r0
2651 vpaddq $M4,$D4,$D4 # d4 += h3*r1
2658 vpmuludq $H3,$S2,$M0
2659 vpmuludq $H3,$S3,$M1
2660 vpmuludq $H3,$S4,$M2
2661 vpaddq $M3,$D3,$H3 # h3 = d3 + h4*s4
2663 vpaddq $M0,$D0,$D0 # d0 += h3*s2
2664 vpaddq $M1,$D1,$D1 # d1 += h3*s3
2665 vpaddq $M2,$D2,$D2 # d2 += h3*s4
2678 vpermq \$0xb1,$H3,$D3
2683 vpaddq $D3,$H3,$H3
2690 vpermq \$0x2,$H3,$D3
2695 vpaddq $D3,$H3,$H3
2701 vextracti64x4 \$0x1,$H3,%y#$D3
2706 vpaddq $D3,$H3,${H3}{%k3}{z} # keep single qword in case
2713 map(s/%z/%y/,($H0,$H1,$H2,$H3,$H4, $D0,$D1,$D2,$D3,$D4, $MASK));
2718 vpsrlq \$26,$H3,$D3
2719 vpand $MASK,$H3,$H3
2723 vpaddq $D3,$H4,$H4 # h3 -> h4
2750 vpaddq $D2,$H3,$H3 # h2 -> h3
2758 vpsrlq \$26,$H3,$D3
2759 vpand $MASK,$H3,$H3
2762 vpaddq $D3,$H4,$H4 # h3 -> h4
2772 vmovd %x#$H3,`4*3-48-64`($ctx)