Lines Matching full:t3
419 my ($H0,$H1,$H2,$H3,$H4, $T0,$T1,$T2,$T3,$T4, $D0,$D1,$D2,$D3,$D4, $MASK) =
891 vpsrldq \$6,$T1,$T3
894 vpunpcklqdq $T3,$T2,$T3 # 2:3
899 vpsrlq \$4,$T3,$T2
901 vpsrlq \$30,$T3,$T3
903 vpand $MASK,$T3,$T3 # 3
984 vpmuludq $T3,$D4,$D3 # d3 = h3*r0
990 vpmuludq $T3,$H2,$H1 # h3*r1
1012 vpmuludq $T3,$H4,$H4 # h3*s2
1023 vpmuludq $T3,$H3,$H1 # h3*s3
1033 vpmuludq $T3,$H4,$T3 # h3*s4
1036 vpaddq $T3,$D2,$D2 # d2 += h3*s4
1098 vmovdqa -0x60(%r11),$T3 # r2^4
1106 vpmuludq $H2,$T3,$T0 # h2*r2
1107 vpmuludq $H1,$T3,$T1 # h1*r2
1111 vpmuludq $H0,$T3,$T3 # h0*r2
1113 vpaddq $T3,$D2,$D2 # d2 += h0*r2
1115 vmovdqa -0x30(%r11),$T3 # s3^4
1123 vpmuludq $H4,$T3,$T0 # h4*s3
1127 vpmuludq $H3,$T3,$T2 # h3*s3
1128 vpmuludq $H2,$T3,$T3 # h2*s3
1131 vpaddq $T3,$D0,$D0 # d0 += h2*s3
1138 vpsrldq \$6,$T1,$T3 #
1148 vpunpcklqdq $T3,$T2,$T3 # 2:3
1155 vpsrlq \$4,$T3,$T2
1158 vpsrlq \$30,$T3,$T3
1160 vpand $MASK,$T3,$T3 # 3
1211 vpaddq $H3,$T3,$T3
1231 vpmuludq $T3,$D4,$D3 # d3 = h3*r0
1234 vpmuludq $T3,$H2,$H0 # h3*r1
1258 vpmuludq $T3,$H2,$H2 # h3*s2
1269 vpmuludq $T3,$H4,$H0 # h3*s3
1278 vpmuludq $T3,$H3,$H0 # h3*s4
1330 vpshufd \$0x32,`16*2-64`($ctx),$T3 # s1
1338 vpmuludq $H4,$T3,$T3 # h4*s1
1339 vpaddq $T3,$D0,$D0 # d0 += h4*s1
1346 vpshufd \$0x32,`16*5-64`($ctx),$T3 # r3
1355 vpmuludq $H1,$T3,$T0 # h1*r3
1357 vpmuludq $H0,$T3,$T3 # h0*r3
1358 vpaddq $T3,$D3,$D3 # d3 += h0*r3
1362 vpshufd \$0x32,`16*8-64`($ctx),$T3 # s4
1370 vpmuludq $H4,$T3,$T1 # h4*s4
1372 vpmuludq $H3,$T3,$T0 # h3*s4
1374 vpmuludq $H2,$T3,$T1 # h2*s4
1376 vpmuludq $H1,$T3,$T3 # h1*s4
1377 vpaddq $T3,$D0,$D0 # d0 += h1*s4
1384 vpsrldq \$8,$D3,$T3
1388 vpaddq $T3,$D3,$D3
1516 my ($H0,$H1,$H2,$H3,$H4, $MASK, $T4,$T0,$T1,$T2,$T3, $D0,$D1,$D2,$D3,$D4) =
1836 vmovdqu `16*1-64`($ctx),%x#$T3
1845 vpermd $T3,$T0,$T3
1850 vmovdqa $T3,0x20-0x90(%rax)
1874 vpsrldq \$6,$T1,$T3
1876 vpunpcklqdq $T3,$T2,$T2 # 2:3
1879 vpsrlq \$30,$T2,$T3
1886 vpand $MASK,$T3,$T3 # 3
1908 vpaddq $H3,$T3,$H3
1911 vmovdqa `32*6-0x90`(%rax),$T3 # s3^4
1932 vpmuludq $H2,$T3,$D0 # d0 = h2*s3
1974 vpmuludq $H3,$T3,$T4 # h3*s3
1975 vpmuludq $H4,$T3,$H2 # h4*s3
1976 vpsrldq \$6,$T1,$T3
1986 vpunpcklqdq $T3,$T2,$T3 # 2:3
2007 vpsrlq \$4,$T3,$T2
2025 vpsrlq \$30,$T3,$T3
2039 vpand $MASK,$T3,$T3 # 3
2058 vpaddq $H3,$T3,$H3
2061 vmovdqu `32*6+4-0x90`(%rax),$T3 # s3^4
2067 vpmuludq $H2,$T3,$D0 # d0 = h2*s3
2103 vpmuludq $H3,$T3,$T4 # h3*s3
2104 vpmuludq $H4,$T3,$H2 # h4*s3
2123 vpsrldq \$8,$H3,$T3
2128 vpaddq $T3,$H3,$H3
2132 vpermq \$0x2,$H3,$T3
2137 vpaddq $T3,$H3,$H3
2211 map(s/%y/%z/,($T4,$T0,$T1,$T2,$T3)); # switch to %zmm domain
2256 vmovdqu `16*6-64`($ctx),%x#$T3 # ... ${S3}
2271 vpermd $T3,$T2,$S3
2302 vpsrlq \$32,$R3,$T3
2321 vpmuludq $T3,$S2,$M0
2322 vpmuludq $T3,$R0,$M3
2323 vpmuludq $T3,$R1,$M4
2324 vpmuludq $T3,$S3,$M1
2325 vpmuludq $T3,$S4,$M2
2345 vmovdqu64 16*0($inp),%z#$T3
2387 vpunpcklqdq $T4,$T3,$T0 # transpose input
2388 vpunpckhqdq $T4,$T3,$T4
2423 vpsllq \$12,$T4,$T3
2424 vporq $T3,$T2,$T2
2426 vpsrlq \$14,$T4,$T3
2431 #vpandq $MASK,$T3,$T3 # 3
2474 vpandq $MASK,$T3,$T3 # 3
2479 vpaddq $H3,$T3,$H3
2482 vmovdqu64 16*0($inp),$T3 # load input
2503 vpunpcklqdq $T4,$T3,$T0 # transpose input
2504 vpunpckhqdq $T4,$T3,$T4
2537 vpsllq \$12,$T4,$T3
2543 vporq $T3,$T2,$T2
2569 vpsrlq \$14,$T4,$T3
2583 #vpandq $MASK,$T3,$T3 # 3
2617 vpandq $MASK,$T3,$T3 # 3
2621 vpaddq $H3,$T3,$H3
2711 map(s/%z/%y/,($T0,$T1,$T2,$T3,$T4, $PADBIT));
2720 vpsrldq \$6,$T1,$T3
2726 vpunpcklqdq $T3,$T2,$T2 # 2:3
2735 vpsrlq \$30,$T2,$T3
2759 vpand $MASK,$T3,$T3 # 3
3024 my ($T0,$T1,$T2,$T3,$mask44,$mask42,$tmp,$PAD) = map("%ymm$_",(24..31));
3069 vmovdqu64 16*2($inp),$T3
3072 vpunpcklqdq $T3,$T2,$T1 # transpose data
3073 vpunpckhqdq $T3,$T2,$T3
3077 vpsrlq \$24,$T3,$T2 # splat the data
3082 vpsllq \$20,$T3,$T3
3083 vporq $T3,$T1,$T1
3239 vpxorq $T3,$T3,$T3
3242 vpunpcklqdq $T3,$T2,$T1 # transpose data
3243 vpunpckhqdq $T3,$T2,$T3
3247 vpsrlq \$24,$T3,$T2 # splat the data
3252 vpsllq \$20,$T3,$T3
3253 vporq $T3,$T1,$T1
3279 vmovdqu64 16*2($inp),$T3
3288 vpunpcklqdq $T3,$T2,$T1 # transpose data
3289 vpunpckhqdq $T3,$T2,$T3
3304 vpsrlq \$24,$T3,$T2
3315 vpsllq \$20,$T3,$T3
3328 vporq $T3,$T1,$T1
3465 my ($T0,$T1,$T2,$T3,$mask44,$mask42,$tmp,$PAD) = map("%ymm$_",(24..31));
3577 map(s/%y/%z/, $T0,$T1,$T2,$T3,$mask44,$mask42,$tmp,$PAD);
3586 vmovdqu64 16*4($inp),$T3
3606 vpunpcklqdq $T3,$T2,$T1 # transpose data
3607 vpunpckhqdq $T3,$T2,$T3
3611 vpsrlq \$24,$T3,$T2 # splat the data
3616 vpsllq \$20,$T3,$T3
3617 vporq $T3,$T1,$T1
3644 vmovdqu64 16*4($inp),$T3
3653 vpunpcklqdq $T3,$T2,$T1 # transpose data
3654 vpunpckhqdq $T3,$T2,$T3
3669 vpsrlq \$24,$T3,$T2
3680 vpsllq \$20,$T3,$T3
3693 vporq $T3,$T1,$T1
3777 map(s/%z/%y/, $T0,$T1,$T2,$T3,$mask44,$mask42,$tmp,$PAD);