Lines Matching full:t4

420 my ($H0,$H1,$H2,$H3,$H4, $T0,$T1,$T2,$T3,$T4, $D0,$D1,$D2,$D3,$D4, $MASK) =
893 vpunpckhqdq $T1,$T0,$T4 # 4
897 vpsrlq \$40,$T4,$T4 # 4
905 vpor 32(%rcx),$T4,$T4 # padbit, yes, always
986 vpmuludq $T4,$D4,$D4 # d4 = h4*r0
989 vpmuludq 0x20(%rsp),$T4,$H0 # h4*s1
1012 vpmuludq $T4,$H4,$H0 # h4*s2
1023 vpmuludq $T4,$H3,$H0 # h4*s3
1035 vpmuludq $T4,$H4,$T4 # h4*s4
1038 vpaddq $T4,$D3,$D3 # d3 += h4*s4
1040 vpmuludq 0x70(%rsp),$T0,$T4 # h0*r4
1043 vpaddq $T4,$D4,$D4 # d4 += h0*r4
1044 vmovdqa -0x90(%r11),$T4 # r0^4
1082 vpmuludq $H0,$T4,$T0 # h0*r0
1083 vpmuludq $H1,$T4,$T1 # h1*r0
1087 vpmuludq $H2,$T4,$T0 # h2*r0
1088 vpmuludq $H3,$T4,$T1 # h3*r0
1091 vpmuludq $H4,$T4,$T4 # h4*r0
1093 vpaddq $T4,$D4,$D4
1106 vmovdqa -0x50(%r11),$T4 # s2^4
1113 vpmuludq $H4,$T4,$T0 # h4*s2
1117 vpmuludq $H3,$T4,$T4 # h3*s2
1119 vpaddq $T4,$D0,$D0 # d0 += h3*s2
1121 vmovdqa -0x10(%r11),$T4 # s4^4
1134 vpmuludq $H2,$T4,$H2 # h2*s4
1135 vpmuludq $H3,$T4,$H3 # h3*s4
1138 vpmuludq $H4,$T4,$H4 # h4*s4
1143 vpmuludq $H1,$T4,$H0
1144 vpunpckhqdq $T1,$T0,$T4 # 4
1151 #vpsrlq \$40,$T4,$T4 # 4
1152 vpsrldq \$`40/8`,$T4,$T4 # 4
1158 vpand 0(%rcx),$T4,$T4 # .Lmask24
1162 vpor 32(%rcx),$T4,$T4 # padbit, yes, always
1213 vpaddq $H4,$T4,$T4
1233 vpmuludq $T4,$D4,$D4 # d4 = h4*r0
1245 vpmuludq $T4,$H3,$H3 # h4*s1
1256 vpmuludq $T4,$H2,$H1 # h4*s2
1267 vpmuludq $T4,$H4,$H1 # h4*s3
1277 vpmuludq $T4,$H3,$H1 # h4*s4
1307 vpshufd \$0x32,`16*0-64`($ctx),$T4 # r0^n, 34xx -> x3x4
1317 vpmuludq $H0,$T4,$T0 # h0*r0
1319 vpmuludq $H1,$T4,$T1 # h1*r0
1321 vpmuludq $H2,$T4,$T0 # h2*r0
1324 vpmuludq $H3,$T4,$T1 # h3*r0
1326 vpmuludq $H4,$T4,$T4 # h4*r0
1327 vpaddq $T4,$D4,$D4 # d4 += h4*r0
1334 vpshufd \$0x32,`16*3-64`($ctx),$T4 # r2
1343 vpmuludq $H2,$T4,$T1 # h2*r2
1345 vpmuludq $H1,$T4,$T0 # h1*r2
1348 vpmuludq $H0,$T4,$T4 # h0*r2
1349 vpaddq $T4,$D2,$D2 # d2 += h0*r2
1352 vpshufd \$0x32,`16*6-64`($ctx),$T4 # s3
1361 vpmuludq $H4,$T4,$T1 # h4*s3
1364 vpmuludq $H3,$T4,$T0 # h3*s3
1366 vpmuludq $H2,$T4,$T4 # h2*s3
1367 vpaddq $T4,$D0,$D0 # d0 += h2*s3
1384 vpsrldq \$8,$D4,$T4
1390 vpaddq $T4,$D4,$D4
1517 my ($H0,$H1,$H2,$H3,$H4, $MASK, $T4,$T0,$T1,$T2,$T3, $D0,$D1,$D2,$D3,$D4) =
1838 vmovdqu `16*2-64`($ctx),%x#$T4
1848 vpermd $T4,$T0,$T4
1853 vmovdqa $T4,0x40-0x90(%rax)
1876 vpunpckhqdq $T1,$T0,$T4 # 4
1883 vpsrlq \$40,$T4,$T4 # 4
1888 vpor 32(%rcx),$T4,$T4 # padbit, yes, always
1911 vpaddq $H4,$T4,$H4
1936 vpmuludq $H0,$T1,$T4 # h0*r1
1938 vpaddq $T4,$D1,$D1 # d1 += h0*r1
1940 vpmuludq $H3,$T1,$T4 # h3*r1
1942 vpaddq $T4,$D4,$D4 # d4 += h3*r1
1946 vpmuludq $H0,$T0,$T4 # h0*r0
1948 vpaddq $T4,$D0,$D0 # d0 += h0*r0
1950 vpmuludq $H3,$T0,$T4 # h3*r0
1953 vpaddq $T4,$D3,$D3 # d3 += h3*r0
1957 vpmuludq $H3,$T1,$T4 # h3*s2
1960 vpaddq $T4,$D0,$D0 # d0 += h3*s2
1963 vpmuludq $H1,$T2,$T4 # h1*r2
1965 vpaddq $T4,$D3,$D3 # d3 += h1*r2
1970 vpmuludq $H1,$H2,$T4 # h1*r3
1973 vpaddq $T4,$D4,$D4 # d4 += h1*r3
1975 vpmuludq $H3,$T3,$T4 # h3*s3
1978 vpaddq $T4,$D1,$D1 # d1 += h3*s3
1980 vpunpckhqdq $T1,$T0,$T4 # 4
2032 vpsrlq \$40,$T4,$T4 # 4
2041 vpor 32(%rcx),$T4,$T4 # padbit, yes, always
2061 vpaddq $H4,$T4,$H4
2071 vpmuludq $H0,$T1,$T4 # h0*r1
2073 vpaddq $T4,$D1,$D1 # d1 += h0*r1
2075 vpmuludq $H3,$T1,$T4 # h3*r1
2077 vpaddq $T4,$D4,$D4 # d4 += h3*r1
2080 vpmuludq $H0,$T0,$T4 # h0*r0
2082 vpaddq $T4,$D0,$D0 # d0 += h0*r0
2085 vpmuludq $H3,$T0,$T4 # h3*r0
2087 vpaddq $T4,$D3,$D3 # d3 += h3*r0
2090 vpmuludq $H3,$T1,$T4 # h3*s2
2092 vpaddq $T4,$D0,$D0 # d0 += h3*s2
2095 vpmuludq $H1,$T2,$T4 # h1*r2
2097 vpaddq $T4,$D3,$D3 # d3 += h1*r2
2100 vpmuludq $H1,$H2,$T4 # h1*r3
2102 vpaddq $T4,$D4,$D4 # d4 += h1*r3
2104 vpmuludq $H3,$T3,$T4 # h3*s3
2106 vpaddq $T4,$D1,$D1 # d1 += h3*s3
2125 vpsrldq \$8,$H4,$T4
2130 vpaddq $T4,$H4,$H4
2134 vpermq \$0x2,$H4,$T4
2139 vpaddq $T4,$H4,$H4
2212 map(s/%y/%z/,($T4,$T0,$T1,$T2,$T3)); # switch to %zmm domain
2259 vmovdqu `16*8-64`($ctx),%x#$T4 # ... ${S4}
2275 vpermd $T4,$T2,$S4
2315 vpsrlq \$32,$R4,$T4
2333 vpmuludq $T4,$S4,$M3
2334 vpmuludq $T4,$R0,$M4
2335 vpmuludq $T4,$S1,$M0
2336 vpmuludq $T4,$S2,$M1
2337 vpmuludq $T4,$S3,$M2
2347 vmovdqu64 16*4($inp),%z#$T4
2388 vpunpcklqdq $T4,$T3,$T0 # transpose input
2389 vpunpckhqdq $T4,$T3,$T4
2424 vpsllq \$12,$T4,$T3
2427 vpsrlq \$14,$T4,$T3
2428 vpsrlq \$40,$T4,$T4 # 4
2433 #vporq $PADBIT,$T4,$T4 # padbit, yes, always
2477 vporq $PADBIT,$T4,$T4 # padbit, yes, always
2481 vpaddq $H4,$T4,$H4
2484 vmovdqu64 16*4($inp),$T4
2504 vpunpcklqdq $T4,$T3,$T0 # transpose input
2505 vpunpckhqdq $T4,$T3,$T4
2538 vpsllq \$12,$T4,$T3
2570 vpsrlq \$14,$T4,$T3
2576 vpsrlq \$40,$T4,$T4 # 4
2585 #vporq $PADBIT,$T4,$T4 # padbit, yes, always
2620 vporq $PADBIT,$T4,$T4 # padbit, yes, always
2623 vpaddq $H4,$T4,$H4
2712 map(s/%z/%y/,($T0,$T1,$T2,$T3,$T4, $PADBIT));
2722 vpunpckhqdq $T1,$T0,$T4 # 4
2743 vpsrlq \$40,$T4,$T4 # 4
2761 vpor 32(%rcx),$T4,$T4 # padbit, yes, always