Lines Matching refs:xmm0
98 cvtss2sd ARG_X, %xmm0 /* DP x */
106 andpd MO1(DP_ABS_MASK),%xmm0 /* DP |x| */
120 subsd MO2(PIO4J,%edx,8), %xmm0/* t = |x| - j * Pi/4 */
125 movaps %xmm0, %xmm4 /* t */
127 mulsd %xmm0, %xmm0 /* y=t^2 */
129 unpcklpd %xmm0, %xmm0 /* y|y */
131 movaps %xmm0, %xmm1 /* y|y */
132 mulpd %xmm0, %xmm0 /* z=t^4|z=t^4 */
135 mulpd %xmm0, %xmm2 /* z*S4 */
137 mulpd %xmm0, %xmm3 /* z*S3 */
140 mulpd %xmm0, %xmm2 /* z*(S2+z*S4) */
143 mulpd %xmm0, %xmm3 /* z*(S1+z*S3) */
165 cvtpd2ps %xmm3, %xmm0 /* SP results */
167 movss %xmm0, (%eax) /* store sin(x) from xmm0[0] */
168 shufps $1, %xmm0, %xmm0 /* move cos(x) to xmm0[0] */
169 movss %xmm0, (%ecx) /* store cos(x) */
183 cvtpd2ps %xmm3, %xmm0 /* SP results */
185 movss %xmm0, (%ecx) /* store cos(x) from xmm0[0] */
186 shufps $1, %xmm0, %xmm0 /* move sin(x) to xmm0[0] */
187 movss %xmm0, (%eax) /* store sin(x) */
202 mulsd %xmm0, %xmm1 /* |x|/(Pi/4) */
213 addsd %xmm2, %xmm0 /* |x| - j*PIO4HI */
215 addsd %xmm4, %xmm0 /* t = |x| - j*PIO4HI - j*PIO4LO */
231 movapd %xmm0, %xmm3 /* |x| */
236 movapd %xmm0, %xmm5 /* |x| */
238 movapd %xmm0, %xmm1 /* |x| */
240 mulsd 0*8+MO2(_FPI,%eax,8), %xmm0/* tmp0 = FPI[j]*|x| */
273 addsd %xmm3, %xmm0 /* t += tmp0 */
275 addsd %xmm1, %xmm0 /* t += tmp1 */
276 mulsd MO1(DP_PIO4), %xmm0 /* t *= PIO4 */
287 movaps %xmm0, %xmm3 /* DP x */
289 mulsd %xmm0, %xmm0 /* DP y=x^2 */
290 unpcklpd %xmm0, %xmm0 /* DP y|y */
291 movaps %xmm0, %xmm1 /* y|y */
292 mulpd %xmm0, %xmm0 /* z=x^4|z=x^4 */
295 mulpd %xmm0, %xmm4 /* z*S4 */
297 mulpd %xmm0, %xmm5 /* z*S3 */
299 mulpd %xmm0, %xmm4 /* z*(S2+z*S4) */
301 mulpd %xmm0, %xmm5 /* z*(S1+z*S3) */
310 cvtpd2ps %xmm3, %xmm0 /* SP results */
311 movss %xmm0, (%eax) /* store sin(x) from xmm0[0] */
312 shufps $1, %xmm0, %xmm0 /* move cos(x) to xmm0[0] */
313 movss %xmm0, (%ecx) /* store cos(x) */
323 movaps %xmm0, %xmm1 /* DP x */
325 mulsd %xmm0, %xmm0 /* DP x^2 */
326 unpcklpd %xmm0, %xmm0 /* DP x^2|x^2 */
329 mulpd %xmm0, %xmm3 /* DP x^2*DP_SIN2_1 */
331 mulpd %xmm0, %xmm3 /* DP x^2*DP_SIN2_0+x^4*DP_SIN2_1 */
335 cvtpd2ps %xmm3, %xmm0 /* SP results */
337 movss %xmm0, (%eax) /* store sin(x) from xmm0[0] */
338 shufps $1, %xmm0, %xmm0 /* move cos(x) to xmm0[0] */
339 movss %xmm0, (%ecx) /* store cos(x) */
355 movaps %xmm0, %xmm3 /* DP x */
356 mulsd MO1(DP_SMALL), %xmm0 /* DP x*DP_SMALL */
357 subsd %xmm0, %xmm3 /* DP sin result is x-x*DP_SMALL */
359 cvtsd2ss %xmm3, %xmm0 /* sin(x) */
362 movss %xmm0, (%eax) /* sin(x) store */
370 movss MO1(SP_ONE), %xmm0 /* 1.0 */
374 movss %xmm0, (%ecx) /* cos(+-0)==1 */