#include <stddef.h>
#include <stdio.h>
#include <xmmintrin.h>

void vclrx(float *fc, int k, int n, int f);
void vclrx_csal(float *C, int K, int N, int XFLAG);

/*
 * vclrx - store 0.0f into n floats, starting at fc and stepping k elements.
 *
 *   fc  first element to clear
 *   k   stride between cleared elements, in floats
 *   n   number of elements to clear; n <= 0 clears nothing
 *   f   flag forwarded unchanged to vclrx_csal(); not otherwise used here
 *
 * A stride of 1 takes the SSE path below. Any other stride prints a trace
 * line on stdout and delegates to the scalar routine vclrx_csal().
 */
void vclrx(float *fc, int k, int n, int f)
{
    if (k != 1) {
        printf("vclrx_csal\n");
        vclrx_csal(fc, k, n, f);
        return;
    }

    const __m128 zeros = _mm_setzero_ps();
    float *dst = fc;
    int remaining = n;

    /* Four floats per store; unaligned stores so fc needs no 16-byte alignment. */
    while (remaining >= 4) {
        _mm_storeu_ps(dst, zeros);
        dst += 4;
        remaining -= 4;
    }

    /* Scalar tail: the last n % 4 elements (or all of them when n < 4). */
    while (remaining > 0) {
        *dst++ = 0.0f;
        remaining--;
    }
}

/*
 * vclrx_csal - scalar strided clear: C[0], C[K], C[2*K], ... <- 0.0f.
 *
 *   C      first element to clear
 *   K      stride between cleared elements, in floats
 *   N      number of elements to clear; N <= 0 clears nothing
 *   XFLAG  ignored
 */
void vclrx_csal(float *C, int K, int N, int XFLAG)
{
    (void)XFLAG;

    /* Indexed addressing: never forms a pointer outside the touched range,
       and the offset is computed in ptrdiff_t rather than int. */
    for (int i = 0; i < N; i++) {
        C[(ptrdiff_t)i * K] = 0.0f;
    }
}