sse-11.c

来自「用于进行gcc测试」· C语言 代码 · 共 75 行

C
75
字号
/* PR rtl-optimization/21239 */
/* { dg-do run } */
/* { dg-options "-O2 -msse2" } */

/* Run-time regression test: scalar values are moved through SSE vector
   registers (load/store of the low double, and build-then-extract of a
   single float lane) and the copied data is checked afterwards.

   NOTE(review): the loop and statement shapes below are kept exactly as
   in the original test; restructuring them could change what the
   optimizer sees and defeat the purpose of the regression test.  */

#include "sse2-check.h"

#include <emmintrin.h>

/* Copy X doubles from Z to Y, one element per iteration, by loading each
   element with _mm_load_sd and writing it back with _mm_store_sd.  */
void
foo (unsigned int x, double *y, const double *z)
{
  __m128d tmp;
  while (x)
    {
      tmp = _mm_load_sd (z);
      _mm_store_sd (y, tmp);
      --x; ++z; ++y;
    }
}

/* Copy 4 * X floats from Z to Y in four consecutive passes of X elements
   each.  Pass K (K = 0..3) builds a vector whose lane K holds *Z and whose
   other lanes are zero, then extracts lane K again into *Y.  Y and Z are
   not reset between passes, so each pass continues where the previous one
   stopped.  */
void
bar (unsigned int x, float *y, const float *z)
{
  __m128 tmp;
  unsigned int i;

  /* Pass 0: value travels through lane 0.  */
  for (i = 0; i < x; ++i)
    {
      tmp = (__m128) { *z, 0, 0, 0 };
      *y = __builtin_ia32_vec_ext_v4sf (tmp, 0);
      ++z; ++y;
    }

  /* Pass 1: value travels through lane 1.  */
  for (i = 0; i < x; ++i)
    {
      tmp = (__m128) { 0, *z, 0, 0 };
      *y = __builtin_ia32_vec_ext_v4sf (tmp, 1);
      ++z; ++y;
    }

  /* Pass 2: value travels through lane 2.  */
  for (i = 0; i < x; ++i)
    {
      tmp = (__m128) { 0, 0, *z, 0 };
      *y = __builtin_ia32_vec_ext_v4sf (tmp, 2);
      ++z; ++y;
    }

  /* Pass 3: value travels through lane 3.  */
  for (i = 0; i < x; ++i)
    {
      tmp = (__m128) { 0, 0, 0, *z };
      *y = __builtin_ia32_vec_ext_v4sf (tmp, 3);
      ++z; ++y;
    }
}

/* Test body.  Fills four 16-element arrays with distinct constants, copies
   B into A with foo and D into C with bar (4 passes of 4 elements), then
   aborts if any destination element does not hold the source constant.

   NOTE(review): this function is static and has no caller in this file;
   presumably the driver in "sse2-check.h" invokes it -- confirm against
   that header, which is also presumed to declare abort.  */
static void
sse2_test (void)
{
  unsigned int i;
  double a[16], b[16];
  float c[16], d[16];

  for (i = 0; i < 16; ++i)
    {
      a[i] = 1;
      b[i] = 2;
      c[i] = 3;
      d[i] = 4;
    }

  foo (16, a, b);
  bar (4, c, d);

  for (i = 0; i < 16; ++i)
    {
      if (a[i] != 2)
        abort ();
      if (c[i] != 4)
        abort ();
    }
}

⌨️ 快捷键说明

复制代码Ctrl + C
搜索代码Ctrl + F
全屏模式F11
增大字号Ctrl + =
减小字号Ctrl + -
显示快捷键?