sse4_1-pinsrb.c

来自「用于进行gcc测试」· C语言 代码 · 共 103 行

C
103
字号
/* { dg-do run } *//* { dg-require-effective-target sse4 } *//* { dg-options "-O2 -msse4.1" } */#include "sse4_1-check.h"#include <smmintrin.h>#include <string.h>#define msk0 0x00#define msk1 0x01#define msk2 0x02#define msk3 0x03#define msk4 0x04#define msk5 0x05#define msk6 0x06#define msk7 0x07#define msk8 0x08#define msk9 0x09#define mskA 0x0A#define mskB 0x0B#define mskC 0x0C#define mskD 0x0D#define mskE 0x0E#define mskF 0x0Fstatic voidsse4_1_test (void){  union    {      __m128i x;      unsigned int i[4];      unsigned char c[16];    } res [16], val, tmp;  int masks[16];  unsigned char ins[4] = { 3, 4, 5, 6 };  int i;  val.i[0] = 0x35251505;  val.i[1] = 0x75655545;  val.i[2] = 0xB5A59585;  val.i[3] = 0xF5E5D5C5;  /* Check pinsrb imm8, r32, xmm.  */  res[0].x = _mm_insert_epi8 (val.x, ins[0], msk0);  res[1].x = _mm_insert_epi8 (val.x, ins[0], msk1);  res[2].x = _mm_insert_epi8 (val.x, ins[0], msk2);  res[3].x = _mm_insert_epi8 (val.x, ins[0], msk3);  res[4].x = _mm_insert_epi8 (val.x, ins[0], msk4);  res[5].x = _mm_insert_epi8 (val.x, ins[0], msk5);  res[6].x = _mm_insert_epi8 (val.x, ins[0], msk6);  res[7].x = _mm_insert_epi8 (val.x, ins[0], msk7);  res[8].x = _mm_insert_epi8 (val.x, ins[0], msk8);  res[9].x = _mm_insert_epi8 (val.x, ins[0], msk9);  res[10].x = _mm_insert_epi8 (val.x, ins[0], mskA);  res[11].x = _mm_insert_epi8 (val.x, ins[0], mskB);  res[12].x = _mm_insert_epi8 (val.x, ins[0], mskC);  res[13].x = _mm_insert_epi8 (val.x, ins[0], mskD);  res[14].x = _mm_insert_epi8 (val.x, ins[0], mskE);  res[15].x = _mm_insert_epi8 (val.x, ins[0], mskF);  masks[0] = msk0;  masks[1] = msk1;  masks[2] = msk2;  masks[3] = msk3;  masks[4] = msk4;  masks[5] = msk5;  masks[6] = msk6;  masks[7] = msk7;  masks[8] = msk8;  masks[9] = msk9;  masks[10] = mskA;  masks[11] = mskB;  masks[12] = mskC;  masks[13] = mskD;  masks[14] = mskE;  masks[15] = mskF;  for (i = 0; i < 16; i++)    {      tmp.x = val.x;      tmp.c[masks[i]] = ins[0];      if (memcmp (&tmp, &res[i], sizeof (tmp)))	abort ();    }      /* Check pinsrb imm8, m8, xmm.  */  for (i = 0; i < 16; i++)    {      res[i].x = _mm_insert_epi8 (val.x, ins[i % 4], msk0);      masks[i] = msk0;    }  for (i = 0; i < 16; i++)    {      tmp.x = val.x;      tmp.c[masks[i]] = ins[i % 4];      if (memcmp (&tmp, &res[i], sizeof (tmp)))	abort ();    }}

⌨️ 快捷键说明

复制代码Ctrl + C
搜索代码Ctrl + F
全屏模式F11
增大字号Ctrl + =
减小字号Ctrl + -
显示快捷键?