sse4_1-ptest-1.c
来自「用于进行gcc测试」· C语言 代码 · 共 110 行
C
110 行
/* { dg-do run } */
/* { dg-require-effective-target sse4 } */
/* { dg-options "-O2 -msse4.1" } */

#include "sse4_1-check.h"

#include <smmintrin.h>
/* Declares abort (); included explicitly so this file does not rely on
   sse4_1-check.h pulling it in.  */
#include <stdlib.h>

/* Sizes used by the test, named so the array bounds and loop limits
   stay in step with each other.  */
enum
{
  PTEST_VEC_BYTES = 16,  /* Byte lanes viewed in one __m128i.  */
  PTEST_VEC_WORDS = 4,   /* 32-bit lanes viewed in one __m128i.  */
  PTEST_NUM_VECS = 4,    /* Operand patterns exercised.  */
  /* One testz and one testc result per ordered operand pair.  */
  PTEST_NUM_RESULTS = 2 * PTEST_NUM_VECS * PTEST_NUM_VECS
};

/* Scalar reference for _mm_testz_si128 (M, V).

   Returns 1 when M & V has no bit set in any of the 16 bytes,
   and 0 as soon as one byte of the AND is non-zero.  */
static int
make_ptestz (__m128i m, __m128i v)
{
  /* View both vectors as bytes so the check uses plain integer
     operations.  */
  union
  {
    __m128i x;
    unsigned char c[PTEST_VEC_BYTES];
  } val, mask;
  int i;

  mask.x = m;
  val.x = v;

  for (i = 0; i < PTEST_VEC_BYTES; i++)
    {
      if (mask.c[i] & val.c[i])
        {
          return 0;
        }
    }
  return 1;
}

/* Scalar reference for _mm_testc_si128 (M, V).

   Returns 1 when every bit set in V is also set in M (V & ~M is zero
   in all 16 bytes), and 0 as soon as one byte violates that.  */
static int
make_ptestc (__m128i m, __m128i v)
{
  union
  {
    __m128i x;
    unsigned char c[PTEST_VEC_BYTES];
  } val, mask;
  int i;

  mask.x = m;
  val.x = v;

  for (i = 0; i < PTEST_VEC_BYTES; i++)
    {
      /* ~mask.c[i] is computed as int; the AND with the promoted byte
         val.c[i] keeps only the low eight bits.  */
      if (val.c[i] & ~mask.c[i])
        {
          return 0;
        }
    }
  return 1;
}

/* Test body: checks _mm_testz_si128 and _mm_testc_si128 against the
   scalar references above for every ordered pair of four operand
   patterns, and calls abort () on the first mismatch.

   NOTE(review): presumably invoked by the harness in sse4_1-check.h;
   confirm against that header.  */
static void
sse4_1_test (void)
{
  union
  {
    __m128i x;
    unsigned int i[PTEST_VEC_WORDS];
  } val[PTEST_NUM_VECS];
  int i, j, l;
  int res[PTEST_NUM_RESULTS];

  /* val[0] and val[1] populate complementary 32-bit lanes.  */
  val[0].i[0] = 0x11111111;
  val[0].i[1] = 0x00000000;
  val[0].i[2] = 0x00000000;
  val[0].i[3] = 0x11111111;

  val[1].i[0] = 0x00000000;
  val[1].i[1] = 0x11111111;
  val[1].i[2] = 0x11111111;
  val[1].i[3] = 0x00000000;

  /* val[2] is all zeros.  */
  val[2].i[0] = 0;
  val[2].i[1] = 0;
  val[2].i[2] = 0;
  val[2].i[3] = 0;

  /* val[3] is all ones.  */
  val[3].i[0] = 0xffffffff;
  val[3].i[1] = 0xffffffff;
  val[3].i[2] = 0xffffffff;
  val[3].i[3] = 0xffffffff;

  /* First pass: record the intrinsic results for every (j, i) pair.  */
  l = 0;
  for (i = 0; i < PTEST_NUM_VECS; i++)
    {
      for (j = 0; j < PTEST_NUM_VECS; j++)
        {
          res[l++] = _mm_testz_si128 (val[j].x, val[i].x);
          res[l++] = _mm_testc_si128 (val[j].x, val[i].x);
        }
    }

  /* Second pass: walk the pairs in the same order and compare each
     recorded result with the scalar reference.  */
  l = 0;
  for (i = 0; i < PTEST_NUM_VECS; i++)
    {
      for (j = 0; j < PTEST_NUM_VECS; j++)
        {
          if (res[l++] != make_ptestz (val[j].x, val[i].x))
            {
              abort ();
            }
          if (res[l++] != make_ptestc (val[j].x, val[i].x))
            {
              abort ();
            }
        }
    }

  /* res[2] and res[3] were stored for i = 0, j = 1, i.e. the operand
     pair (val[1], val[0]); re-evaluate the intrinsics for that pair and
     require the same answers.  */
  if (res[2] != _mm_testz_si128 (val[1].x, val[0].x))
    {
      abort ();
    }
  if (res[3] != _mm_testc_si128 (val[1].x, val[0].x))
    {
      abort ();
    }
}
⌨️ 快捷键说明
复制代码Ctrl + C
搜索代码Ctrl + F
全屏模式F11
增大字号Ctrl + =
减小字号Ctrl + -
显示快捷键?