120 lines
3.3 KiB
C
120 lines
3.3 KiB
C
/* { dg-do run } */
|
|
/* { dg-require-effective-target sse4 } */
|
|
/* { dg-options "-O2 -msse4.2" } */
|
|
|
|
#ifndef CHECK_H
|
|
#define CHECK_H "sse4_2-check.h"
|
|
#endif
|
|
|
|
#ifndef TEST
|
|
#define TEST sse4_2_test
|
|
#endif
|
|
|
|
#include CHECK_H
|
|
|
|
#include "sse4_2-pcmpstr.h"
|
|
|
|
#define NUM 1024
|
|
|
|
#define IMM_VAL0 \
|
|
(_SIDD_SBYTE_OPS | _SIDD_CMP_RANGES | _SIDD_MASKED_POSITIVE_POLARITY)
|
|
#define IMM_VAL1 \
|
|
(_SIDD_UBYTE_OPS | _SIDD_CMP_EQUAL_EACH | _SIDD_NEGATIVE_POLARITY \
|
|
| _SIDD_BIT_MASK)
|
|
#define IMM_VAL2 \
|
|
(_SIDD_UWORD_OPS | _SIDD_CMP_EQUAL_ANY | _SIDD_NEGATIVE_POLARITY)
|
|
#define IMM_VAL3 \
|
|
(_SIDD_SWORD_OPS | _SIDD_CMP_EQUAL_ORDERED \
|
|
| _SIDD_MASKED_NEGATIVE_POLARITY | _SIDD_UNIT_MASK)
|
|
|
|
static void
|
|
TEST (void)
|
|
{
|
|
union
|
|
{
|
|
__m128i x[NUM];
|
|
char c[NUM *16];
|
|
} src1, src2;
|
|
__m128i res, correct;
|
|
int correct_flags, l1, l2;
|
|
int flags, cf, zf, sf, of, af;
|
|
int i;
|
|
|
|
for (i = 0; i < NUM *16; i++)
|
|
{
|
|
src1.c[i] = rand ();
|
|
src2.c[i] = rand ();
|
|
}
|
|
|
|
for (i = 0; i < NUM; i++)
|
|
{
|
|
l1 = rand () % 18;
|
|
l2 = rand () % 18;
|
|
|
|
switch ((rand () % 4))
|
|
{
|
|
case 0:
|
|
res = _mm_cmpestrm (src1.x[i], l1, src2.x[i], l2, IMM_VAL0);
|
|
cf = _mm_cmpestrc (src1.x[i], l1, src2.x[i], l2, IMM_VAL0);
|
|
zf = _mm_cmpestrz (src1.x[i], l1, src2.x[i], l2, IMM_VAL0);
|
|
sf = _mm_cmpestrs (src1.x[i], l1, src2.x[i], l2, IMM_VAL0);
|
|
of = _mm_cmpestro (src1.x[i], l1, src2.x[i], l2, IMM_VAL0);
|
|
af = _mm_cmpestra (src1.x[i], l1, src2.x[i], l2, IMM_VAL0);
|
|
correct = cmp_em (&src1.x[i], l1, &src2.x[i], l2, IMM_VAL0,
|
|
&correct_flags);
|
|
break;
|
|
|
|
case 1:
|
|
res = _mm_cmpestrm (src1.x[i], l1, src2.x[i], l2, IMM_VAL1);
|
|
cf = _mm_cmpestrc (src1.x[i], l1, src2.x[i], l2, IMM_VAL1);
|
|
zf = _mm_cmpestrz (src1.x[i], l1, src2.x[i], l2, IMM_VAL1);
|
|
sf = _mm_cmpestrs (src1.x[i], l1, src2.x[i], l2, IMM_VAL1);
|
|
of = _mm_cmpestro (src1.x[i], l1, src2.x[i], l2, IMM_VAL1);
|
|
af = _mm_cmpestra (src1.x[i], l1, src2.x[i], l2, IMM_VAL1);
|
|
correct = cmp_em (&src1.x[i], l1, &src2.x[i], l2, IMM_VAL1,
|
|
&correct_flags);
|
|
break;
|
|
|
|
case 2:
|
|
res = _mm_cmpestrm (src1.x[i], l1, src2.x[i], l2, IMM_VAL2);
|
|
cf = _mm_cmpestrc (src1.x[i], l1, src2.x[i], l2, IMM_VAL2);
|
|
zf = _mm_cmpestrz (src1.x[i], l1, src2.x[i], l2, IMM_VAL2);
|
|
sf = _mm_cmpestrs (src1.x[i], l1, src2.x[i], l2, IMM_VAL2);
|
|
of = _mm_cmpestro (src1.x[i], l1, src2.x[i], l2, IMM_VAL2);
|
|
af = _mm_cmpestra (src1.x[i], l1, src2.x[i], l2, IMM_VAL2);
|
|
correct = cmp_em (&src1.x[i], l1, &src2.x[i], l2, IMM_VAL2,
|
|
&correct_flags);
|
|
break;
|
|
|
|
default:
|
|
res = _mm_cmpestrm (src1.x[i], l1, src2.x[i], l2, IMM_VAL3);
|
|
cf = _mm_cmpestrc (src1.x[i], l1, src2.x[i], l2, IMM_VAL3);
|
|
zf = _mm_cmpestrz (src1.x[i], l1, src2.x[i], l2, IMM_VAL3);
|
|
sf = _mm_cmpestrs (src1.x[i], l1, src2.x[i], l2, IMM_VAL3);
|
|
of = _mm_cmpestro (src1.x[i], l1, src2.x[i], l2, IMM_VAL3);
|
|
af = _mm_cmpestra (src1.x[i], l1, src2.x[i], l2, IMM_VAL3);
|
|
correct = cmp_em (&src1.x[i], l1, &src2.x[i], l2, IMM_VAL3,
|
|
&correct_flags);
|
|
break;
|
|
}
|
|
|
|
if (memcmp (&correct, &res, sizeof (res)))
|
|
abort ();
|
|
|
|
flags = 0;
|
|
if (cf)
|
|
flags |= CFLAG;
|
|
if (zf)
|
|
flags |= ZFLAG;
|
|
if (sf)
|
|
flags |= SFLAG;
|
|
if (of)
|
|
flags |= OFLAG;
|
|
|
|
if (flags != correct_flags
|
|
|| (af && (cf || zf))
|
|
|| (!af && !(cf || zf)))
|
|
abort ();
|
|
}
|
|
}
|