1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
|
/* { dg-do compile { target i?86-*-* x86_64-*-* } } */
/* { dg-options "-msse4" } */
#include <nmmintrin.h>
/* Helper that takes a char pointer and returns a 128-bit integer vector.
   Only the prototype is visible here; what it reads through the pointer
   is not shown in this file section.  */
__m128i load (char *);
/* Exercise the SSE4.2 implicit-length string-compare intrinsics together
   with byte blends and an inline `bsfl`.

   s1, s2  byte strings; only their first bytes are tested directly here,
           the rest is consumed through load () and _mm_loadu_si128 ().
   bmsk    input operand of the `bsfl` instruction.
   frag2   vector used as the s2 fragment unless s2[1] is non-zero, in
           which case it is replaced by load (s2).

   Returns s1 when s2[0] is zero, NULL when s1[0] is zero, and otherwise
   s2 + len, where len is 0 unless the flag test below runs the `bsfl`.  */
char *
foo (const unsigned char *s1, const unsigned char *s2,
int bmsk, __m128i frag2)
{
/* len keeps this initial 0 when the final flag test fails.  */
int len = 0;
/* Non-const char views of the inputs, as load () and the return type need.  */
char *p1 = (char *) s1;
char *p2 = (char *) s2;
__m128i frag1, fruc, mask;
int cmp_c, cmp_s;
/* Early exits: first byte of s2 is zero, then first byte of s1 is zero.  */
if( !p2[0]) return (char *) s1;
if( !p1[0] ) return NULL;
/* Only overwrite the caller-supplied frag2 when s2 has a non-zero second byte.  */
if( p2[1]) frag2 = load (p2);
frag1 = load (p1);
/* Unaligned 16-byte load taken directly from s1.  */
fruc = _mm_loadu_si128 ((__m128i *) s1);
/* NOTE(review): 0x44 appears to be _SIDD_CMP_RANGES | _SIDD_UNIT_MASK on
   unsigned bytes per the <smmintrin.h> constants -- confirm.  */
mask = _mm_cmpistrm(fruc, frag2, 0x44);
/* mask serves as both the second source and the selector of each blend.  */
frag2 = _mm_blendv_epi8(frag2, mask, mask);
frag1 = _mm_blendv_epi8(frag1, mask, mask);
/* Same operands and immediate for both calls; they differ only in which
   result flag is returned.  NOTE(review): 0x0c appears to be
   _SIDD_CMP_EQUAL_ORDERED, with cmpistrc/cmpistrs yielding the carry and
   sign flags respectively -- confirm against the intrinsics reference.  */
cmp_c = _mm_cmpistrc(frag2, frag1, 0x0c);
cmp_s = _mm_cmpistrs(frag2, frag1, 0x0c);
/* Bitwise AND of the two flag values; the asm statement below is the
   (unbraced) body of this if.  */
if( cmp_s & cmp_c )
/* Bit-scan-forward of bmsk written into len.  NOTE(review): the result of
   bsf for a zero source is presumably undefined -- bmsk is not checked.  */
__asm("bsfl %[bmsk], %[len]" : [len] "=r" (len) : [bmsk] "r" (bmsk) );
return p2 + len;
}
|