// RUN: %clang_cc1 -emit-llvm %s -o - | FileCheck %s
typedef __attribute__(( ext_vector_type(4) )) float float4;
typedef __attribute__(( ext_vector_type(2) )) float float2;
typedef __attribute__(( ext_vector_type(4) )) int int4;
typedef __attribute__(( ext_vector_type(4) )) unsigned int uint4;
// CHECK: @foo = global <4 x float> <float 1.000000e+00, float 2.000000e+00, float 3.000000e+00, float 4.000000e+00>
float4 foo = (float4){ 1.0, 2.0, 3.0, 4.0 };
// CHECK: @bar = constant <4 x float> <float 1.000000e+00, float 2.000000e+00, float 3.000000e+00, float 0x7FF0000000000000>
const float4 bar = (float4){ 1.0, 2.0, 3.0, __builtin_inff() };
// CHECK: @test1
// CHECK: fadd <4 x float>
float4 test1(float4 V) {
return V.wzyx+V;
}
float2 vec2, vec2_2;
float4 vec4, vec4_2;
float f;
// CHECK: @test2
// CHECK: shufflevector {{.*}} <i32 0, i32 1>
// CHECK: extractelement
// CHECK: shufflevector {{.*}} <i32 1, i32 1, i32 1, i32 1>
// CHECK: insertelement
// CHECK: shufflevector {{.*}} <i32 1, i32 0>
void test2() {
vec2 = vec4.xy; // shorten
f = vec2.x; // extract elt
vec4 = vec4.yyyy; // splat
vec2.x = f; // insert one.
vec2.yx = vec2; // reverse
}
// CHECK: @test3
// CHECK: store <4 x float> <float 1.000000e+00, float 2.000000e+00, float 3.000000e+00, float 4.000000e+00>
void test3(float4 *out) {
*out = ((float4) {1.0f, 2.0f, 3.0f, 4.0f });
}
// CHECK: @test4
// CHECK: store <4 x float>
// CHECK: store <4 x float>
void test4(float4 *out) {
float a = 1.0f;
float b = 2.0f;
float c = 3.0f;
float d = 4.0f;
*out = ((float4) {a,b,c,d});
}
// CHECK: @test5
// CHECK: shufflevector {{.*}} <4 x i32> zeroinitializer
// CHECK: fmul <4 x float>
// CHECK: fmul <4 x float>
// CHECK: shufflevector {{.*}} <4 x i32> zeroinitializer
// CHECK: fmul <4 x float>
void test5(float4 *out) {
float a;
float4 b;
a = 1.0f;
b = a;
b = b * 5.0f;
b = 5.0f * b;
b *= a;
*out = b;
}
// CHECK: @test6
void test6(float4 *ap, float4 *bp, float c) {
float4 a = *ap;
float4 b = *bp;
// CHECK: fadd <4 x float>
// CHECK: fsub <4 x float>
// CHECK: fmul <4 x float>
// CHECK: fdiv <4 x float>
a = a + b;
a = a - b;
a = a * b;
a = a / b;
// CHECK: fadd <4 x float>
// CHECK: fsub <4 x float>
// CHECK: fmul <4 x float>
// CHECK: fdiv <4 x float>
a = a + c;
a = a - c;
a = a * c;
a = a / c;
// CHECK: fadd <4 x float>
// CHECK: fsub <4 x float>
// CHECK: fmul <4 x float>
// CHECK: fdiv <4 x float>
a += b;
a -= b;
a *= b;
a /= b;
// CHECK: fadd <4 x float>
// CHECK: fsub <4 x float>
// CHECK: fmul <4 x float>
// CHECK: fdiv <4 x float>
a += c;
a -= c;
a *= c;
a /= c;
// Vector comparisons can sometimes crash the x86 backend: rdar://6326239,
// reject them until the implementation is stable.
#if 0
int4 cmp;
cmp = a < b;
cmp = a <= b;
cmp = a < b;
cmp = a >= b;
cmp = a == b;
cmp = a != b;
#endif
}
// CHECK: @test7
void test7(int4 *ap, int4 *bp, int c) {
int4 a = *ap;
int4 b = *bp;
// CHECK: add <4 x i32>
// CHECK: sub <4 x i32>
// CHECK: mul <4 x i32>
// CHECK: sdiv <4 x i32>
// CHECK: srem <4 x i32>
a = a + b;
a = a - b;
a = a * b;
a = a / b;
a = a % b;
// CHECK: add <4 x i32>
// CHECK: sub <4 x i32>
// CHECK: mul <4 x i32>
// CHECK: sdiv <4 x i32>
// CHECK: srem <4 x i32>
a = a + c;
a = a - c;
a = a * c;
a = a / c;
a = a % c;
// CHECK: add <4 x i32>
// CHECK: sub <4 x i32>
// CHECK: mul <4 x i32>
// CHECK: sdiv <4 x i32>
// CHECK: srem <4 x i32>
a += b;
a -= b;
a *= b;
a /= b;
a %= b;
// CHECK: add <4 x i32>
// CHECK: sub <4 x i32>
// CHECK: mul <4 x i32>
// CHECK: sdiv <4 x i32>
// CHECK: srem <4 x i32>
a += c;
a -= c;
a *= c;
a /= c;
a %= c;
// Vector comparisons.
// CHECK: icmp slt
// CHECK: icmp sle
// CHECK: icmp sgt
// CHECK: icmp sge
// CHECK: icmp eq
// CHECK: icmp ne
int4 cmp;
cmp = a < b;
cmp = a <= b;
cmp = a > b;
cmp = a >= b;
cmp = a == b;
cmp = a != b;
}
// CHECK: @test8
void test8(float4 *ap, float4 *bp, int c) {
float4 a = *ap;
float4 b = *bp;
// Vector comparisons.
// CHECK: fcmp olt
// CHECK: fcmp ole
// CHECK: fcmp ogt
// CHECK: fcmp oge
// CHECK: fcmp oeq
// CHECK: fcmp une
int4 cmp;
cmp = a < b;
cmp = a <= b;
cmp = a > b;
cmp = a >= b;
cmp = a == b;
cmp = a != b;
}
// CHECK: @test9
// CHECK: extractelement <4 x i32>
int test9(int4 V) {
return V.xy.x;
}
// CHECK: @test10
// CHECK: add <4 x i32>
// CHECK: extractelement <4 x i32>
int test10(int4 V) {
return (V+V).x;
}
// CHECK: @test11
// CHECK: extractelement <4 x i32>
int4 test11a();
int test11() {
return test11a().x;
}
// CHECK: @test12
// CHECK: shufflevector {{.*}} <i32 2, i32 1, i32 0>
// CHECK: shufflevector {{.*}} <i32 0, i32 1, i32 2, i32 undef>
// CHECK: shufflevector {{.*}} <i32 4, i32 5, i32 6, i32 3>
int4 test12(int4 V) {
V.xyz = V.zyx;
return V;
}
// CHECK: @test13
// CHECK: shufflevector {{.*}} <i32 2, i32 1, i32 0, i32 3>
int4 test13(int4 *V) {
return V->zyxw;
}
// CHECK: @test14
void test14(uint4 *ap, uint4 *bp, unsigned c) {
uint4 a = *ap;
uint4 b = *bp;
int4 d;
// CHECK: udiv <4 x i32>
// CHECK: urem <4 x i32>
a = a / b;
a = a % b;
// CHECK: udiv <4 x i32>
// CHECK: urem <4 x i32>
a = a / c;
a = a % c;
// CHECK: icmp ult
// CHECK: icmp ule
// CHECK: icmp ugt
// CHECK: icmp uge
// CHECK: icmp eq
// CHECK: icmp ne
d = a < b;
d = a <= b;
d = a > b;
d = a >= b;
d = a == b;
d = a != b;
}
// CHECK: @test15
int4 test15(uint4 V0) {
// CHECK: icmp eq <4 x i32>
int4 V = !V0;
V = V && V;
V = V || V;
return V;
}