
Summary: This patch enables .rgba accessors to ext_vector_type types and adds tests for syntax validation and code generation. 'a' and 'b' can appear either in the point access mode or the numeric access mode (for indices 10 and 11). To disambiguate between the two usages, the accessor type is explicitly passed to relevant methods. Reviewers: rsmith Subscribers: Anastasia, bader, srhines, cfe-commits Differential Revision: http://reviews.llvm.org/D20602 llvm-svn: 276455
341 lines
6.9 KiB
C
341 lines
6.9 KiB
C
// RUN: %clang_cc1 -emit-llvm %s -o - | FileCheck %s
|
|
|
|
typedef __attribute__(( ext_vector_type(4) )) float float4;
|
|
typedef __attribute__(( ext_vector_type(2) )) float float2;
|
|
typedef __attribute__(( ext_vector_type(4) )) int int4;
|
|
typedef __attribute__(( ext_vector_type(4) )) unsigned int uint4;
|
|
|
|
// CHECK: @foo = global <4 x float> <float 1.000000e+00, float 2.000000e+00, float 3.000000e+00, float 4.000000e+00>
|
|
float4 foo = (float4){ 1.0, 2.0, 3.0, 4.0 };
|
|
|
|
// CHECK: @bar = constant <4 x float> <float 1.000000e+00, float 2.000000e+00, float 3.000000e+00, float 0x7FF0000000000000>
|
|
const float4 bar = (float4){ 1.0, 2.0, 3.0, __builtin_inff() };
|
|
|
|
// CHECK: @test1
|
|
// CHECK: fadd <4 x float>
|
|
float4 test1(float4 V) {
|
|
return V.wzyx+V;
|
|
}
|
|
|
|
float2 vec2, vec2_2;
|
|
float4 vec4, vec4_2;
|
|
float f;
|
|
|
|
// CHECK: @test2
|
|
// CHECK: shufflevector {{.*}} <i32 0, i32 1>
|
|
// CHECK: extractelement
|
|
// CHECK: shufflevector {{.*}} <i32 1, i32 1, i32 1, i32 1>
|
|
// CHECK: insertelement
|
|
// CHECK: shufflevector {{.*}} <i32 1, i32 0>
|
|
void test2() {
|
|
vec2 = vec4.xy; // shorten
|
|
f = vec2.x; // extract elt
|
|
vec4 = vec4.yyyy; // splat
|
|
|
|
vec2.x = f; // insert one.
|
|
vec2.yx = vec2; // reverse
|
|
}
|
|
|
|
// CHECK: @test3
|
|
// CHECK: store <4 x float> <float 1.000000e+00, float 2.000000e+00, float 3.000000e+00, float 4.000000e+00>
|
|
void test3(float4 *out) {
|
|
*out = ((float4) {1.0f, 2.0f, 3.0f, 4.0f });
|
|
}
|
|
|
|
// CHECK: @test4
|
|
// CHECK: store <4 x float>
|
|
// CHECK: store <4 x float>
|
|
void test4(float4 *out) {
|
|
float a = 1.0f;
|
|
float b = 2.0f;
|
|
float c = 3.0f;
|
|
float d = 4.0f;
|
|
*out = ((float4) {a,b,c,d});
|
|
}
|
|
|
|
// CHECK: @test5
|
|
// CHECK: shufflevector {{.*}} <4 x i32> zeroinitializer
|
|
// CHECK: fmul <4 x float>
|
|
// CHECK: fmul <4 x float>
|
|
// CHECK: shufflevector {{.*}} <4 x i32> zeroinitializer
|
|
// CHECK: fmul <4 x float>
|
|
void test5(float4 *out) {
|
|
float a;
|
|
float4 b;
|
|
|
|
a = 1.0f;
|
|
b = a;
|
|
b = b * 5.0f;
|
|
b = 5.0f * b;
|
|
b *= a;
|
|
|
|
*out = b;
|
|
}
|
|
|
|
// CHECK: @test6
|
|
void test6(float4 *ap, float4 *bp, float c) {
|
|
float4 a = *ap;
|
|
float4 b = *bp;
|
|
|
|
// CHECK: fadd <4 x float>
|
|
// CHECK: fsub <4 x float>
|
|
// CHECK: fmul <4 x float>
|
|
// CHECK: fdiv <4 x float>
|
|
a = a + b;
|
|
a = a - b;
|
|
a = a * b;
|
|
a = a / b;
|
|
|
|
// CHECK: fadd <4 x float>
|
|
// CHECK: fsub <4 x float>
|
|
// CHECK: fmul <4 x float>
|
|
// CHECK: fdiv <4 x float>
|
|
a = a + c;
|
|
a = a - c;
|
|
a = a * c;
|
|
a = a / c;
|
|
|
|
// CHECK: fadd <4 x float>
|
|
// CHECK: fsub <4 x float>
|
|
// CHECK: fmul <4 x float>
|
|
// CHECK: fdiv <4 x float>
|
|
a += b;
|
|
a -= b;
|
|
a *= b;
|
|
a /= b;
|
|
|
|
// CHECK: fadd <4 x float>
|
|
// CHECK: fsub <4 x float>
|
|
// CHECK: fmul <4 x float>
|
|
// CHECK: fdiv <4 x float>
|
|
a += c;
|
|
a -= c;
|
|
a *= c;
|
|
a /= c;
|
|
|
|
// Vector comparisons can sometimes crash the x86 backend: rdar://6326239,
|
|
// reject them until the implementation is stable.
|
|
#if 0
|
|
int4 cmp;
|
|
cmp = a < b;
|
|
cmp = a <= b;
|
|
cmp = a < b;
|
|
cmp = a >= b;
|
|
cmp = a == b;
|
|
cmp = a != b;
|
|
#endif
|
|
}
|
|
|
|
// CHECK: @test7
|
|
void test7(int4 *ap, int4 *bp, int c) {
|
|
int4 a = *ap;
|
|
int4 b = *bp;
|
|
|
|
// CHECK: add <4 x i32>
|
|
// CHECK: sub <4 x i32>
|
|
// CHECK: mul <4 x i32>
|
|
// CHECK: sdiv <4 x i32>
|
|
// CHECK: srem <4 x i32>
|
|
a = a + b;
|
|
a = a - b;
|
|
a = a * b;
|
|
a = a / b;
|
|
a = a % b;
|
|
|
|
// CHECK: add <4 x i32>
|
|
// CHECK: sub <4 x i32>
|
|
// CHECK: mul <4 x i32>
|
|
// CHECK: sdiv <4 x i32>
|
|
// CHECK: srem <4 x i32>
|
|
a = a + c;
|
|
a = a - c;
|
|
a = a * c;
|
|
a = a / c;
|
|
a = a % c;
|
|
|
|
// CHECK: add <4 x i32>
|
|
// CHECK: sub <4 x i32>
|
|
// CHECK: mul <4 x i32>
|
|
// CHECK: sdiv <4 x i32>
|
|
// CHECK: srem <4 x i32>
|
|
a += b;
|
|
a -= b;
|
|
a *= b;
|
|
a /= b;
|
|
a %= b;
|
|
|
|
// CHECK: add <4 x i32>
|
|
// CHECK: sub <4 x i32>
|
|
// CHECK: mul <4 x i32>
|
|
// CHECK: sdiv <4 x i32>
|
|
// CHECK: srem <4 x i32>
|
|
a += c;
|
|
a -= c;
|
|
a *= c;
|
|
a /= c;
|
|
a %= c;
|
|
|
|
|
|
// Vector comparisons.
|
|
// CHECK: icmp slt
|
|
// CHECK: icmp sle
|
|
// CHECK: icmp sgt
|
|
// CHECK: icmp sge
|
|
// CHECK: icmp eq
|
|
// CHECK: icmp ne
|
|
int4 cmp;
|
|
cmp = a < b;
|
|
cmp = a <= b;
|
|
cmp = a > b;
|
|
cmp = a >= b;
|
|
cmp = a == b;
|
|
cmp = a != b;
|
|
}
|
|
|
|
// CHECK: @test8
|
|
void test8(float4 *ap, float4 *bp, int c) {
|
|
float4 a = *ap;
|
|
float4 b = *bp;
|
|
|
|
// Vector comparisons.
|
|
// CHECK: fcmp olt
|
|
// CHECK: fcmp ole
|
|
// CHECK: fcmp ogt
|
|
// CHECK: fcmp oge
|
|
// CHECK: fcmp oeq
|
|
// CHECK: fcmp une
|
|
int4 cmp;
|
|
cmp = a < b;
|
|
cmp = a <= b;
|
|
cmp = a > b;
|
|
cmp = a >= b;
|
|
cmp = a == b;
|
|
cmp = a != b;
|
|
}
|
|
|
|
// CHECK: @test9
|
|
// CHECK: extractelement <4 x i32>
|
|
int test9(int4 V) {
|
|
return V.xy.x;
|
|
}
|
|
|
|
// CHECK: @test10
|
|
// CHECK: add <4 x i32>
|
|
// CHECK: extractelement <4 x i32>
|
|
int test10(int4 V) {
|
|
return (V+V).x;
|
|
}
|
|
|
|
// CHECK: @test11
|
|
// CHECK: extractelement <4 x i32>
|
|
int4 test11a();
|
|
int test11() {
|
|
return test11a().x;
|
|
}
|
|
|
|
// CHECK: @test12
|
|
// CHECK: shufflevector {{.*}} <i32 2, i32 1, i32 0>
|
|
// CHECK: shufflevector {{.*}} <i32 0, i32 1, i32 2, i32 undef>
|
|
// CHECK: shufflevector {{.*}} <i32 4, i32 5, i32 6, i32 3>
|
|
int4 test12(int4 V) {
|
|
V.xyz = V.zyx;
|
|
return V;
|
|
}
|
|
|
|
// CHECK: @test13
|
|
// CHECK: shufflevector {{.*}} <i32 2, i32 1, i32 0, i32 3>
|
|
int4 test13(int4 *V) {
|
|
return V->zyxw;
|
|
}
|
|
|
|
// CHECK: @test14
|
|
void test14(uint4 *ap, uint4 *bp, unsigned c) {
|
|
uint4 a = *ap;
|
|
uint4 b = *bp;
|
|
int4 d;
|
|
|
|
// CHECK: udiv <4 x i32>
|
|
// CHECK: urem <4 x i32>
|
|
a = a / b;
|
|
a = a % b;
|
|
|
|
// CHECK: udiv <4 x i32>
|
|
// CHECK: urem <4 x i32>
|
|
a = a / c;
|
|
a = a % c;
|
|
|
|
// CHECK: icmp ult
|
|
// CHECK: icmp ule
|
|
// CHECK: icmp ugt
|
|
// CHECK: icmp uge
|
|
// CHECK: icmp eq
|
|
// CHECK: icmp ne
|
|
d = a < b;
|
|
d = a <= b;
|
|
d = a > b;
|
|
d = a >= b;
|
|
d = a == b;
|
|
d = a != b;
|
|
}
|
|
|
|
// CHECK: @test15
|
|
int4 test15(uint4 V0) {
|
|
// CHECK: icmp eq <4 x i32>
|
|
int4 V = !V0;
|
|
V = V && V;
|
|
V = V || V;
|
|
return V;
|
|
}
|
|
|
|
// CHECK: @test16
|
|
void test16(float2 a, float2 b) {
|
|
float2 t0 = (a + b) / 2;
|
|
}
|
|
|
|
typedef char char16 __attribute__((ext_vector_type(16)));
|
|
|
|
// CHECK: @test17
|
|
void test17(void) {
|
|
char16 valA;
|
|
char valB;
|
|
char valC;
|
|
char16 destVal = valC ? valA : valB;
|
|
}
|
|
|
|
typedef __attribute__(( ext_vector_type(16) )) float float16;
|
|
|
|
float16 vec16, vec16_2;
|
|
|
|
// CHECK: @test_rgba
|
|
void test_rgba() {
|
|
// CHECK: fadd <4 x float>
|
|
vec4_2 = vec4.abgr + vec4;
|
|
|
|
// CHECK: shufflevector {{.*}} <i32 0, i32 1>
|
|
vec2 = vec4.rg;
|
|
// CHECK: shufflevector {{.*}} <i32 2, i32 3>
|
|
vec2_2 = vec4.ba;
|
|
// CHECK: extractelement {{.*}} 2
|
|
f = vec4.b;
|
|
// CHECK: shufflevector {{.*}} <i32 2, i32 2, i32 2, i32 2>
|
|
vec4_2 = vec4_2.bbbb;
|
|
|
|
// CHECK: insertelement {{.*}} 0
|
|
vec2.r = f;
|
|
// CHECK: shufflevector {{.*}} <i32 1, i32 0>
|
|
vec2.gr = vec2;
|
|
|
|
// CHECK: extractelement {{.*}} 0
|
|
f = vec4_2.rg.r;
|
|
// CHECK: shufflevector {{.*}} <i32 2, i32 1, i32 0>
|
|
// CHECK: shufflevector {{.*}} <i32 0, i32 1, i32 2, i32 undef>
|
|
// CHECK: shufflevector {{.*}} <i32 4, i32 5, i32 6, i32 3>
|
|
vec4.rgb = vec4.bgr;
|
|
|
|
// CHECK: extractelement {{.*}} 11
|
|
// CHECK: insertelement {{.*}} 2
|
|
vec4.b = vec16.sb;
|
|
// CHECK: shufflevector {{.*}} <i32 10, i32 11, i32 12, i32 13>
|
|
vec4_2 = vec16.sabcd;
|
|
}
|