
Fixes #152585. The `dot2add` DXILOpFunction should be `dx.op.dot2AddHalf.f32` (i.e. it has [a single overload that's a float](https://github.com/microsoft/DirectXShaderCompiler/blob/main/utils/hct/hctdb.py#L3960), rather than no overloads). It was also being defined for too low of a DXIL version - [dxc says SM6.4](https://github.com/microsoft/DirectXShaderCompiler/blob/main/utils/hct/hctdb.py#L740).
176 lines
12 KiB
HLSL
176 lines
12 KiB
HLSL
// RUN: %clang_cc1 -finclude-default-header -fnative-half-type -triple \
|
|
// RUN: dxil-pc-shadermodel6.4-compute %s -emit-llvm -o - | \
|
|
// RUN: FileCheck %s --check-prefixes=CHECK,CHECK-DXIL
|
|
// RUN: %clang_cc1 -finclude-default-header -fnative-half-type -triple \
|
|
// RUN: spirv-pc-vulkan-compute %s -emit-llvm -o - | \
|
|
// RUN: FileCheck %s --check-prefixes=CHECK,CHECK-SPIRV
|
|
|
|
// Test basic lowering to runtime function call.
|
|
|
|
// CHECK-LABEL: define {{.*}}test_default_parameter_type
|
|
float test_default_parameter_type(half2 p1, half2 p2, float p3) {
|
|
// CHECK-SPIRV: %[[MUL:.*]] = call reassoc nnan ninf nsz arcp afn half @llvm.spv.fdot.v2f16(<2 x half> %{{.*}}, <2 x half> %{{.*}})
|
|
// CHECK-SPIRV: %[[CONV:.*]] = fpext reassoc nnan ninf nsz arcp afn half %[[MUL]] to float
|
|
// CHECK-SPIRV: %[[C:.*]] = load float, ptr %c.addr.i, align 4
|
|
// CHECK-SPIRV: %[[RES:.*]] = fadd reassoc nnan ninf nsz arcp afn float %[[CONV]], %[[C]]
|
|
// CHECK-DXIL: %[[AX:.*]] = extractelement <2 x half> %{{.*}}, i32 0
|
|
// CHECK-DXIL: %[[AY:.*]] = extractelement <2 x half> %{{.*}}, i32 1
|
|
// CHECK-DXIL: %[[BX:.*]] = extractelement <2 x half> %{{.*}}, i32 0
|
|
// CHECK-DXIL: %[[BY:.*]] = extractelement <2 x half> %{{.*}}, i32 1
|
|
// CHECK-DXIL: %[[RES:.*]] = call {{.*}} float @llvm.dx.dot2add(float %{{.*}}, half %[[AX]], half %[[AY]], half %[[BX]], half %[[BY]])
|
|
// CHECK: ret float %[[RES]]
|
|
return dot2add(p1, p2, p3);
|
|
}
|
|
|
|
// CHECK-LABEL: define {{.*}}test_float_arg2_type
|
|
float test_float_arg2_type(half2 p1, float2 p2, float p3) {
|
|
// CHECK: %conv = fptrunc reassoc nnan ninf nsz arcp afn <2 x float> %{{.*}} to <2 x half>
|
|
// CHECK-SPIRV: %[[MUL:.*]] = call reassoc nnan ninf nsz arcp afn half @llvm.spv.fdot.v2f16(<2 x half> %{{.*}}, <2 x half> %{{.*}})
|
|
// CHECK-SPIRV: %[[CONV:.*]] = fpext reassoc nnan ninf nsz arcp afn half %[[MUL]] to float
|
|
// CHECK-SPIRV: %[[C:.*]] = load float, ptr %c.addr.i, align 4
|
|
// CHECK-SPIRV: %[[RES:.*]] = fadd reassoc nnan ninf nsz arcp afn float %[[CONV]], %[[C]]
|
|
// CHECK-DXIL: %[[AX:.*]] = extractelement <2 x half> %{{.*}}, i32 0
|
|
// CHECK-DXIL: %[[AY:.*]] = extractelement <2 x half> %{{.*}}, i32 1
|
|
// CHECK-DXIL: %[[BX:.*]] = extractelement <2 x half> %{{.*}}, i32 0
|
|
// CHECK-DXIL: %[[BY:.*]] = extractelement <2 x half> %{{.*}}, i32 1
|
|
// CHECK-DXIL: %[[RES:.*]] = call {{.*}} float @llvm.dx.dot2add(float %{{.*}}, half %[[AX]], half %[[AY]], half %[[BX]], half %[[BY]])
|
|
// CHECK: ret float %[[RES]]
|
|
return dot2add(p1, p2, p3);
|
|
}
|
|
|
|
// CHECK-LABEL: define {{.*}}test_float_arg1_type
|
|
float test_float_arg1_type(float2 p1, half2 p2, float p3) {
|
|
// CHECK: %conv = fptrunc reassoc nnan ninf nsz arcp afn <2 x float> %{{.*}} to <2 x half>
|
|
// CHECK-SPIRV: %[[MUL:.*]] = call reassoc nnan ninf nsz arcp afn half @llvm.spv.fdot.v2f16(<2 x half> %{{.*}}, <2 x half> %{{.*}})
|
|
// CHECK-SPIRV: %[[CONV:.*]] = fpext reassoc nnan ninf nsz arcp afn half %[[MUL]] to float
|
|
// CHECK-SPIRV: %[[C:.*]] = load float, ptr %c.addr.i, align 4
|
|
// CHECK-SPIRV: %[[RES:.*]] = fadd reassoc nnan ninf nsz arcp afn float %[[CONV]], %[[C]]
|
|
// CHECK-DXIL: %[[AX:.*]] = extractelement <2 x half> %{{.*}}, i32 0
|
|
// CHECK-DXIL: %[[AY:.*]] = extractelement <2 x half> %{{.*}}, i32 1
|
|
// CHECK-DXIL: %[[BX:.*]] = extractelement <2 x half> %{{.*}}, i32 0
|
|
// CHECK-DXIL: %[[BY:.*]] = extractelement <2 x half> %{{.*}}, i32 1
|
|
// CHECK-DXIL: %[[RES:.*]] = call {{.*}} float @llvm.dx.dot2add(float %{{.*}}, half %[[AX]], half %[[AY]], half %[[BX]], half %[[BY]])
|
|
// CHECK: ret float %[[RES]]
|
|
return dot2add(p1, p2, p3);
|
|
}
|
|
|
|
// CHECK-LABEL: define {{.*}}test_double_arg3_type
|
|
float test_double_arg3_type(half2 p1, half2 p2, double p3) {
|
|
// CHECK: %conv = fptrunc reassoc nnan ninf nsz arcp afn double %{{.*}} to float
|
|
// CHECK-SPIRV: %[[MUL:.*]] = call reassoc nnan ninf nsz arcp afn half @llvm.spv.fdot.v2f16(<2 x half> %{{.*}}, <2 x half> %{{.*}})
|
|
// CHECK-SPIRV: %[[CONV:.*]] = fpext reassoc nnan ninf nsz arcp afn half %[[MUL]] to float
|
|
// CHECK-SPIRV: %[[C:.*]] = load float, ptr %c.addr.i, align 4
|
|
// CHECK-SPIRV: %[[RES:.*]] = fadd reassoc nnan ninf nsz arcp afn float %[[CONV]], %[[C]]
|
|
// CHECK-DXIL: %[[AX:.*]] = extractelement <2 x half> %{{.*}}, i32 0
|
|
// CHECK-DXIL: %[[AY:.*]] = extractelement <2 x half> %{{.*}}, i32 1
|
|
// CHECK-DXIL: %[[BX:.*]] = extractelement <2 x half> %{{.*}}, i32 0
|
|
// CHECK-DXIL: %[[BY:.*]] = extractelement <2 x half> %{{.*}}, i32 1
|
|
// CHECK-DXIL: %[[RES:.*]] = call {{.*}} float @llvm.dx.dot2add(float %{{.*}}, half %[[AX]], half %[[AY]], half %[[BX]], half %[[BY]])
|
|
// CHECK: ret float %[[RES]]
|
|
return dot2add(p1, p2, p3);
|
|
}
|
|
|
|
// CHECK-LABEL: define {{.*}}test_float_arg1_arg2_type
|
|
float test_float_arg1_arg2_type(float2 p1, float2 p2, float p3) {
|
|
// CHECK: %conv = fptrunc reassoc nnan ninf nsz arcp afn <2 x float> %{{.*}} to <2 x half>
|
|
// CHECK: %conv1 = fptrunc reassoc nnan ninf nsz arcp afn <2 x float> %{{.*}} to <2 x half>
|
|
// CHECK-SPIRV: %[[MUL:.*]] = call reassoc nnan ninf nsz arcp afn half @llvm.spv.fdot.v2f16(<2 x half> %{{.*}}, <2 x half> %{{.*}})
|
|
// CHECK-SPIRV: %[[CONV:.*]] = fpext reassoc nnan ninf nsz arcp afn half %[[MUL]] to float
|
|
// CHECK-SPIRV: %[[C:.*]] = load float, ptr %c.addr.i, align 4
|
|
// CHECK-SPIRV: %[[RES:.*]] = fadd reassoc nnan ninf nsz arcp afn float %[[CONV]], %[[C]]
|
|
// CHECK-DXIL: %[[AX:.*]] = extractelement <2 x half> %{{.*}}, i32 0
|
|
// CHECK-DXIL: %[[AY:.*]] = extractelement <2 x half> %{{.*}}, i32 1
|
|
// CHECK-DXIL: %[[BX:.*]] = extractelement <2 x half> %{{.*}}, i32 0
|
|
// CHECK-DXIL: %[[BY:.*]] = extractelement <2 x half> %{{.*}}, i32 1
|
|
// CHECK-DXIL: %[[RES:.*]] = call {{.*}} float @llvm.dx.dot2add(float %{{.*}}, half %[[AX]], half %[[AY]], half %[[BX]], half %[[BY]])
|
|
// CHECK: ret float %[[RES]]
|
|
return dot2add(p1, p2, p3);
|
|
}
|
|
|
|
// CHECK-LABEL: define {{.*}}test_double_arg1_arg2_type
|
|
float test_double_arg1_arg2_type(double2 p1, double2 p2, float p3) {
|
|
// CHECK: %conv = fptrunc reassoc nnan ninf nsz arcp afn <2 x double> %{{.*}} to <2 x half>
|
|
// CHECK: %conv1 = fptrunc reassoc nnan ninf nsz arcp afn <2 x double> %{{.*}} to <2 x half>
|
|
// CHECK-SPIRV: %[[MUL:.*]] = call reassoc nnan ninf nsz arcp afn half @llvm.spv.fdot.v2f16(<2 x half> %{{.*}}, <2 x half> %{{.*}})
|
|
// CHECK-SPIRV: %[[CONV:.*]] = fpext reassoc nnan ninf nsz arcp afn half %[[MUL]] to float
|
|
// CHECK-SPIRV: %[[C:.*]] = load float, ptr %c.addr.i, align 4
|
|
// CHECK-SPIRV: %[[RES:.*]] = fadd reassoc nnan ninf nsz arcp afn float %[[CONV]], %[[C]]
|
|
// CHECK-DXIL: %[[AX:.*]] = extractelement <2 x half> %{{.*}}, i32 0
|
|
// CHECK-DXIL: %[[AY:.*]] = extractelement <2 x half> %{{.*}}, i32 1
|
|
// CHECK-DXIL: %[[BX:.*]] = extractelement <2 x half> %{{.*}}, i32 0
|
|
// CHECK-DXIL: %[[BY:.*]] = extractelement <2 x half> %{{.*}}, i32 1
|
|
// CHECK-DXIL: %[[RES:.*]] = call {{.*}} float @llvm.dx.dot2add(float %{{.*}}, half %[[AX]], half %[[AY]], half %[[BX]], half %[[BY]])
|
|
// CHECK: ret float %[[RES]]
|
|
return dot2add(p1, p2, p3);
|
|
}
|
|
|
|
// CHECK-LABEL: define {{.*}}test_int16_arg1_arg2_type
|
|
float test_int16_arg1_arg2_type(int16_t2 p1, int16_t2 p2, float p3) {
|
|
// CHECK: %conv = sitofp <2 x i16> %{{.*}} to <2 x half>
|
|
// CHECK: %conv1 = sitofp <2 x i16> %{{.*}} to <2 x half>
|
|
// CHECK-SPIRV: %[[MUL:.*]] = call reassoc nnan ninf nsz arcp afn half @llvm.spv.fdot.v2f16(<2 x half> %{{.*}}, <2 x half> %{{.*}})
|
|
// CHECK-SPIRV: %[[CONV:.*]] = fpext reassoc nnan ninf nsz arcp afn half %[[MUL]] to float
|
|
// CHECK-SPIRV: %[[C:.*]] = load float, ptr %c.addr.i, align 4
|
|
// CHECK-SPIRV: %[[RES:.*]] = fadd reassoc nnan ninf nsz arcp afn float %[[CONV]], %[[C]]
|
|
// CHECK-DXIL: %[[AX:.*]] = extractelement <2 x half> %{{.*}}, i32 0
|
|
// CHECK-DXIL: %[[AY:.*]] = extractelement <2 x half> %{{.*}}, i32 1
|
|
// CHECK-DXIL: %[[BX:.*]] = extractelement <2 x half> %{{.*}}, i32 0
|
|
// CHECK-DXIL: %[[BY:.*]] = extractelement <2 x half> %{{.*}}, i32 1
|
|
// CHECK-DXIL: %[[RES:.*]] = call {{.*}} float @llvm.dx.dot2add(float %{{.*}}, half %[[AX]], half %[[AY]], half %[[BX]], half %[[BY]])
|
|
// CHECK: ret float %[[RES]]
|
|
return dot2add(p1, p2, p3);
|
|
}
|
|
|
|
// CHECK-LABEL: define {{.*}}test_int32_arg1_arg2_type
|
|
float test_int32_arg1_arg2_type(int32_t2 p1, int32_t2 p2, float p3) {
|
|
// CHECK: %conv = sitofp <2 x i32> %{{.*}} to <2 x half>
|
|
// CHECK: %conv1 = sitofp <2 x i32> %{{.*}} to <2 x half>
|
|
// CHECK-SPIRV: %[[MUL:.*]] = call reassoc nnan ninf nsz arcp afn half @llvm.spv.fdot.v2f16(<2 x half> %{{.*}}, <2 x half> %{{.*}})
|
|
// CHECK-SPIRV: %[[CONV:.*]] = fpext reassoc nnan ninf nsz arcp afn half %[[MUL]] to float
|
|
// CHECK-SPIRV: %[[C:.*]] = load float, ptr %c.addr.i, align 4
|
|
// CHECK-SPIRV: %[[RES:.*]] = fadd reassoc nnan ninf nsz arcp afn float %[[CONV]], %[[C]]
|
|
// CHECK-DXIL: %[[AX:.*]] = extractelement <2 x half> %{{.*}}, i32 0
|
|
// CHECK-DXIL: %[[AY:.*]] = extractelement <2 x half> %{{.*}}, i32 1
|
|
// CHECK-DXIL: %[[BX:.*]] = extractelement <2 x half> %{{.*}}, i32 0
|
|
// CHECK-DXIL: %[[BY:.*]] = extractelement <2 x half> %{{.*}}, i32 1
|
|
// CHECK-DXIL: %[[RES:.*]] = call {{.*}} float @llvm.dx.dot2add(float %{{.*}}, half %[[AX]], half %[[AY]], half %[[BX]], half %[[BY]])
|
|
// CHECK: ret float %[[RES]]
|
|
return dot2add(p1, p2, p3);
|
|
}
|
|
|
|
// CHECK-LABEL: define {{.*}}test_int64_arg1_arg2_type
|
|
float test_int64_arg1_arg2_type(int64_t2 p1, int64_t2 p2, float p3) {
|
|
// CHECK: %conv = sitofp <2 x i64> %{{.*}} to <2 x half>
|
|
// CHECK: %conv1 = sitofp <2 x i64> %{{.*}} to <2 x half>
|
|
// CHECK-SPIRV: %[[MUL:.*]] = call reassoc nnan ninf nsz arcp afn half @llvm.spv.fdot.v2f16(<2 x half> %{{.*}}, <2 x half> %{{.*}})
|
|
// CHECK-SPIRV: %[[CONV:.*]] = fpext reassoc nnan ninf nsz arcp afn half %[[MUL]] to float
|
|
// CHECK-SPIRV: %[[C:.*]] = load float, ptr %c.addr.i, align 4
|
|
// CHECK-SPIRV: %[[RES:.*]] = fadd reassoc nnan ninf nsz arcp afn float %[[CONV]], %[[C]]
|
|
// CHECK-DXIL: %[[AX:.*]] = extractelement <2 x half> %{{.*}}, i32 0
|
|
// CHECK-DXIL: %[[AY:.*]] = extractelement <2 x half> %{{.*}}, i32 1
|
|
// CHECK-DXIL: %[[BX:.*]] = extractelement <2 x half> %{{.*}}, i32 0
|
|
// CHECK-DXIL: %[[BY:.*]] = extractelement <2 x half> %{{.*}}, i32 1
|
|
// CHECK-DXIL: %[[RES:.*]] = call {{.*}} float @llvm.dx.dot2add(float %{{.*}}, half %[[AX]], half %[[AY]], half %[[BX]], half %[[BY]])
|
|
// CHECK: ret float %[[RES]]
|
|
return dot2add(p1, p2, p3);
|
|
}
|
|
|
|
// CHECK-LABEL: define {{.*}}test_bool_arg1_arg2_type
|
|
float test_bool_arg1_arg2_type(bool2 p1, bool2 p2, float p3) {
|
|
// CHECK: %loadedv = trunc <2 x i32> %{{.*}} to <2 x i1>
|
|
// CHECK: %conv = uitofp <2 x i1> %loadedv to <2 x half>
|
|
// CHECK: %loadedv1 = trunc <2 x i32> %{{.*}} to <2 x i1>
|
|
// CHECK: %conv2 = uitofp <2 x i1> %loadedv1 to <2 x half>
|
|
// CHECK-SPIRV: %[[MUL:.*]] = call reassoc nnan ninf nsz arcp afn half @llvm.spv.fdot.v2f16(<2 x half> %{{.*}}, <2 x half> %{{.*}})
|
|
// CHECK-SPIRV: %[[CONV:.*]] = fpext reassoc nnan ninf nsz arcp afn half %[[MUL]] to float
|
|
// CHECK-SPIRV: %[[C:.*]] = load float, ptr %c.addr.i, align 4
|
|
// CHECK-SPIRV: %[[RES:.*]] = fadd reassoc nnan ninf nsz arcp afn float %[[CONV]], %[[C]]
|
|
// CHECK-DXIL: %[[AX:.*]] = extractelement <2 x half> %{{.*}}, i32 0
|
|
// CHECK-DXIL: %[[AY:.*]] = extractelement <2 x half> %{{.*}}, i32 1
|
|
// CHECK-DXIL: %[[BX:.*]] = extractelement <2 x half> %{{.*}}, i32 0
|
|
// CHECK-DXIL: %[[BY:.*]] = extractelement <2 x half> %{{.*}}, i32 1
|
|
// CHECK-DXIL: %[[RES:.*]] = call {{.*}} float @llvm.dx.dot2add(float %{{.*}}, half %[[AX]], half %[[AY]], half %[[BX]], half %[[BY]])
|
|
// CHECK: ret float %[[RES]]
|
|
return dot2add(p1, p2, p3);
|
|
}
|