
- Redefines `DXILAttribute` to denote a function attribute, compatible with how it was defined in DXC/LLVM 3.7 - Fix how `DXILAttribute` is emitted to be a struct of set attributes instead of an "or" of the enums - Implement the lowering of `DXILAttribute` to LLVM function attributes in `DXILOpBuilder.cpp`. A custom mapping is defined. - Audit all current ops to specify the correct attributes consistent with DXC. This is done here to allow for testing. - Update testcases in `llvm/test/CodeGen/DirectX` of all ops with attributes to check that the attributes are set - Update testcases of ops that previously had incorrectly set attributes to check that no attributes are set - Defines `DXILProperty` to denote the other type of attributes from DXC used to query properties. - Emit `DXILProperty` as a struct of set attributes. - Updates `DXIL.td` to specify applicable `DXILProperty`s on ops Note: `DXILProperty` was referred to as 'queryable attributes' in design discussion. Changed to property to allow for better expression in `DXIL.td` Resolves #114461 Resolves #115912
103 lines
4.8 KiB
LLVM
103 lines
4.8 KiB
LLVM
; RUN: opt -S -dxil-intrinsic-expansion -mtriple=dxil-pc-shadermodel6.3-library %s | FileCheck %s --check-prefixes=CHECK,EXPCHECK
|
|
; RUN: opt -S -dxil-intrinsic-expansion -dxil-op-lower -mtriple=dxil-pc-shadermodel6.3-library %s | FileCheck %s --check-prefixes=CHECK,DOPCHECK
|
|
|
|
; Make sure dxil operation function calls for dot are generated for int/uint vectors.
|
|
|
|
; Signed dot product of two <2 x i16> vectors.
; Expected output: element 0 of each operand is extracted and multiplied, then
; element 1 is folded in with one multiply-add. The expansion-only run expects
; a call to llvm.dx.imad; the run that also lowers ops expects dx.op.tertiary
; with opcode 48 followed by an attribute-group reference. That reference is
; captured as ATTR here and reused by the later functions in this file.
; CHECK-LABEL: dot_int16_t2
define noundef i16 @dot_int16_t2(<2 x i16> noundef %a, <2 x i16> noundef %b) {
entry:
; CHECK: extractelement <2 x i16> %a, i64 0
; CHECK: extractelement <2 x i16> %b, i64 0
; CHECK: mul i16 %{{.*}}, %{{.*}}
; CHECK: extractelement <2 x i16> %a, i64 1
; CHECK: extractelement <2 x i16> %b, i64 1
; EXPCHECK: call i16 @llvm.dx.imad.i16(i16 %{{.*}}, i16 %{{.*}}, i16 %{{.*}})
; DOPCHECK: call i16 @dx.op.tertiary.i16(i32 48, i16 %{{.*}}, i16 %{{.*}}, i16 %{{.*}}) #[[#ATTR:]]
  ; The overload suffix is v2i16 so that it agrees with the <2 x i16> operands
  ; and with the sdot declaration at the end of the file.
  %dot = call i16 @llvm.dx.sdot.v2i16(<2 x i16> %a, <2 x i16> %b)
  ret i16 %dot
}
|
|
|
|
; Signed dot product of two <4 x i32> vectors.
; Expected output: one multiply for element 0, then one multiply-add for each
; of elements 1, 2 and 3. The expansion-only run expects llvm.dx.imad calls;
; the run that also lowers ops expects dx.op.tertiary with opcode 48, each
; followed by the previously captured attribute-group reference.
; CHECK-LABEL: dot_int4
define noundef i32 @dot_int4(<4 x i32> noundef %a, <4 x i32> noundef %b) {
entry:
; CHECK: extractelement <4 x i32> %a, i64 0
; CHECK: extractelement <4 x i32> %b, i64 0
; CHECK: mul i32 %{{.*}}, %{{.*}}
; CHECK: extractelement <4 x i32> %a, i64 1
; CHECK: extractelement <4 x i32> %b, i64 1
; EXPCHECK: call i32 @llvm.dx.imad.i32(i32 %{{.*}}, i32 %{{.*}}, i32 %{{.*}})
; DOPCHECK: call i32 @dx.op.tertiary.i32(i32 48, i32 %{{.*}}, i32 %{{.*}}, i32 %{{.*}}) #[[#ATTR]]
; CHECK: extractelement <4 x i32> %a, i64 2
; CHECK: extractelement <4 x i32> %b, i64 2
; EXPCHECK: call i32 @llvm.dx.imad.i32(i32 %{{.*}}, i32 %{{.*}}, i32 %{{.*}})
; DOPCHECK: call i32 @dx.op.tertiary.i32(i32 48, i32 %{{.*}}, i32 %{{.*}}, i32 %{{.*}}) #[[#ATTR]]
; CHECK: extractelement <4 x i32> %a, i64 3
; CHECK: extractelement <4 x i32> %b, i64 3
; EXPCHECK: call i32 @llvm.dx.imad.i32(i32 %{{.*}}, i32 %{{.*}}, i32 %{{.*}})
; DOPCHECK: call i32 @dx.op.tertiary.i32(i32 48, i32 %{{.*}}, i32 %{{.*}}, i32 %{{.*}}) #[[#ATTR]]
  %dot = call i32 @llvm.dx.sdot.v4i32(<4 x i32> %a, <4 x i32> %b)
  ret i32 %dot
}
|
|
|
|
; Unsigned dot product of two <3 x i16> vectors.
; Expected output: one multiply for element 0, then one multiply-add for each
; of elements 1 and 2. The expansion-only run expects llvm.dx.umad calls; the
; run that also lowers ops expects dx.op.tertiary with opcode 49, each
; followed by the previously captured attribute-group reference.
; CHECK-LABEL: dot_uint16_t3
define noundef i16 @dot_uint16_t3(<3 x i16> noundef %a, <3 x i16> noundef %b) {
entry:
; CHECK: extractelement <3 x i16> %a, i64 0
; CHECK: extractelement <3 x i16> %b, i64 0
; CHECK: mul i16 %{{.*}}, %{{.*}}
; CHECK: extractelement <3 x i16> %a, i64 1
; CHECK: extractelement <3 x i16> %b, i64 1
; EXPCHECK: call i16 @llvm.dx.umad.i16(i16 %{{.*}}, i16 %{{.*}}, i16 %{{.*}})
; DOPCHECK: call i16 @dx.op.tertiary.i16(i32 49, i16 %{{.*}}, i16 %{{.*}}, i16 %{{.*}}) #[[#ATTR]]
; CHECK: extractelement <3 x i16> %a, i64 2
; CHECK: extractelement <3 x i16> %b, i64 2
; EXPCHECK: call i16 @llvm.dx.umad.i16(i16 %{{.*}}, i16 %{{.*}}, i16 %{{.*}})
; DOPCHECK: call i16 @dx.op.tertiary.i16(i32 49, i16 %{{.*}}, i16 %{{.*}}, i16 %{{.*}}) #[[#ATTR]]
  %dot = call i16 @llvm.dx.udot.v3i16(<3 x i16> %a, <3 x i16> %b)
  ret i16 %dot
}
|
|
|
|
; Unsigned dot product of two <4 x i32> vectors.
; Expected output: one multiply for element 0, then one multiply-add for each
; of elements 1, 2 and 3. The expansion-only run expects llvm.dx.umad calls;
; the run that also lowers ops expects dx.op.tertiary with opcode 49, each
; followed by the previously captured attribute-group reference.
; CHECK-LABEL: dot_uint4
define noundef i32 @dot_uint4(<4 x i32> noundef %a, <4 x i32> noundef %b) {
entry:
; CHECK: extractelement <4 x i32> %a, i64 0
; CHECK: extractelement <4 x i32> %b, i64 0
; CHECK: mul i32 %{{.*}}, %{{.*}}
; CHECK: extractelement <4 x i32> %a, i64 1
; CHECK: extractelement <4 x i32> %b, i64 1
; EXPCHECK: call i32 @llvm.dx.umad.i32(i32 %{{.*}}, i32 %{{.*}}, i32 %{{.*}})
; DOPCHECK: call i32 @dx.op.tertiary.i32(i32 49, i32 %{{.*}}, i32 %{{.*}}, i32 %{{.*}}) #[[#ATTR]]
; CHECK: extractelement <4 x i32> %a, i64 2
; CHECK: extractelement <4 x i32> %b, i64 2
; EXPCHECK: call i32 @llvm.dx.umad.i32(i32 %{{.*}}, i32 %{{.*}}, i32 %{{.*}})
; DOPCHECK: call i32 @dx.op.tertiary.i32(i32 49, i32 %{{.*}}, i32 %{{.*}}, i32 %{{.*}}) #[[#ATTR]]
; CHECK: extractelement <4 x i32> %a, i64 3
; CHECK: extractelement <4 x i32> %b, i64 3
; EXPCHECK: call i32 @llvm.dx.umad.i32(i32 %{{.*}}, i32 %{{.*}}, i32 %{{.*}})
; DOPCHECK: call i32 @dx.op.tertiary.i32(i32 49, i32 %{{.*}}, i32 %{{.*}}, i32 %{{.*}}) #[[#ATTR]]
  %dot = call i32 @llvm.dx.udot.v4i32(<4 x i32> %a, <4 x i32> %b)
  ret i32 %dot
}
|
|
|
|
; Unsigned dot product of two <2 x i64> vectors.
; Expected output: one multiply for element 0, then a single multiply-add for
; element 1. The expansion-only run expects a call to llvm.dx.umad; the run
; that also lowers ops expects dx.op.tertiary with opcode 49 followed by the
; previously captured attribute-group reference.
; NOTE(review): the function name ends in "t4" although the operands have two
; elements; the name is left unchanged so the label below stays stable.
; CHECK-LABEL: dot_uint64_t4
define noundef i64 @dot_uint64_t4(<2 x i64> noundef %a, <2 x i64> noundef %b) {
entry:
; CHECK: extractelement <2 x i64> %a, i64 0
; CHECK: extractelement <2 x i64> %b, i64 0
; CHECK: mul i64 %{{.*}}, %{{.*}}
; CHECK: extractelement <2 x i64> %a, i64 1
; CHECK: extractelement <2 x i64> %b, i64 1
; EXPCHECK: call i64 @llvm.dx.umad.i64(i64 %{{.*}}, i64 %{{.*}}, i64 %{{.*}})
; DOPCHECK: call i64 @dx.op.tertiary.i64(i32 49, i64 %{{.*}}, i64 %{{.*}}, i64 %{{.*}}) #[[#ATTR]]
  %dot = call i64 @llvm.dx.udot.v2i64(<2 x i64> %a, <2 x i64> %b)
  ret i64 %dot
}
|
|
|
|
; DOPCHECK: attributes #[[#ATTR]] = {{{.*}} memory(none) {{.*}}}
|
|
|
|
; Declarations of the signed (sdot) and unsigned (udot) integer dot-product
; intrinsics exercised by this test. Each overload suffix matches the vector
; type that appears in its own signature.
declare i16 @llvm.dx.sdot.v2i16(<2 x i16>, <2 x i16>)
declare i32 @llvm.dx.sdot.v4i32(<4 x i32>, <4 x i32>)
declare i16 @llvm.dx.udot.v3i16(<3 x i16>, <3 x i16>)
declare i32 @llvm.dx.udot.v4i32(<4 x i32>, <4 x i32>)
declare i64 @llvm.dx.udot.v2i64(<2 x i64>, <2 x i64>)
|