diff options
Diffstat (limited to 'llvm/test/CodeGen/DirectX/fdot.ll')
| -rw-r--r-- | llvm/test/CodeGen/DirectX/fdot.ll | 94 |
1 files changed, 94 insertions, 0 deletions
diff --git a/llvm/test/CodeGen/DirectX/fdot.ll b/llvm/test/CodeGen/DirectX/fdot.ll
new file mode 100644
index 000000000000..3e13b2ad2650
--- /dev/null
+++ b/llvm/test/CodeGen/DirectX/fdot.ll
@@ -0,0 +1,94 @@
+; RUN: opt -S -dxil-op-lower < %s | FileCheck %s
+
+; Make sure dxil operation function calls for dot are generated for half/float vectors.
+
+; CHECK-LABEL: dot_half2
+define noundef half @dot_half2(<2 x half> noundef %a, <2 x half> noundef %b) {
+entry:
+; CHECK: extractelement <2 x half> %a, i32 0
+; CHECK: extractelement <2 x half> %a, i32 1
+; CHECK: extractelement <2 x half> %b, i32 0
+; CHECK: extractelement <2 x half> %b, i32 1
+; CHECK: call half @dx.op.dot2.f16(i32 54, half %{{.*}}, half %{{.*}}, half %{{.*}}, half %{{.*}})
+  %dx.dot = call half @llvm.dx.dot2.v2f16(<2 x half> %a, <2 x half> %b)
+  ret half %dx.dot
+}
+
+; CHECK-LABEL: dot_half3
+define noundef half @dot_half3(<3 x half> noundef %a, <3 x half> noundef %b) {
+entry:
+; CHECK: extractelement <3 x half> %a, i32 0
+; CHECK: extractelement <3 x half> %a, i32 1
+; CHECK: extractelement <3 x half> %a, i32 2
+; CHECK: extractelement <3 x half> %b, i32 0
+; CHECK: extractelement <3 x half> %b, i32 1
+; CHECK: extractelement <3 x half> %b, i32 2
+; CHECK: call half @dx.op.dot3.f16(i32 55, half %{{.*}}, half %{{.*}}, half %{{.*}}, half %{{.*}}, half %{{.*}}, half %{{.*}})
+  %dx.dot = call half @llvm.dx.dot3.v3f16(<3 x half> %a, <3 x half> %b)
+  ret half %dx.dot
+}
+
+; CHECK-LABEL: dot_half4
+define noundef half @dot_half4(<4 x half> noundef %a, <4 x half> noundef %b) {
+entry:
+; CHECK: extractelement <4 x half> %a, i32 0
+; CHECK: extractelement <4 x half> %a, i32 1
+; CHECK: extractelement <4 x half> %a, i32 2
+; CHECK: extractelement <4 x half> %a, i32 3
+; CHECK: extractelement <4 x half> %b, i32 0
+; CHECK: extractelement <4 x half> %b, i32 1
+; CHECK: extractelement <4 x half> %b, i32 2
+; CHECK: extractelement <4 x half> %b, i32 3
+; CHECK: call half @dx.op.dot4.f16(i32 56, half %{{.*}}, half %{{.*}}, half %{{.*}}, half %{{.*}}, half %{{.*}}, half %{{.*}}, half %{{.*}}, half %{{.*}})
+  %dx.dot = call half @llvm.dx.dot4.v4f16(<4 x half> %a, <4 x half> %b)
+  ret half %dx.dot
+}
+
+; CHECK-LABEL: dot_float2
+define noundef float @dot_float2(<2 x float> noundef %a, <2 x float> noundef %b) {
+entry:
+; CHECK: extractelement <2 x float> %a, i32 0
+; CHECK: extractelement <2 x float> %a, i32 1
+; CHECK: extractelement <2 x float> %b, i32 0
+; CHECK: extractelement <2 x float> %b, i32 1
+; CHECK: call float @dx.op.dot2.f32(i32 54, float %{{.*}}, float %{{.*}}, float %{{.*}}, float %{{.*}})
+  %dx.dot = call float @llvm.dx.dot2.v2f32(<2 x float> %a, <2 x float> %b)
+  ret float %dx.dot
+}
+
+; CHECK-LABEL: dot_float3
+define noundef float @dot_float3(<3 x float> noundef %a, <3 x float> noundef %b) {
+entry:
+; CHECK: extractelement <3 x float> %a, i32 0
+; CHECK: extractelement <3 x float> %a, i32 1
+; CHECK: extractelement <3 x float> %a, i32 2
+; CHECK: extractelement <3 x float> %b, i32 0
+; CHECK: extractelement <3 x float> %b, i32 1
+; CHECK: extractelement <3 x float> %b, i32 2
+; CHECK: call float @dx.op.dot3.f32(i32 55, float %{{.*}}, float %{{.*}}, float %{{.*}}, float %{{.*}}, float %{{.*}}, float %{{.*}})
+  %dx.dot = call float @llvm.dx.dot3.v3f32(<3 x float> %a, <3 x float> %b)
+  ret float %dx.dot
+}
+
+; CHECK-LABEL: dot_float4
+define noundef float @dot_float4(<4 x float> noundef %a, <4 x float> noundef %b) {
+entry:
+; CHECK: extractelement <4 x float> %a, i32 0
+; CHECK: extractelement <4 x float> %a, i32 1
+; CHECK: extractelement <4 x float> %a, i32 2
+; CHECK: extractelement <4 x float> %a, i32 3
+; CHECK: extractelement <4 x float> %b, i32 0
+; CHECK: extractelement <4 x float> %b, i32 1
+; CHECK: extractelement <4 x float> %b, i32 2
+; CHECK: extractelement <4 x float> %b, i32 3
+; CHECK: call float @dx.op.dot4.f32(i32 56, float %{{.*}}, float %{{.*}}, float %{{.*}}, float %{{.*}}, float %{{.*}}, float %{{.*}}, float %{{.*}}, float %{{.*}})
+  %dx.dot = call float @llvm.dx.dot4.v4f32(<4 x float> %a, <4 x float> %b)
+  ret float %dx.dot
+}
+
+declare half @llvm.dx.dot2.v2f16(<2 x half>, <2 x half>)
+declare half @llvm.dx.dot3.v3f16(<3 x half>, <3 x half>)
+declare half @llvm.dx.dot4.v4f16(<4 x half>, <4 x half>)
+declare float @llvm.dx.dot2.v2f32(<2 x float>, <2 x float>)
+declare float @llvm.dx.dot3.v3f32(<3 x float>, <3 x float>)
+declare float @llvm.dx.dot4.v4f32(<4 x float>, <4 x float>)
