; RUN: opt -S -dxil-op-lower -mtriple=dxil-pc-shadermodel6.3-library %s | FileCheck %s

; Make sure the correct DXIL expansions for atan2 are generated for float and half.

; atan2(y, x) on float.
;
; The expected output divides y by x, feeds the quotient to DXIL unary
; opcode 17 (Atan), and then corrects the result with a chain of selects:
;   x <  0 and y >= 0  ->  atan + pi
;   x <  0 and y <  0  ->  atan - pi
;   x == 0 and y <  0  ->  -pi/2
;   x == 0 and y >= 0  ->   pi/2
; Later selects take priority over earlier ones; when no condition holds the
; plain atan value is returned.
;
; The label directive anchors every pattern below to this function's body so
; that a mismatch is reported here instead of resynchronising further down.
; CHECK-LABEL: define noundef float @atan2_float(
define noundef float @atan2_float(float noundef %y, float noundef %x) {
entry:
; Base value: atan(y / x).
; CHECK: [[DIV:%.+]] = fdiv float %y, %x
; CHECK: [[ATAN:%.+]] = call float @dx.op.unary.f32(i32 17, float [[DIV]])

; The pi-shifted candidates and the four sign tests have no mutual ordering
; requirement, so they are matched as an unordered group.
; 0x400921FB60000000 is pi rounded to float precision.
; CHECK-DAG: [[ADD_PI:%.+]] = fadd float [[ATAN]], 0x400921FB60000000
; CHECK-DAG: [[SUB_PI:%.+]] = fsub float [[ATAN]], 0x400921FB60000000
; CHECK-DAG: [[X_LT_0:%.+]] = fcmp olt float %x, 0.000000e+00
; CHECK-DAG: [[X_EQ_0:%.+]] = fcmp oeq float %x, 0.000000e+00
; CHECK-DAG: [[Y_GE_0:%.+]] = fcmp oge float %y, 0.000000e+00
; CHECK-DAG: [[Y_LT_0:%.+]] = fcmp olt float %y, 0.000000e+00

; Select chain; each stage falls through to the previous stage's value.
; CHECK: [[XLT0_AND_YGE0:%.+]] = and i1 [[X_LT_0]], [[Y_GE_0]]
; CHECK: [[SELECT_ADD_PI:%.+]] = select i1 [[XLT0_AND_YGE0]], float [[ADD_PI]], float [[ATAN]]
; CHECK: [[XLT0_AND_YLT0:%.+]] = and i1 [[X_LT_0]], [[Y_LT_0]]
; CHECK: [[SELECT_SUB_PI:%.+]] = select i1 [[XLT0_AND_YLT0]], float [[SUB_PI]], float [[SELECT_ADD_PI]]
; 0xBFF921FB60000000 / 0x3FF921FB60000000 are -pi/2 and +pi/2 at float precision.
; CHECK: [[XEQ0_AND_YLT0:%.+]] = and i1 [[X_EQ_0]], [[Y_LT_0]]
; CHECK: [[SELECT_NEGHPI:%.+]] = select i1 [[XEQ0_AND_YLT0]], float 0xBFF921FB60000000, float [[SELECT_SUB_PI]]
; CHECK: [[XEQ0_AND_YGE0:%.+]] = and i1 [[X_EQ_0]], [[Y_GE_0]]
; CHECK: [[SELECT_HPI:%.+]] = select i1 [[XEQ0_AND_YGE0]], float 0x3FF921FB60000000, float [[SELECT_NEGHPI]]
; CHECK: ret float [[SELECT_HPI]]
  %elt.atan2 = call float @llvm.atan2.f32(float %y, float %x)
  ret float %elt.atan2
}
| 27 | + |
; atan2(y, x) on half.
;
; The expected output divides y by x, feeds the quotient to DXIL unary
; opcode 17 (Atan), and then corrects the result with a chain of selects:
;   x <  0 and y >= 0  ->  atan + pi
;   x <  0 and y <  0  ->  atan - pi
;   x == 0 and y <  0  ->  -pi/2
;   x == 0 and y >= 0  ->   pi/2
; Later selects take priority over earlier ones; when no condition holds the
; plain atan value is returned.
;
; The label directive anchors every pattern below to this function's body so
; that a mismatch is reported here instead of resynchronising elsewhere.
; CHECK-LABEL: define noundef half @atan2_half(
define noundef half @atan2_half(half noundef %y, half noundef %x) {
entry:
; Base value: atan(y / x).
; CHECK: [[DIV:%.+]] = fdiv half %y, %x
; CHECK: [[ATAN:%.+]] = call half @dx.op.unary.f16(i32 17, half [[DIV]])

; The pi-shifted candidates and the four sign tests have no mutual ordering
; requirement, so they are matched as an unordered group.
; 0xH4248 is pi in IEEE half precision.
; CHECK-DAG: [[ADD_PI:%.+]] = fadd half [[ATAN]], 0xH4248
; CHECK-DAG: [[SUB_PI:%.+]] = fsub half [[ATAN]], 0xH4248
; CHECK-DAG: [[X_LT_0:%.+]] = fcmp olt half %x, 0xH0000
; CHECK-DAG: [[X_EQ_0:%.+]] = fcmp oeq half %x, 0xH0000
; CHECK-DAG: [[Y_GE_0:%.+]] = fcmp oge half %y, 0xH0000
; CHECK-DAG: [[Y_LT_0:%.+]] = fcmp olt half %y, 0xH0000

; Select chain; each stage falls through to the previous stage's value.
; CHECK: [[XLT0_AND_YGE0:%.+]] = and i1 [[X_LT_0]], [[Y_GE_0]]
; CHECK: [[SELECT_ADD_PI:%.+]] = select i1 [[XLT0_AND_YGE0]], half [[ADD_PI]], half [[ATAN]]
; CHECK: [[XLT0_AND_YLT0:%.+]] = and i1 [[X_LT_0]], [[Y_LT_0]]
; CHECK: [[SELECT_SUB_PI:%.+]] = select i1 [[XLT0_AND_YLT0]], half [[SUB_PI]], half [[SELECT_ADD_PI]]
; 0xHBE48 / 0xH3E48 are -pi/2 and +pi/2 in IEEE half precision.
; CHECK: [[XEQ0_AND_YLT0:%.+]] = and i1 [[X_EQ_0]], [[Y_LT_0]]
; CHECK: [[SELECT_NEGHPI:%.+]] = select i1 [[XEQ0_AND_YLT0]], half 0xHBE48, half [[SELECT_SUB_PI]]
; CHECK: [[XEQ0_AND_YGE0:%.+]] = and i1 [[X_EQ_0]], [[Y_GE_0]]
; CHECK: [[SELECT_HPI:%.+]] = select i1 [[XEQ0_AND_YGE0]], half 0xH3E48, half [[SELECT_NEGHPI]]
; CHECK: ret half [[SELECT_HPI]]
  %elt.atan2 = call half @llvm.atan2.f16(half %y, half %x)
  ret half %elt.atan2
}
| 50 | + |
; Declarations of the atan2 intrinsic overloads called by the test functions
; in this file (float first, then half, matching the order of the functions).
declare float @llvm.atan2.f32(float, float)
declare half @llvm.atan2.f16(half, half)
0 commit comments