| # NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py UTC_ARGS: --version 3 |
| # RUN: llc -mtriple=amdgcn -mcpu=gfx1100 -mattr=+real-true16 -run-pass=si-fix-sgpr-copies -verify-machineinstrs -o - %s | FileCheck --check-prefixes=REAL16 %s |
| # RUN: llc -mtriple=amdgcn -mcpu=gfx1100 -mattr=-real-true16 -run-pass=si-fix-sgpr-copies -verify-machineinstrs -o - %s | FileCheck --check-prefixes=FAKE16 %s |
| |
| --- |
| name: fmac_f16 |
| body: | |
| bb.0: |
| ; REAL16-LABEL: name: fmac_f16 |
| ; REAL16: [[DEF:%[0-9]+]]:vgpr_32 = IMPLICIT_DEF |
| ; REAL16-NEXT: [[DEF1:%[0-9]+]]:sreg_32 = IMPLICIT_DEF |
| ; REAL16-NEXT: [[DEF2:%[0-9]+]]:sreg_32 = IMPLICIT_DEF |
| ; REAL16-NEXT: [[V_CVT_F32_U32_e64_:%[0-9]+]]:vgpr_32 = V_CVT_F32_U32_e64 [[DEF]], 0, 0, implicit $mode, implicit $exec |
| ; REAL16-NEXT: [[V_FMAC_F16_t16_e64_:%[0-9]+]]:vgpr_16 = nofpexcept V_FMAC_F16_t16_e64 0, killed [[DEF1]], 0, [[DEF2]], 0, [[V_CVT_F32_U32_e64_]].lo16, 0, 0, 0, implicit $mode, implicit $exec |
| ; |
| ; FAKE16-LABEL: name: fmac_f16 |
| ; FAKE16: [[DEF:%[0-9]+]]:vgpr_32 = IMPLICIT_DEF |
| ; FAKE16-NEXT: [[DEF1:%[0-9]+]]:sreg_32 = IMPLICIT_DEF |
| ; FAKE16-NEXT: [[DEF2:%[0-9]+]]:sreg_32 = IMPLICIT_DEF |
| ; FAKE16-NEXT: [[V_CVT_F32_U32_e64_:%[0-9]+]]:vgpr_32 = V_CVT_F32_U32_e64 [[DEF]], 0, 0, implicit $mode, implicit $exec |
| ; FAKE16-NEXT: [[V_FMAC_F16_fake16_e64_:%[0-9]+]]:vgpr_32 = nofpexcept V_FMAC_F16_fake16_e64 0, killed [[DEF1]], 0, [[DEF2]], 0, [[V_CVT_F32_U32_e64_]], 0, 0, implicit $mode, implicit $exec |
| %0:vgpr_32 = IMPLICIT_DEF |
| %1:sreg_32 = IMPLICIT_DEF |
| %2:sreg_32 = IMPLICIT_DEF |
| %3:vgpr_32 = V_CVT_F32_U32_e64 %0:vgpr_32, 0, 0, implicit $mode, implicit $exec |
| %4:sreg_32 = COPY %3:vgpr_32 |
| %5:sreg_32 = nofpexcept S_FMAC_F16 killed %1:sreg_32, %2:sreg_32, %4:sreg_32, implicit $mode |
| ... |
| |
| --- |
| name: ceil_f16 |
| body: | |
| bb.0: |
| ; REAL16-LABEL: name: ceil_f16 |
| ; REAL16: [[DEF:%[0-9]+]]:vgpr_32 = IMPLICIT_DEF |
| ; REAL16-NEXT: [[V_CVT_F32_U32_e64_:%[0-9]+]]:vgpr_32 = V_CVT_F32_U32_e64 [[DEF]], 0, 0, implicit $mode, implicit $exec |
| ; REAL16-NEXT: [[V_CEIL_F16_t16_e64_:%[0-9]+]]:vgpr_16 = nofpexcept V_CEIL_F16_t16_e64 0, [[V_CVT_F32_U32_e64_]].lo16, 0, 0, 0, implicit $mode, implicit $exec |
| ; |
| ; FAKE16-LABEL: name: ceil_f16 |
| ; FAKE16: [[DEF:%[0-9]+]]:vgpr_32 = IMPLICIT_DEF |
| ; FAKE16-NEXT: [[V_CVT_F32_U32_e64_:%[0-9]+]]:vgpr_32 = V_CVT_F32_U32_e64 [[DEF]], 0, 0, implicit $mode, implicit $exec |
| ; FAKE16-NEXT: [[V_CEIL_F16_fake16_e64_:%[0-9]+]]:vgpr_32 = nofpexcept V_CEIL_F16_fake16_e64 0, [[V_CVT_F32_U32_e64_]], 0, 0, implicit $mode, implicit $exec |
| %0:vgpr_32 = IMPLICIT_DEF |
| %1:vgpr_32 = V_CVT_F32_U32_e64 %0:vgpr_32, 0, 0, implicit $mode, implicit $exec |
| %2:sreg_32 = COPY %1:vgpr_32 |
| %3:sreg_32 = nofpexcept S_CEIL_F16 killed %2:sreg_32, implicit $mode |
| ... |
| |
| --- |
| name: floor_f16 |
| body: | |
| bb.0: |
| ; REAL16-LABEL: name: floor_f16 |
| ; REAL16: [[DEF:%[0-9]+]]:vgpr_32 = IMPLICIT_DEF |
| ; REAL16-NEXT: [[V_CVT_F32_U32_e64_:%[0-9]+]]:vgpr_32 = V_CVT_F32_U32_e64 [[DEF]], 0, 0, implicit $mode, implicit $exec |
| ; REAL16-NEXT: [[V_FLOOR_F16_t16_e64_:%[0-9]+]]:vgpr_16 = nofpexcept V_FLOOR_F16_t16_e64 0, [[V_CVT_F32_U32_e64_]].lo16, 0, 0, 0, implicit $mode, implicit $exec |
| ; |
| ; FAKE16-LABEL: name: floor_f16 |
| ; FAKE16: [[DEF:%[0-9]+]]:vgpr_32 = IMPLICIT_DEF |
| ; FAKE16-NEXT: [[V_CVT_F32_U32_e64_:%[0-9]+]]:vgpr_32 = V_CVT_F32_U32_e64 [[DEF]], 0, 0, implicit $mode, implicit $exec |
| ; FAKE16-NEXT: [[V_FLOOR_F16_fake16_e64_:%[0-9]+]]:vgpr_32 = nofpexcept V_FLOOR_F16_fake16_e64 0, [[V_CVT_F32_U32_e64_]], 0, 0, implicit $mode, implicit $exec |
| %0:vgpr_32 = IMPLICIT_DEF |
| %1:vgpr_32 = V_CVT_F32_U32_e64 %0:vgpr_32, 0, 0, implicit $mode, implicit $exec |
| %2:sreg_32 = COPY %1:vgpr_32 |
| %3:sreg_32 = nofpexcept S_FLOOR_F16 killed %2:sreg_32, implicit $mode |
| ... |