| ; RUN: llc -mtriple=amdgcn < %s -verify-machineinstrs | FileCheck -check-prefix=SI %s |
| ; RUN: llc -mtriple=amdgcn -mcpu=tonga < %s -verify-machineinstrs | FileCheck -check-prefix=SI %s |
| |
| ; If a v_readlane_b32 of the [[SAVED]] register appears after the s_or_b64 |
| ; that ORs it into exec, it is likely due to reordering and the restore was |
| ; originally supposed to happen before SI_END_CF. |
| |
| ; SI: s_or_b64 exec, exec, [[SAVED:s\[[0-9]+:[0-9]+\]|[a-z]+]] |
| ; SI-NOT: v_readlane_b32 [[SAVED]] |
| |
; @main: the only function defined in this test. It uses the amdgpu_ps calling
; convention, takes one inreg <4 x i32> argument (%rsrc) and returns void.
;
; Shape of the control flow, as visible in the IR below:
;   main_body - 67 llvm.amdgcn.s.buffer.load.f32 calls on %rsrc at constant
;               offsets 16..420 (%tmp .. %tmp66), all issued before the loop.
;   LOOP      - loop header; leaves to ENDLOOP or continues into ENDIF.
;   ENDIF ... - fsub/fmul/minnum/maxnum/fcmp chains over the loaded values,
;               feeding two ladders of conditional branches.
;   ENDIF2795 - loop latch, branches back to LOOP.
;   ENDLOOP   - exports one value with llvm.amdgcn.exp.f32 and returns.
;
; 0x7FF8000000000000 is a NaN constant; it and poison stand in for many
; operands throughout.
; NOTE(review): this looks like a reduced reproducer -- several values have no
; users. Presumably instruction order and value liveness matter for the checked
; output; confirm before restructuring anything here.
| define amdgpu_ps void @main(<4 x i32> inreg %rsrc) #0 { |
| main_body: |
| %tmp = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 16, i32 0) |
| %tmp1 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 32, i32 0) |
| %tmp2 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 80, i32 0) |
| %tmp3 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 84, i32 0) |
| %tmp4 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 88, i32 0) |
| %tmp5 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 96, i32 0) |
| %tmp6 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 100, i32 0) |
| %tmp7 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 104, i32 0) |
| %tmp8 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 112, i32 0) |
| %tmp9 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 116, i32 0) |
| %tmp10 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 120, i32 0) |
| %tmp11 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 128, i32 0) |
| %tmp12 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 132, i32 0) |
| %tmp13 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 136, i32 0) |
| %tmp14 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 144, i32 0) |
| %tmp15 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 148, i32 0) |
| %tmp16 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 152, i32 0) |
| %tmp17 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 160, i32 0) |
| %tmp18 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 164, i32 0) |
| %tmp19 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 168, i32 0) |
| %tmp20 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 176, i32 0) |
| %tmp21 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 180, i32 0) |
| %tmp22 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 184, i32 0) |
| %tmp23 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 192, i32 0) |
| %tmp24 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 196, i32 0) |
| %tmp25 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 200, i32 0) |
| %tmp26 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 208, i32 0) |
| %tmp27 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 212, i32 0) |
| %tmp28 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 216, i32 0) |
| %tmp29 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 224, i32 0) |
| %tmp30 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 228, i32 0) |
| %tmp31 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 232, i32 0) |
| %tmp32 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 240, i32 0) |
| %tmp33 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 244, i32 0) |
| %tmp34 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 248, i32 0) |
| %tmp35 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 256, i32 0) |
| %tmp36 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 260, i32 0) |
| %tmp37 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 264, i32 0) |
| %tmp38 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 272, i32 0) |
| %tmp39 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 276, i32 0) |
| %tmp40 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 280, i32 0) |
| %tmp41 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 288, i32 0) |
| %tmp42 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 292, i32 0) |
| %tmp43 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 296, i32 0) |
| %tmp44 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 304, i32 0) |
| %tmp45 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 308, i32 0) |
| %tmp46 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 312, i32 0) |
| %tmp47 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 320, i32 0) |
| %tmp48 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 324, i32 0) |
| %tmp49 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 328, i32 0) |
| %tmp50 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 336, i32 0) |
| %tmp51 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 340, i32 0) |
| %tmp52 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 344, i32 0) |
| %tmp53 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 352, i32 0) |
| %tmp54 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 356, i32 0) |
| %tmp55 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 360, i32 0) |
| %tmp56 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 368, i32 0) |
| %tmp57 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 372, i32 0) |
| %tmp58 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 376, i32 0) |
| %tmp59 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 384, i32 0) |
| %tmp60 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 388, i32 0) |
| %tmp61 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 392, i32 0) |
| %tmp62 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 400, i32 0) |
| %tmp63 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 404, i32 0) |
| %tmp64 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 408, i32 0) |
| %tmp65 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 416, i32 0) |
| %tmp66 = call float @llvm.amdgcn.s.buffer.load.f32(<4 x i32> %rsrc, i32 420, i32 0) |
| br label %LOOP |
| |
; Loop header. %temp894.0 and %temp18.0 are carried around the back edge from
; ENDIF2795. The loop is left for ENDLOOP when the llvm.amdgcn.mbcnt.lo(-1, 0)
; result is greater than 4 (signed compare); otherwise control enters ENDIF.
| LOOP: ; preds = %ENDIF2795, %main_body |
| %temp894.0 = phi float [ 0.000000e+00, %main_body ], [ %temp894.1, %ENDIF2795 ] |
| %temp18.0 = phi float [ poison, %main_body ], [ %temp18.1, %ENDIF2795 ] |
| %tid = call i32 @llvm.amdgcn.mbcnt.lo(i32 -1, i32 0) |
| %tmp67 = icmp sgt i32 %tid, 4 |
| br i1 %tmp67, label %ENDLOOP, label %ENDIF |
| |
; Exit block, reached from LOOP and from ELSE2566. Combines %tmp with NaN
; constants, passes the result to llvm.amdgcn.exp.f32 and returns.
| ENDLOOP: ; preds = %ELSE2566, %LOOP |
| %one.sub.a.i = fsub float 1.000000e+00, %tmp |
| %one.sub.ac.i = fmul float %one.sub.a.i, 0x7FF8000000000000 |
| %fmul = fmul float 0x7FF8000000000000, 0x7FF8000000000000 |
| %result.i = fadd float %fmul, %one.sub.ac.i |
| call void @llvm.amdgcn.exp.f32(i32 0, i32 15, float poison, float %result.i, float poison, float 1.000000e+00, i1 true, i1 true) #0 |
| ret void |
| |
; Main loop body. Builds min/max combinations from many of the values loaded
; in main_body. %tmp81, %tmp83, %tmp100, %tmp102, %tmp110, %tmp111, %tmp128,
; %tmp145 and %tmp180 are consumed later by the ELSE2593..ELSE2704 blocks;
; %tmp162, %tmp180 and %tmp195 feed the selects/compares at the end of this block.
| ENDIF: ; preds = %LOOP |
| %tmp68 = fsub float %tmp2, 0x7FF8000000000000 |
| %tmp69 = fsub float %tmp3, 0x7FF8000000000000 |
| %tmp70 = fsub float %tmp4, 0x7FF8000000000000 |
| %tmp71 = fmul float %tmp68, 0.000000e+00 |
| %tmp72 = fmul float %tmp69, 0x7FF8000000000000 |
| %tmp73 = fmul float %tmp70, 0x7FF8000000000000 |
| %tmp74 = fsub float %tmp6, 0x7FF8000000000000 |
| %tmp75 = fsub float %tmp7, 0x7FF8000000000000 |
| %tmp76 = fmul float %tmp74, 0x7FF8000000000000 |
| %tmp77 = fmul float %tmp75, 0.000000e+00 |
| %tmp78 = call float @llvm.minnum.f32(float %tmp73, float %tmp77) |
| %tmp79 = call float @llvm.maxnum.f32(float %tmp71, float 0.000000e+00) |
| %tmp80 = call float @llvm.maxnum.f32(float %tmp72, float %tmp76) |
| %tmp81 = call float @llvm.maxnum.f32(float 0x7FF8000000000000, float %tmp78) |
| %tmp82 = call float @llvm.minnum.f32(float %tmp79, float %tmp80) |
| %tmp83 = call float @llvm.minnum.f32(float %tmp82, float 0x7FF8000000000000) |
| %tmp84 = fsub float %tmp14, 0x7FF8000000000000 |
| %tmp85 = fsub float %tmp15, 0x7FF8000000000000 |
| %tmp86 = fsub float %tmp16, 0x7FF8000000000000 |
| %tmp87 = fmul float %tmp84, 0x7FF8000000000000 |
| %tmp88 = fmul float %tmp85, 0x7FF8000000000000 |
| %tmp89 = fmul float %tmp86, 0x7FF8000000000000 |
| %tmp90 = fsub float %tmp17, 0x7FF8000000000000 |
| %tmp91 = fsub float %tmp18, 0x7FF8000000000000 |
| %tmp92 = fsub float %tmp19, 0x7FF8000000000000 |
| %tmp93 = fmul float %tmp90, 0.000000e+00 |
| %tmp94 = fmul float %tmp91, 0x7FF8000000000000 |
| %tmp95 = fmul float %tmp92, 0x7FF8000000000000 |
| %tmp96 = call float @llvm.minnum.f32(float %tmp88, float %tmp94) |
| %tmp97 = call float @llvm.maxnum.f32(float %tmp87, float %tmp93) |
| %tmp98 = call float @llvm.maxnum.f32(float %tmp89, float %tmp95) |
| %tmp99 = call float @llvm.maxnum.f32(float 0x7FF8000000000000, float %tmp96) |
| %tmp100 = call float @llvm.maxnum.f32(float %tmp99, float 0x7FF8000000000000) |
| %tmp101 = call float @llvm.minnum.f32(float %tmp97, float 0x7FF8000000000000) |
| %tmp102 = call float @llvm.minnum.f32(float %tmp101, float %tmp98) |
| %tmp103 = fsub float %tmp30, 0x7FF8000000000000 |
| %tmp104 = fsub float %tmp31, 0x7FF8000000000000 |
| %tmp105 = fmul float %tmp103, 0.000000e+00 |
| %tmp106 = fmul float %tmp104, 0.000000e+00 |
| %tmp107 = call float @llvm.minnum.f32(float 0x7FF8000000000000, float %tmp105) |
| %tmp108 = call float @llvm.maxnum.f32(float 0x7FF8000000000000, float %tmp106) |
| %tmp109 = call float @llvm.maxnum.f32(float 0x7FF8000000000000, float %tmp107) |
| %tmp110 = call float @llvm.maxnum.f32(float %tmp109, float 0x7FF8000000000000) |
| %tmp111 = call float @llvm.minnum.f32(float 0x7FF8000000000000, float %tmp108) |
| %tmp112 = fsub float %tmp32, 0x7FF8000000000000 |
| %tmp113 = fsub float %tmp33, 0x7FF8000000000000 |
| %tmp114 = fsub float %tmp34, 0x7FF8000000000000 |
| %tmp115 = fmul float %tmp112, 0.000000e+00 |
| %tmp116 = fmul float %tmp113, 0x7FF8000000000000 |
| %tmp117 = fmul float %tmp114, 0x7FF8000000000000 |
| %tmp118 = fsub float %tmp35, 0x7FF8000000000000 |
| %tmp119 = fsub float %tmp36, 0x7FF8000000000000 |
| %tmp120 = fsub float %tmp37, 0x7FF8000000000000 |
| %tmp121 = fmul float %tmp118, 0x7FF8000000000000 |
| %tmp122 = fmul float %tmp119, 0x7FF8000000000000 |
| %tmp123 = fmul float %tmp120, 0x7FF8000000000000 |
| %tmp124 = call float @llvm.minnum.f32(float %tmp115, float %tmp121) |
| %tmp125 = call float @llvm.minnum.f32(float %tmp116, float %tmp122) |
| %tmp126 = call float @llvm.minnum.f32(float %tmp117, float %tmp123) |
| %tmp127 = call float @llvm.maxnum.f32(float %tmp124, float %tmp125) |
| %tmp128 = call float @llvm.maxnum.f32(float %tmp127, float %tmp126) |
| %tmp129 = fsub float %tmp38, 0x7FF8000000000000 |
| %tmp130 = fsub float %tmp39, 0x7FF8000000000000 |
| %tmp131 = fsub float %tmp40, 0x7FF8000000000000 |
| %tmp132 = fmul float %tmp129, 0.000000e+00 |
| %tmp133 = fmul float %tmp130, 0x7FF8000000000000 |
| %tmp134 = fmul float %tmp131, 0x7FF8000000000000 |
| %tmp135 = fsub float %tmp41, 0x7FF8000000000000 |
| %tmp136 = fsub float %tmp42, 0x7FF8000000000000 |
| %tmp137 = fsub float %tmp43, 0x7FF8000000000000 |
| %tmp138 = fmul float %tmp135, 0x7FF8000000000000 |
| %tmp139 = fmul float %tmp136, 0x7FF8000000000000 |
| %tmp140 = fmul float %tmp137, 0x7FF8000000000000 |
| %tmp141 = call float @llvm.minnum.f32(float %tmp132, float %tmp138) |
| %tmp142 = call float @llvm.minnum.f32(float %tmp133, float %tmp139) |
| %tmp143 = call float @llvm.minnum.f32(float %tmp134, float %tmp140) |
| %tmp144 = call float @llvm.maxnum.f32(float %tmp141, float %tmp142) |
| %tmp145 = call float @llvm.maxnum.f32(float %tmp144, float %tmp143) |
| %tmp146 = fsub float %tmp44, 0x7FF8000000000000 |
| %tmp147 = fsub float %tmp45, 0x7FF8000000000000 |
| %tmp148 = fsub float %tmp46, 0x7FF8000000000000 |
| %tmp149 = fmul float %tmp146, 0.000000e+00 |
| %tmp150 = fmul float %tmp147, 0.000000e+00 |
| %tmp151 = fmul float %tmp148, 0x7FF8000000000000 |
| %tmp152 = fsub float %tmp47, 0x7FF8000000000000 |
| %tmp153 = fsub float %tmp48, 0x7FF8000000000000 |
| %tmp154 = fsub float %tmp49, 0x7FF8000000000000 |
| %tmp155 = fmul float %tmp152, 0x7FF8000000000000 |
| %tmp156 = fmul float %tmp153, 0.000000e+00 |
| %tmp157 = fmul float %tmp154, 0x7FF8000000000000 |
| %tmp158 = call float @llvm.minnum.f32(float %tmp149, float %tmp155) |
| %tmp159 = call float @llvm.minnum.f32(float %tmp150, float %tmp156) |
| %tmp160 = call float @llvm.minnum.f32(float %tmp151, float %tmp157) |
| %tmp161 = call float @llvm.maxnum.f32(float %tmp158, float %tmp159) |
| %tmp162 = call float @llvm.maxnum.f32(float %tmp161, float %tmp160) |
| %tmp163 = fsub float %tmp50, 0x7FF8000000000000 |
| %tmp164 = fsub float %tmp51, 0x7FF8000000000000 |
| %tmp165 = fsub float %tmp52, 0x7FF8000000000000 |
| %tmp166 = fmul float %tmp163, 0x7FF8000000000000 |
| %tmp167 = fmul float %tmp164, 0.000000e+00 |
| %tmp168 = fmul float %tmp165, 0.000000e+00 |
| %tmp169 = fsub float %tmp53, 0x7FF8000000000000 |
| %tmp170 = fsub float %tmp54, 0x7FF8000000000000 |
| %tmp171 = fsub float %tmp55, 0x7FF8000000000000 |
; Only use of the loop-carried %temp18.0.
| %tmp172 = fdiv float 1.000000e+00, %temp18.0 |
| %tmp173 = fmul float %tmp169, 0x7FF8000000000000 |
| %tmp174 = fmul float %tmp170, 0x7FF8000000000000 |
| %tmp175 = fmul float %tmp171, %tmp172 |
| %tmp176 = call float @llvm.minnum.f32(float %tmp166, float %tmp173) |
| %tmp177 = call float @llvm.minnum.f32(float %tmp167, float %tmp174) |
| %tmp178 = call float @llvm.minnum.f32(float %tmp168, float %tmp175) |
| %tmp179 = call float @llvm.maxnum.f32(float %tmp176, float %tmp177) |
| %tmp180 = call float @llvm.maxnum.f32(float %tmp179, float %tmp178) |
| %tmp181 = fsub float %tmp62, 0x7FF8000000000000 |
| %tmp182 = fsub float %tmp63, 0x7FF8000000000000 |
| %tmp183 = fsub float %tmp64, 0x7FF8000000000000 |
| %tmp184 = fmul float %tmp181, 0.000000e+00 |
| %tmp185 = fmul float %tmp182, 0x7FF8000000000000 |
| %tmp186 = fmul float %tmp183, 0x7FF8000000000000 |
| %tmp187 = fsub float %tmp65, 0x7FF8000000000000 |
| %tmp188 = fsub float %tmp66, 0x7FF8000000000000 |
| %tmp189 = fmul float %tmp187, 0x7FF8000000000000 |
| %tmp190 = fmul float %tmp188, 0x7FF8000000000000 |
| %tmp191 = call float @llvm.maxnum.f32(float %tmp184, float %tmp189) |
| %tmp192 = call float @llvm.maxnum.f32(float %tmp185, float %tmp190) |
| %tmp193 = call float @llvm.maxnum.f32(float %tmp186, float 0x7FF8000000000000) |
| %tmp194 = call float @llvm.minnum.f32(float %tmp191, float %tmp192) |
| %tmp195 = call float @llvm.minnum.f32(float %tmp194, float %tmp193) |
; Select chain producing %temp292.11, the value every ELSE25xx/26xx/27xx block
; compares against. Two of the select conditions are frozen poison.
| %undef0 = freeze i1 poison |
| %.temp292.7 = select i1 %undef0, float %tmp162, float 0x7FF8000000000000 |
| %temp292.9 = select i1 false, float %tmp180, float %.temp292.7 |
| %undef1 = freeze i1 poison |
| %.temp292.9 = select i1 %undef1, float 0x7FF8000000000000, float %temp292.9 |
| %tmp196 = fcmp ogt float 0x7FF8000000000000, 0.000000e+00 |
| %tmp197 = fcmp olt float 0x7FF8000000000000, %tmp195 |
| %tmp198 = and i1 %tmp196, %tmp197 |
| %tmp199 = fcmp olt float 0x7FF8000000000000, %.temp292.9 |
| %tmp200 = and i1 %tmp198, %tmp199 |
| %temp292.11 = select i1 %tmp200, float 0x7FF8000000000000, float %.temp292.9 |
; Take IF2565 when the mbcnt.lo result is 0, otherwise ELSE2566.
| %tid0 = call i32 @llvm.amdgcn.mbcnt.lo(i32 -1, i32 0) |
| %cmp0 = icmp eq i32 %tid0, 0 |
| br i1 %cmp0, label %IF2565, label %ELSE2566 |
| |
; Computes %tmp218 from %tmp1 via floor and sqrt; %tmp218 becomes %temp18.1 in
; ENDIF2564. %tid1/%cmp1 and %tid4/%cmp4 have no users in this function.
| IF2565: ; preds = %ENDIF |
| %tid1 = call i32 @llvm.amdgcn.mbcnt.lo(i32 -1, i32 0) |
| %cmp1 = icmp eq i32 %tid1, 0 |
| %tmp212 = fadd float %tmp1, 0x7FF8000000000000 |
| %tmp213 = fadd float 0.000000e+00, %tmp212 |
| %floor = call float @llvm.floor.f32(float %tmp213) |
| %tmp214 = fsub float %tmp213, %floor |
| %tid4 = call i32 @llvm.amdgcn.mbcnt.lo(i32 -1, i32 0) |
| %cmp4 = icmp eq i32 %tid4, 0 |
| %tmp215 = fsub float 1.000000e+00, %tmp214 |
| %tmp216 = call float @llvm.sqrt.f32(float %tmp215) |
| %tmp217 = fmul float %tmp216, 0x7FF8000000000000 |
| %tmp218 = fadd float %tmp217, 0x7FF8000000000000 |
| br label %ENDIF2564 |
| |
; Second loop exit: branches to ENDLOOP when %temp292.11 compares equal
; (fcmp oeq) to the mbcnt.lo result bitcast to float; otherwise starts the
; ELSE2593..ELSE2704 ladder.
| ELSE2566: ; preds = %ENDIF |
| %tid2 = call i32 @llvm.amdgcn.mbcnt.lo(i32 -1, i32 0) |
| %tidf = bitcast i32 %tid2 to float |
| %tmp201 = fcmp oeq float %temp292.11, %tidf |
| br i1 %tmp201, label %ENDLOOP, label %ELSE2593 |
| |
; Join of IF2565 and ENDIF2594. Defines %temp894.1 and %temp18.1, the values
; the LOOP phis receive over the back edge. The branch condition mixes compares
; on NaN constants with a compare of the mbcnt.lo result against %tmp206
; (derived from %tmp5). True goes straight to ENDIF2795, false to ELSE2797.
| ENDIF2564: ; preds = %ENDIF2594, %IF2565 |
| %temp894.1 = phi float [ poison, %IF2565 ], [ %temp894.2, %ENDIF2594 ] |
| %temp18.1 = phi float [ %tmp218, %IF2565 ], [ poison, %ENDIF2594 ] |
| %tmp202 = fsub float %tmp5, 0x7FF8000000000000 |
| %tmp203 = fmul float %tmp202, 0x7FF8000000000000 |
| %tmp204 = call float @llvm.maxnum.f32(float 0x7FF8000000000000, float %tmp203) |
| %tmp205 = call float @llvm.minnum.f32(float %tmp204, float 0x7FF8000000000000) |
| %tmp206 = call float @llvm.minnum.f32(float %tmp205, float 0x7FF8000000000000) |
| %tmp207 = fcmp ogt float 0x7FF8000000000000, 0.000000e+00 |
| %tmp208 = fcmp olt float 0x7FF8000000000000, 1.000000e+00 |
| %tmp209 = and i1 %tmp207, %tmp208 |
| %tid3 = call i32 @llvm.amdgcn.mbcnt.lo(i32 -1, i32 0) |
| %tidf3 = bitcast i32 %tid3 to float |
| %tmp210 = fcmp olt float %tidf3, %tmp206 |
| %tmp211 = and i1 %tmp209, %tmp210 |
| br i1 %tmp211, label %ENDIF2795, label %ELSE2797 |
| |
; First ladder, rung 1: to ENDIF2594 when %temp292.11 oeq %tmp81 and
; %tmp81 olt %tmp83; otherwise on to ELSE2596.
| ELSE2593: ; preds = %ELSE2566 |
| %tmp219 = fcmp oeq float %temp292.11, %tmp81 |
| %tmp220 = fcmp olt float %tmp81, %tmp83 |
| %tmp221 = and i1 %tmp219, %tmp220 |
| br i1 %tmp221, label %ENDIF2594, label %ELSE2596 |
| |
; Rung 2: same shape with %tmp100/%tmp102, but the condition is additionally
; OR'ed with a frozen poison bit before branching.
| ELSE2596: ; preds = %ELSE2593 |
| %tmp222 = fcmp oeq float %temp292.11, %tmp100 |
| %tmp223 = fcmp olt float %tmp100, %tmp102 |
| %tmp224 = and i1 %tmp222, %tmp223 |
| %undef_ELSE2596 = freeze i1 poison |
| %brmerge = or i1 %tmp224, %undef_ELSE2596 |
| br i1 %brmerge, label %ENDIF2594, label %ELSE2650 |
| |
; Join for the first ladder. %temp894.2 is 0.0 on every incoming edge except
; the one from ELSE2704, which supplies %spec.select6. %tmp225 has no users.
| ENDIF2594: ; preds = %ELSE2704, %ELSE2650, %ELSE2596, %ELSE2686, %ELSE2668, %ELSE2593 |
| %temp894.2 = phi float [ 0.000000e+00, %ELSE2593 ], [ 0.000000e+00, %ELSE2686 ], [ 0.000000e+00, %ELSE2668 ], [ 0.000000e+00, %ELSE2596 ], [ 0.000000e+00, %ELSE2650 ], [ %spec.select6, %ELSE2704 ] |
| %tmp225 = fmul float %temp894.2, 0x7FF8000000000000 |
| br label %ENDIF2564 |
| |
; Rung 3: compares %temp292.11 with %tmp110 and %tmp110 with %tmp111.
| ELSE2650: ; preds = %ELSE2596 |
| %tmp226 = fcmp oeq float %temp292.11, %tmp110 |
| %tmp227 = fcmp olt float %tmp110, %tmp111 |
| %tmp228 = and i1 %tmp226, %tmp227 |
| br i1 %tmp228, label %ENDIF2594, label %ELSE2668 |
| |
; Rung 4: compares %temp292.11 with %tmp128 and %tmp128 with a NaN constant.
| ELSE2668: ; preds = %ELSE2650 |
| %tmp229 = fcmp oeq float %temp292.11, %tmp128 |
| %tmp230 = fcmp olt float %tmp128, 0x7FF8000000000000 |
| %tmp231 = and i1 %tmp229, %tmp230 |
| br i1 %tmp231, label %ENDIF2594, label %ELSE2686 |
| |
; Rung 5: compares %temp292.11 with %tmp145 and %tmp145 with a NaN constant.
| ELSE2686: ; preds = %ELSE2668 |
| %tmp232 = fcmp oeq float %temp292.11, %tmp145 |
| %tmp233 = fcmp olt float %tmp145, 0x7FF8000000000000 |
| %tmp234 = and i1 %tmp232, %tmp233 |
| br i1 %tmp234, label %ENDIF2594, label %ELSE2704 |
| |
; Last rung: no conditional branch. Produces %spec.select6 (0.0 or the
; loop-carried %temp894.0) for the %temp894.2 phi and goes to ENDIF2594.
| ELSE2704: ; preds = %ELSE2686 |
| %tmp235 = fcmp oeq float %temp292.11, %tmp180 |
| %tmp236 = fcmp olt float %tmp180, 0x7FF8000000000000 |
| %tmp237 = and i1 %tmp235, %tmp236 |
| %undef.ELSE2704 = freeze i1 poison |
| %spec.select = select i1 %undef.ELSE2704, float 0.000000e+00, float %temp894.0 |
| %spec.select6 = select i1 %tmp237, float 0.000000e+00, float %spec.select |
| br label %ENDIF2594 |
| |
; Second ladder, rung 1: min/max over %tmp8..%tmp13. Goes to ENDIF2795 when
; %tmp257 is in (0, 1) and below %tmp258 (ordered compares), else to ELSE2803.
| ELSE2797: ; preds = %ENDIF2564 |
| %tmp241 = fsub float %tmp8, 0x7FF8000000000000 |
| %tmp242 = fsub float %tmp9, 0x7FF8000000000000 |
| %tmp243 = fsub float %tmp10, 0x7FF8000000000000 |
| %tmp244 = fmul float %tmp241, 0x7FF8000000000000 |
| %tmp245 = fmul float %tmp242, 0x7FF8000000000000 |
| %tmp246 = fmul float %tmp243, 0x7FF8000000000000 |
| %tmp247 = fsub float %tmp11, 0x7FF8000000000000 |
| %tmp248 = fsub float %tmp12, 0x7FF8000000000000 |
| %tmp249 = fsub float %tmp13, 0x7FF8000000000000 |
| %tmp250 = fmul float %tmp247, 0x7FF8000000000000 |
| %tmp251 = fmul float %tmp248, 0x7FF8000000000000 |
| %tmp252 = fmul float %tmp249, 0x7FF8000000000000 |
| %tmp253 = call float @llvm.minnum.f32(float %tmp244, float %tmp250) |
| %tmp254 = call float @llvm.minnum.f32(float %tmp245, float %tmp251) |
| %tmp255 = call float @llvm.maxnum.f32(float %tmp246, float %tmp252) |
| %tmp256 = call float @llvm.maxnum.f32(float %tmp253, float %tmp254) |
| %tmp257 = call float @llvm.maxnum.f32(float %tmp256, float 0x7FF8000000000000) |
| %tmp258 = call float @llvm.minnum.f32(float 0x7FF8000000000000, float %tmp255) |
| %tmp259 = fcmp ogt float %tmp257, 0.000000e+00 |
| %tmp260 = fcmp olt float %tmp257, 1.000000e+00 |
| %tmp261 = and i1 %tmp259, %tmp260 |
| %tmp262 = fcmp olt float %tmp257, %tmp258 |
| %tmp263 = and i1 %tmp261, %tmp262 |
| br i1 %tmp263, label %ENDIF2795, label %ELSE2803 |
| |
; Loop latch: ENDIF2564 and every block of the second ladder end up here, and
; the only instruction is the branch back to LOOP.
| ENDIF2795: ; preds = %ELSE2806, %ELSE2797, %ELSE2824, %ELSE2821, %ELSE2803, %ENDIF2564 |
| br label %LOOP |
| |
; Rung 2: same pattern over %tmp20..%tmp25; tests %tmp280 against (0, 1) and
; %tmp282.
| ELSE2803: ; preds = %ELSE2797 |
| %tmp264 = fsub float %tmp20, 0x7FF8000000000000 |
| %tmp265 = fsub float %tmp21, 0x7FF8000000000000 |
| %tmp266 = fsub float %tmp22, 0x7FF8000000000000 |
| %tmp267 = fmul float %tmp264, 0x7FF8000000000000 |
| %tmp268 = fmul float %tmp265, 0x7FF8000000000000 |
| %tmp269 = fmul float %tmp266, 0.000000e+00 |
| %tmp270 = fsub float %tmp23, 0x7FF8000000000000 |
| %tmp271 = fsub float %tmp24, 0x7FF8000000000000 |
| %tmp272 = fsub float %tmp25, 0x7FF8000000000000 |
| %tmp273 = fmul float %tmp270, 0x7FF8000000000000 |
| %tmp274 = fmul float %tmp271, 0x7FF8000000000000 |
| %tmp275 = fmul float %tmp272, 0x7FF8000000000000 |
| %tmp276 = call float @llvm.minnum.f32(float %tmp267, float %tmp273) |
| %tmp277 = call float @llvm.maxnum.f32(float %tmp268, float %tmp274) |
| %tmp278 = call float @llvm.maxnum.f32(float %tmp269, float %tmp275) |
| %tmp279 = call float @llvm.maxnum.f32(float %tmp276, float 0x7FF8000000000000) |
| %tmp280 = call float @llvm.maxnum.f32(float %tmp279, float 0x7FF8000000000000) |
| %tmp281 = call float @llvm.minnum.f32(float 0x7FF8000000000000, float %tmp277) |
| %tmp282 = call float @llvm.minnum.f32(float %tmp281, float %tmp278) |
| %tmp283 = fcmp ogt float %tmp280, 0.000000e+00 |
| %tmp284 = fcmp olt float %tmp280, 1.000000e+00 |
| %tmp285 = and i1 %tmp283, %tmp284 |
| %tmp286 = fcmp olt float %tmp280, %tmp282 |
| %tmp287 = and i1 %tmp285, %tmp286 |
| br i1 %tmp287, label %ENDIF2795, label %ELSE2806 |
| |
; Rung 3: same pattern over %tmp26..%tmp29; tests %tmp300 against (0, 1) and
; %tmp301.
| ELSE2806: ; preds = %ELSE2803 |
| %tmp288 = fsub float %tmp26, 0x7FF8000000000000 |
| %tmp289 = fsub float %tmp27, 0x7FF8000000000000 |
| %tmp290 = fsub float %tmp28, 0x7FF8000000000000 |
| %tmp291 = fmul float %tmp288, 0x7FF8000000000000 |
| %tmp292 = fmul float %tmp289, 0.000000e+00 |
| %tmp293 = fmul float %tmp290, 0x7FF8000000000000 |
| %tmp294 = fsub float %tmp29, 0x7FF8000000000000 |
| %tmp295 = fmul float %tmp294, 0x7FF8000000000000 |
| %tmp296 = call float @llvm.minnum.f32(float %tmp291, float %tmp295) |
| %tmp297 = call float @llvm.minnum.f32(float %tmp292, float 0x7FF8000000000000) |
| %tmp298 = call float @llvm.maxnum.f32(float %tmp293, float 0x7FF8000000000000) |
| %tmp299 = call float @llvm.maxnum.f32(float %tmp296, float %tmp297) |
| %tmp300 = call float @llvm.maxnum.f32(float %tmp299, float 0x7FF8000000000000) |
| %tmp301 = call float @llvm.minnum.f32(float 0x7FF8000000000000, float %tmp298) |
| %tmp302 = fcmp ogt float %tmp300, 0.000000e+00 |
| %tmp303 = fcmp olt float %tmp300, 1.000000e+00 |
| %tmp304 = and i1 %tmp302, %tmp303 |
| %tmp305 = fcmp olt float %tmp300, %tmp301 |
| %tmp306 = and i1 %tmp304, %tmp305 |
| br i1 %tmp306, label %ENDIF2795, label %ELSE2821 |
| |
; Rung 4: min/max over %tmp56..%tmp61 yields %tmp323. Here the compares
; feeding the branch use a NaN constant as their left operand rather than a
; computed value.
| ELSE2821: ; preds = %ELSE2806 |
| %tmp307 = fsub float %tmp56, 0x7FF8000000000000 |
| %tmp308 = fsub float %tmp57, 0x7FF8000000000000 |
| %tmp309 = fsub float %tmp58, 0x7FF8000000000000 |
| %tmp310 = fmul float %tmp307, 0x7FF8000000000000 |
| %tmp311 = fmul float %tmp308, 0.000000e+00 |
| %tmp312 = fmul float %tmp309, 0x7FF8000000000000 |
| %tmp313 = fsub float %tmp59, 0x7FF8000000000000 |
| %tmp314 = fsub float %tmp60, 0x7FF8000000000000 |
| %tmp315 = fsub float %tmp61, 0x7FF8000000000000 |
| %tmp316 = fmul float %tmp313, 0x7FF8000000000000 |
| %tmp317 = fmul float %tmp314, 0x7FF8000000000000 |
| %tmp318 = fmul float %tmp315, 0x7FF8000000000000 |
| %tmp319 = call float @llvm.maxnum.f32(float %tmp310, float %tmp316) |
| %tmp320 = call float @llvm.maxnum.f32(float %tmp311, float %tmp317) |
| %tmp321 = call float @llvm.maxnum.f32(float %tmp312, float %tmp318) |
| %tmp322 = call float @llvm.minnum.f32(float %tmp319, float %tmp320) |
| %tmp323 = call float @llvm.minnum.f32(float %tmp322, float %tmp321) |
| %tmp324 = fcmp ogt float 0x7FF8000000000000, 0.000000e+00 |
| %tmp325 = fcmp olt float 0x7FF8000000000000, 1.000000e+00 |
| %tmp326 = and i1 %tmp324, %tmp325 |
| %tmp327 = fcmp olt float 0x7FF8000000000000, %tmp323 |
| %tmp328 = and i1 %tmp326, %tmp327 |
| br i1 %tmp328, label %ENDIF2795, label %ELSE2824 |
| |
; End of the second ladder. %.2849 has no users; control always continues to
; ENDIF2795.
| ELSE2824: ; preds = %ELSE2821 |
| %undef = freeze i1 poison |
| %.2849 = select i1 %undef, float 0.000000e+00, float 1.000000e+00 |
| br label %ENDIF2795 |
| } |
| |
; AMDGPU-specific intrinsics called by @main.
| declare float @llvm.amdgcn.s.buffer.load.f32(<4 x i32>, i32, i32) #1 |
| declare i32 @llvm.amdgcn.mbcnt.lo(i32, i32) #1 |
| declare void @llvm.amdgcn.exp.f32(i32, i32, float, float, float, float, i1, i1) #0 |
| |
; Target-independent floating-point intrinsics called by @main.
| declare float @llvm.maxnum.f32(float, float) #1 |
| declare float @llvm.minnum.f32(float, float) #1 |
| declare float @llvm.sqrt.f32(float) #1 |
| declare float @llvm.floor.f32(float) #1 |
| |
; Attribute groups. #0 is attached to @main and to the export intrinsic;
; #1 is attached to every other intrinsic declared above.
| attributes #0 = { nounwind } |
| attributes #1 = { nounwind readnone } |