[AArch64] add tests for fadd -> fma combines; NFC

The transform to create a final fma was added with: D132837 / c98a46fee6 These tests are intended to show the minimal fast-math-flags necessary to enable the fold: currently only the final fadd needs to have "reassoc".
2022-09-21 08:56:25 -04:00 · 2022-09-21 08:56:25 -04:00 · ddd27a3d39
parent b84be9f2f1
commit ddd27a3d39
1 changed files with 32 additions and 0 deletions
--- a/llvm/test/CodeGen/AArch64/fadd-combines.ll
+++ b/llvm/test/CodeGen/AArch64/fadd-combines.ll
@ -315,5 +315,37 @@ define float @fadd_fma_fmul_extra_use_3(float %a, float %b, float %c, float %d,
  ret float %a2
 }

+define float @fmac_sequence_innermost_fmul(float %a, float %b, float %c, float %d, float %e, float %f, float %g) {
+; CHECK-LABEL: fmac_sequence_innermost_fmul:
+; CHECK:       // %bb.0:
+; CHECK-NEXT:    fmadd s0, s0, s1, s6
+; CHECK-NEXT:    fmadd s0, s2, s3, s0
+; CHECK-NEXT:    fmadd s0, s4, s5, s0
+; CHECK-NEXT:    ret
+  %t0 = fmul float %a, %b
+  %t1 = fmul contract float %c, %d
+  %t2 = fadd contract float %t0, %t1
+  %t3 = fmul contract float %e, %f
+  %t4 = fadd contract float %t2, %t3
+  %t5 = fadd contract reassoc float %t4, %g
+  ret float %t5
+}
+
+define float @fmac_sequence_innermost_fmul_intrinsics(float %a, float %b, float %c, float %d, float %e, float %f, float %g) {
+; CHECK-LABEL: fmac_sequence_innermost_fmul_intrinsics:
+; CHECK:       // %bb.0:
+; CHECK-NEXT:    fmadd s0, s0, s1, s6
+; CHECK-NEXT:    fmadd s0, s2, s3, s0
+; CHECK-NEXT:    fmadd s0, s4, s5, s0
+; CHECK-NEXT:    ret
+  %t0 = fmul float %a, %b
+  %t1 = call float @llvm.fma.f32(float %c, float %d, float %t0)
+  %t2 = call float @llvm.fma.f32(float %e, float %f, float %t1)
+  %t5 = fadd contract reassoc float %t2, %g
+  ret float %t5
+}
+
+declare float @llvm.fma.f32(float, float, float)
+
 declare void @use(double)