Compiler Explorer

Source code

; Module-level data read and written by @baz.
; @n: 32-bit integer declared here but defined in another module (external).
@n = external local_unnamed_addr global i32, align 4
; @arr / @arr1: two 20-element float arrays, zero-initialised, with common
; linkage and 16-byte alignment.
@arr = common local_unnamed_addr global [20 x float] zeroinitializer, align 16
@arr1 = common local_unnamed_addr global [20 x float] zeroinitializer, align 16
; @res: float declared here but defined in another module (external).
@res = external local_unnamed_addr global float, align 4

; float baz(void) -- fully scalar form.
;
; Reads @n and the first four elements of @arr and @arr1, then accumulates
;   bias    = (float)(n * 3)
;   prod[i] = arr1[i] * arr[i]            for i = 0..3
; through two consecutive passes over the same four products. Ignoring
; floating-point rounding, the value stored to @res and returned is
;   2 * (bias + prod[0] + prod[1] + prod[2] + prod[3]).
; All floating-point operations carry the `fast` flag.
define float @baz() {
entry:
  ; bias = (float)(n * 3)
  %n.val = load i32, i32* @n, align 4
  %n.x3 = mul nsw i32 %n.val, 3
  %bias = sitofp i32 %n.x3 to float

  ; Element-wise products of the first four elements of the two arrays.
  %a0 = load float, float* getelementptr inbounds ([20 x float], [20 x float]* @arr, i64 0, i64 0), align 16
  %b0 = load float, float* getelementptr inbounds ([20 x float], [20 x float]* @arr1, i64 0, i64 0), align 16
  %prod0 = fmul fast float %b0, %a0
  %a1 = load float, float* getelementptr inbounds ([20 x float], [20 x float]* @arr, i64 0, i64 1), align 4
  %b1 = load float, float* getelementptr inbounds ([20 x float], [20 x float]* @arr1, i64 0, i64 1), align 4
  %prod1 = fmul fast float %b1, %a1
  %a2 = load float, float* getelementptr inbounds ([20 x float], [20 x float]* @arr, i64 0, i64 2), align 8
  %b2 = load float, float* getelementptr inbounds ([20 x float], [20 x float]* @arr1, i64 0, i64 2), align 8
  %prod2 = fmul fast float %b2, %a2
  %a3 = load float, float* getelementptr inbounds ([20 x float], [20 x float]* @arr, i64 0, i64 3), align 4
  %b3 = load float, float* getelementptr inbounds ([20 x float], [20 x float]* @arr1, i64 0, i64 3), align 4
  %prod3 = fmul fast float %b3, %a3

  ; First pass: bias + prod0 + prod1 + prod2 + prod3.
  %sum0 = fadd fast float %prod0, %bias
  %sum1 = fadd fast float %prod1, %sum0
  %sum2 = fadd fast float %prod2, %sum1
  %sum3 = fadd fast float %prod3, %sum2

  ; Second pass: add the bias and the same four products once more.
  %total.bias = fadd fast float %sum3, %bias
  %total0 = fadd fast float %prod0, %total.bias
  %total1 = fadd fast float %prod1, %total0
  %total2 = fadd fast float %prod2, %total1
  %total3 = fadd fast float %prod3, %total2

  ; Publish the result through @res and also return it.
  store float %total3, float* @res, align 4
  ret float %total3
}

Source code

; float baz(void) -- form with the loads and multiplies done two lanes at a time.
;
; Elements 0..1 and 2..3 of @arr and @arr1 are each loaded as one <2 x float>
; and multiplied lane-wise; the four products are then extracted and fed to
; two scalar accumulation passes. Ignoring floating-point rounding, the value
; stored to @res and returned is
;   2 * ((float)(n * 3) + p0 + p1 + p2 + p3),   p[i] = arr1[i] * arr[i].
; All floating-point operations carry the `fast` flag.
define float @baz() {
entry:
  ; bias = (float)(n * 3)
  %n.val = load i32, i32* @n, align 4
  %n.x3 = mul nsw i32 %n.val, 3
  %bias = sitofp i32 %n.x3 to float

  ; Lanes 0..1: arr1[0..1] * arr[0..1]
  %a.lo = load <2 x float>, <2 x float>* bitcast ([20 x float]* @arr to <2 x float>*), align 16
  %b.lo = load <2 x float>, <2 x float>* bitcast ([20 x float]* @arr1 to <2 x float>*), align 16
  %prod.lo = fmul fast <2 x float> %b.lo, %a.lo
  %p0 = extractelement <2 x float> %prod.lo, i32 0
  %p1 = extractelement <2 x float> %prod.lo, i32 1

  ; Lanes 2..3: arr1[2..3] * arr[2..3]
  %a.hi = load <2 x float>, <2 x float>* bitcast (float* getelementptr inbounds ([20 x float], [20 x float]* @arr, i64 0, i64 2) to <2 x float>*), align 8
  %b.hi = load <2 x float>, <2 x float>* bitcast (float* getelementptr inbounds ([20 x float], [20 x float]* @arr1, i64 0, i64 2) to <2 x float>*), align 8
  %prod.hi = fmul fast <2 x float> %b.hi, %a.hi
  %p2 = extractelement <2 x float> %prod.hi, i32 0
  %p3 = extractelement <2 x float> %prod.hi, i32 1

  ; First pass: bias + p0 + p1 + p2 + p3.
  %sum0 = fadd fast float %p0, %bias
  %sum1 = fadd fast float %p1, %sum0
  %sum2 = fadd fast float %p2, %sum1
  %sum3 = fadd fast float %p3, %sum2

  ; Second pass: add the bias and the same four products once more.
  %total.bias = fadd fast float %sum3, %bias
  %total0 = fadd fast float %p0, %total.bias
  %total1 = fadd fast float %p1, %total0
  %total2 = fadd fast float %p2, %total1
  %total3 = fadd fast float %p3, %total2

  ; Publish the result through @res and also return it.
  store float %total3, float* @res, align 4
  ret float %total3
}

Source code

; float baz(void) -- form mixing scalar products with a 2-lane reduction step.
;
; Elements 0 and 1 are multiplied as scalars; elements 2..3 are loaded and
; multiplied as one <2 x float>. With p[i] = arr1[i] * arr[i] and
; bias = (float)(n * 3), the adds below combine
;   (p2 + p3) + p2 + p1 + p0 + (p1 + p0 + bias) + bias + p3
; which, ignoring floating-point rounding, is
;   2 * (bias + p0 + p1 + p2 + p3).
; That value is stored to @res and returned. All floating-point operations
; carry the `fast` flag.
define float @baz() #0 {
entry:
  ; bias = (float)(n * 3)
  %n.val = load i32, i32* @n, align 4
  %n.x3 = mul nsw i32 %n.val, 3
  %bias = sitofp i32 %n.x3 to float

  ; Scalar products for elements 0 and 1, with the running sum bias + p0 + p1.
  %a0 = load float, float* getelementptr inbounds ([20 x float], [20 x float]* @arr, i64 0, i64 0), align 16
  %b0 = load float, float* getelementptr inbounds ([20 x float], [20 x float]* @arr1, i64 0, i64 0), align 16
  %p0 = fmul fast float %b0, %a0
  %sum0 = fadd fast float %p0, %bias
  %a1 = load float, float* getelementptr inbounds ([20 x float], [20 x float]* @arr, i64 0, i64 1), align 4
  %b1 = load float, float* getelementptr inbounds ([20 x float], [20 x float]* @arr1, i64 0, i64 1), align 4
  %p1 = fmul fast float %b1, %a1
  %sum1 = fadd fast float %p1, %sum0

  ; Vector product for elements 2..3: <p2, p3>.
  %a.hi = load <2 x float>, <2 x float>* bitcast (float* getelementptr inbounds ([20 x float], [20 x float]* @arr, i64 0, i64 2) to <2 x float>*), align 8
  %b.hi = load <2 x float>, <2 x float>* bitcast (float* getelementptr inbounds ([20 x float], [20 x float]* @arr1, i64 0, i64 2) to <2 x float>*), align 8
  %prod.hi = fmul fast <2 x float> %b.hi, %a.hi
  %p2 = extractelement <2 x float> %prod.hi, i32 0
  %p3 = extractelement <2 x float> %prod.hi, i32 1

  ; Move lane 1 into lane 0 and add, so lane 0 of the sum holds p2 + p3
  ; (lane 1 of the shuffled vector is undef and is never read).
  %hi.swapped = shufflevector <2 x float> %prod.hi, <2 x float> undef, <2 x i32> <i32 1, i32 undef>
  %hi.pairsum = fadd fast <2 x float> %prod.hi, %hi.swapped
  %p2.plus.p3 = extractelement <2 x float> %hi.pairsum, i32 0

  ; Fold in the remaining terms one scalar at a time.
  %red0 = fadd fast float %p2.plus.p3, %p2
  %red1 = fadd fast float %red0, %p1
  %red2 = fadd fast float %red1, %p0
  %red3 = fadd fast float %red2, %sum1
  %red4 = fadd fast float %red3, %bias
  %result = fadd fast float %p3, %red4

  ; Publish the result through @res and also return it.
  store float %result, float* @res, align 4
  ret float %result
}