; Compiler Explorer
;
; Source code

; Computes sum(a[i] * b[i]) over two buffers of doubles, 8 lanes at a time:
; a main loop over full <8 x double> vectors, one masked step for the
; remaining 1..7 elements, then a horizontal add of the 8 partial sums.
;
; Arguments: %0 and %1 are non-null, 16-byte-aligned pointers to objects that
;            are dereferenceable for at least 40 bytes each.
;            NOTE(review): the symbol name suggests these are Julia array
;            objects compiled from a function called `mydotavx` - confirm.
; Returns:   the accumulated dot product as a double.
;
; NOTE(review): only the count field of %0 is ever loaded; the same count is
; used to bound the loads from %1's buffer. Nothing here checks that the
; second buffer holds at least that many elements - verify at the caller.
define double @julia_mydotavx_4009({}* nonnull align 16 dereferenceable(40) %0, {}* nonnull align 16 dereferenceable(40) %1) {
top:
  ; %5 = i64 stored at pointer-slot index 3 of %0 (byte offset 24 with 8-byte
  ; pointers). It is used below as the element count - presumably the array
  ; length field; confirm against the object layout.
  %2 = bitcast {}* %0 to {}**
  %3 = getelementptr inbounds {}*, {}** %2, i64 3
  %4 = bitcast {}** %3 to i64*
  %5 = load i64, i64* %4, align 8
  ; %7 / %9 = first pointer-sized field of each argument, used below as the
  ; byte base address of the double data for the first / second operand.
  %6 = bitcast {}* %0 to i8**
  %7 = load i8*, i8** %6, align 8
  %8 = bitcast {}* %1 to i8**
  %9 = load i8*, i8** %8, align 8
  ; Tell the optimizer the count is non-zero.
  %10 = icmp ne i64 %5, 0
  call void @llvm.assume(i1 %10)
  ; %11 = count - 8: the last start index at which a full 8-wide load fits.
  %11 = add nsw i64 %5, -8
  ; Fewer than 8 elements (unsigned compare): skip the main loop entirely.
  %.not26 = icmp ult i64 %5, 8
  br i1 %.not26, label %L41, label %L34

; Main loop: one full 8-element vector per iteration.
L34:                                              ; preds = %L34, %top
  ; Element index, starting at 0 and advancing by 8.
  %value_phi428 = phi i64 [ %13, %L34 ], [ 0, %top ]
  ; Running 8-lane accumulator, starting at all zeros.
  %value_phi27 = phi <8 x double> [ %res.i18, %L34 ], [ zeroinitializer, %top ]
  ; Byte offset = index * 8 (shift by 3; one double is 8 bytes).
  %12 = shl i64 %value_phi428, 3
  ; Load 8 doubles from the first buffer (only 8-byte alignment is assumed).
  %ptr.1.i22 = getelementptr inbounds i8, i8* %7, i64 %12
  %ptr.2.i23 = bitcast i8* %ptr.1.i22 to <8 x double>*
  %res.i24 = load <8 x double>, <8 x double>* %ptr.2.i23, align 8
  ; Load the matching 8 doubles from the second buffer.
  %ptr.1.i19 = getelementptr inbounds i8, i8* %9, i64 %12
  %ptr.2.i20 = bitcast i8* %ptr.1.i19 to <8 x double>*
  %res.i21 = load <8 x double>, <8 x double>* %ptr.2.i20, align 8
  ; acc = a * b + acc, lane-wise, with fast-math flags
  ; (reassoc nsz arcp contract afn) permitting relaxed FP transformations.
  %res.i18 = call reassoc nsz arcp contract afn <8 x double> @llvm.fma.v8f64(<8 x double> %res.i24, <8 x double> %res.i21, <8 x double> %value_phi27)
  %13 = add nuw nsw i64 %value_phi428, 8
  ; Leave the loop once the next index is past count - 8 (signed compare),
  ; i.e. when another full 8-wide load would no longer fit.
  %.not = icmp sgt i64 %13, %11
  br i1 %.not, label %L41, label %L34

; Join point after (or instead of) the main loop.
L41:                                              ; preds = %L34, %top
  ; Accumulator and index as they stand on entry: zeros / 0 when the loop was
  ; skipped, otherwise the values produced by the last loop iteration.
  %value_phi.lcssa = phi <8 x double> [ zeroinitializer, %top ], [ %res.i18, %L34 ]
  %value_phi4.lcssa = phi i64 [ 0, %top ], [ %13, %L34 ]
  ; Any elements left over (index < count)? If so, handle them with a mask.
  %.not25 = icmp slt i64 %value_phi4.lcssa, %5
  br i1 %.not25, label %L44, label %L64

; Masked tail: process the remaining r = count mod 8 elements.
L44:                                              ; preds = %L41
  ; Build an 8-bit lane mask from the low bits of the count:
  ;   ((count + 7) & 7) ^ 7  ==  8 - r   for r in 1..7
  ;   0xFF >> (8 - r)        ==  a byte with the low r bits set
  ; (i8 -1 is 0xFF; lshr is a logical shift, so zeros are shifted in.)
  %14 = trunc i64 %5 to i8
  %15 = add i8 %14, 7
  %16 = and i8 %15, 7
  %17 = xor i8 %16, 7
  %18 = lshr i8 -1, %17
  ; Byte offset of the first leftover element.
  %19 = shl i64 %value_phi4.lcssa, 3
  %ptr.1.i13 = getelementptr inbounds i8, i8* %7, i64 %19
  %ptr.2.i14 = bitcast i8* %ptr.1.i13 to <8 x double>*
  ; Reinterpret the mask byte as one i1 per lane
  ; (bit k -> lane k on a little-endian target).
  %mask.0.i15 = bitcast i8 %18 to <8 x i1>
  ; Masked load from the first buffer: disabled lanes are not read from
  ; memory and take the passthrough value 0.0. The i32 8 is the alignment.
  %res.i16 = call <8 x double> @llvm.masked.load.v8f64.p0v8f64(<8 x double>* nonnull %ptr.2.i14, i32 8, <8 x i1> %mask.0.i15, <8 x double> zeroinitializer)
  ; Same masked load from the second buffer, using the same mask.
  %ptr.1.i = getelementptr inbounds i8, i8* %9, i64 %19
  %ptr.2.i = bitcast i8* %ptr.1.i to <8 x double>*
  %res.i12 = call <8 x double> @llvm.masked.load.v8f64.p0v8f64(<8 x double>* nonnull %ptr.2.i, i32 8, <8 x i1> %mask.0.i15, <8 x double> zeroinitializer)
  ; acc' = a * b + acc for all lanes ...
  %res.i10 = call reassoc nsz arcp contract afn <8 x double> @llvm.fma.v8f64(<8 x double> %res.i16, <8 x double> %res.i12, <8 x double> %value_phi.lcssa)
  ; ... then keep acc' only in enabled lanes; disabled lanes keep the old
  ; accumulator value unchanged.
  %res.i9 = select reassoc nsz arcp contract <8 x i1> %mask.0.i15, <8 x double> %res.i10, <8 x double> %value_phi.lcssa
  br label %L64

; Final reduction.
L64:                                              ; preds = %L44, %L41
  ; Accumulator including the tail if there was one.
  %value_phi5 = phi <8 x double> [ %res.i9, %L44 ], [ %value_phi.lcssa, %L41 ]
  ; Horizontal sum of the 8 lanes, seeded with 0.0. The reassoc flag lets the
  ; backend pick the summation order.
  %res.i = call reassoc nsz arcp contract afn double @llvm.experimental.vector.reduce.v2.fadd.f64.v8f64(double 0.000000e+00, <8 x double> %value_phi5)
  ret double %res.i
}

; Intrinsic declarations. The attribute groups they reference (#3 .. #7) are
; not defined in the visible part of this listing.

; Function Attrs: nounwind willreturn
; Optimizer hint; called once in the function's entry block on the result of
; the "count != 0" comparison.
declare void @llvm.assume(i1) #3

; Function Attrs: nounwind readnone speculatable willreturn
; Lane-wise fused multiply-add on 8 doubles; used for the accumulator update
; in both the main loop and the masked tail.
declare <8 x double> @llvm.fma.v8f64(<8 x double>, <8 x double>, <8 x double>) #4

; Function Attrs: argmemonly nounwind readonly willreturn
; Masked vector load: (pointer, alignment, lane mask, passthrough). Used twice
; in the tail block, once per input buffer.
declare <8 x double> @llvm.masked.load.v8f64.p0v8f64(<8 x double>*, i32 immarg, <8 x i1>, <8 x double>) #5

; Function Attrs: nounwind readnone willreturn
; Horizontal floating-point add of a vector: (start value, vector). Used for
; the final reduction of the 8-lane accumulator.
declare double @llvm.experimental.vector.reduce.v2.fadd.f64.v8f64(double, <8 x double>) #6

; Function Attrs: argmemonly nounwind willreturn
; Not referenced by the function definition visible in this listing.
declare void @llvm.lifetime.start.p0i8(i64 immarg, i8* nocapture) #7

; Function Attrs: argmemonly nounwind willreturn
; Not referenced by the function definition visible in this listing.
declare void @llvm.lifetime.end.p0i8(i64 immarg, i8* nocapture) #7