Thanks for using Compiler Explorer
Sponsors
Jakt
C++
Ada
Analysis
Android Java
Android Kotlin
Assembly
C
C3
Carbon
C++ (Circle)
CIRCT
Clean
CMake
CMakeScript
COBOL
C++ for OpenCL
MLIR
Cppx
Cppx-Blue
Cppx-Gold
Cpp2-cppfront
Crystal
C#
CUDA C++
D
Dart
Elixir
Erlang
Fortran
F#
Go
Haskell
HLSL
Hook
Hylo
ispc
Java
Julia
Kotlin
LLVM IR
LLVM MIR
Modula-2
Nim
Objective-C
Objective-C++
OCaml
OpenCL C
Pascal
Pony
Python
Racket
Ruby
Rust
Snowball
Scala
Solidity
Spice
Swift
LLVM TableGen
Toit
TypeScript Native
V
Vala
Visual Basic
Zig
Javascript
GIMPLE
llvm source #1
Output
Compile to binary object
Link to binary
Execute the code
Intel asm syntax
Demangle identifiers
Verbose demangling
Filters
Unused labels
Library functions
Directives
Comments
Horizontal whitespace
Debug intrinsics
Compiler
clang (assertions trunk)
clang (trunk)
clang 10.0.0
clang 10.0.1
clang 11.0.0
clang 11.0.1
clang 12.0.0
clang 12.0.1
clang 13.0.0
clang 14.0.0
clang 15.0.0
clang 16.0.0
clang 17.0.1
clang 18.1.0
clang 4.0.1
clang 5.0.0
clang 6.0.0
clang 7.0.0
clang 8.0.0
clang 9.0.0
llc (assertions trunk)
llc (trunk)
llc 10.0.0
llc 10.0.1
llc 11.0.0
llc 11.0.1
llc 12.0.0
llc 12.0.1
llc 13.0.0
llc 14.0.0
llc 15.0.0
llc 16.0.0
llc 17.0.1
llc 18.1.0
llc 3.2
llc 3.3
llc 3.9.1
llc 4.0.0
llc 4.0.1
llc 5.0.0
llc 6.0.0
llc 7.0.0
llc 8.0.0
llc 9.0.0
opt (assertions trunk)
opt (trunk)
opt 10.0.0
opt 10.0.1
opt 11.0.0
opt 11.0.1
opt 12.0.0
opt 12.0.1
opt 13.0.0
opt 14.0.0
opt 15.0.0
opt 16.0.0
opt 17.0.1
opt 18.1.0
opt 3.2
opt 3.3
opt 3.9.1
opt 4.0.0
opt 4.0.1
opt 5.0.0
opt 6.0.0
opt 7.0.0
opt 8.0.0
opt 9.0.0
Options
Source code
; ModuleID = 'mydotavx' source_filename = "mydotavx" target datalayout = "e-m:e-p270:32:32-p271:32:32-p272:64:64-i64:64-f80:128-n8:16:32:64-S128-ni:10:11:12:13" target triple = "x86_64-generic-linux" %jl_value_t = type opaque @llvm.compiler.used = appending global [3 x i8*] [i8* bitcast (void (%jl_value_t*)* @jl_gc_queue_root to i8*), i8* bitcast (%jl_value_t* (i8*, i32, i32)* @jl_gc_pool_alloc to i8*), i8* bitcast (%jl_value_t* (i8*, i64)* @jl_gc_big_alloc to i8*)], section "llvm.metadata" define double @julia_mydotavx_8642(%jl_value_t* nonnull align 16 dereferenceable(40) %0, %jl_value_t* nonnull align 16 dereferenceable(40) %1, i64 %2) !dbg !5 { top: %3 = bitcast %jl_value_t* %0 to i64*, !dbg !7 %4 = load i64, i64* %3, align 8, !dbg !7, !tbaa !17, !range !22 %5 = bitcast %jl_value_t* %1 to i64*, !dbg !7 %6 = load i64, i64* %5, align 8, !dbg !7, !tbaa !17, !range !22 %.inv = icmp sgt i64 %2, 0, !dbg !23 call void @llvm.assume(i1 %.inv), !dbg !30 %res.i238 = add nsw i64 %2, -31, !dbg !38 %7 = icmp ugt i64 %2, 31, !dbg !41 br i1 %7, label %L49.lr.ph, label %L104, !dbg !33 L49.lr.ph: ; preds = %top %typptr.i233 = inttoptr i64 %4 to i8*, !dbg !44 %typptr.i210 = inttoptr i64 %6 to i8*, !dbg !44 br label %L49, !dbg !33 L49: ; preds = %L49, %L49.lr.ph %value_phi22243 = phi i64 [ 0, %L49.lr.ph ], [ %res.i183, %L49 ] %value_phi15242 = phi <8 x double> [ zeroinitializer, %L49.lr.ph ], [ %res.i191, %L49 ] %value_phi9241 = phi <8 x double> [ zeroinitializer, %L49.lr.ph ], [ %res.i189, %L49 ] %value_phi5240 = phi <8 x double> [ zeroinitializer, %L49.lr.ph ], [ %res.i185, %L49 ] %value_phi239 = phi <8 x double> [ zeroinitializer, %L49.lr.ph ], [ %res.i187, %L49 ] %res.i237 = shl i64 %value_phi22243, 3, !dbg !52 %offsetptr.i234 = getelementptr inbounds i8, i8* %typptr.i233, i64 %res.i237, !dbg !58 %ptr.i235 = bitcast i8* %offsetptr.i234 to <8 x double>*, !dbg !58 %res.i236 = load <8 x double>, <8 x double>* %ptr.i235, align 8, !dbg !58, !tbaa !59, !alias.scope !61 %res.i231 = or i64 %res.i237, 64, !dbg !52 %offsetptr.i228 = getelementptr inbounds i8, i8* %typptr.i233, i64 %res.i231, !dbg !58 %ptr.i229 = bitcast i8* %offsetptr.i228 to <8 x double>*, !dbg !58 %res.i230 = load <8 x double>, <8 x double>* %ptr.i229, align 8, !dbg !58, !tbaa !59, !alias.scope !61 %res.i225 = or i64 %res.i237, 128, !dbg !52 %offsetptr.i222 = getelementptr inbounds i8, i8* %typptr.i233, i64 %res.i225, !dbg !58 %ptr.i223 = bitcast i8* %offsetptr.i222 to <8 x double>*, !dbg !58 %res.i224 = load <8 x double>, <8 x double>* %ptr.i223, align 8, !dbg !58, !tbaa !59, !alias.scope !61 %res.i219 = or i64 %res.i237, 192, !dbg !52 %offsetptr.i216 = getelementptr inbounds i8, i8* %typptr.i233, i64 %res.i219, !dbg !58 %ptr.i217 = bitcast i8* %offsetptr.i216 to <8 x double>*, !dbg !58 %res.i218 = load <8 x double>, <8 x double>* %ptr.i217, align 8, !dbg !58, !tbaa !59, !alias.scope !61 %offsetptr.i211 = getelementptr inbounds i8, i8* %typptr.i210, i64 %res.i237, !dbg !58 %ptr.i212 = bitcast i8* %offsetptr.i211 to <8 x double>*, !dbg !58 %res.i213 = load <8 x double>, <8 x double>* %ptr.i212, align 8, !dbg !58, !tbaa !59, !alias.scope !61 %offsetptr.i205 = getelementptr inbounds i8, i8* %typptr.i210, i64 %res.i231, !dbg !58 %ptr.i206 = bitcast i8* %offsetptr.i205 to <8 x double>*, !dbg !58 %res.i207 = load <8 x double>, <8 x double>* %ptr.i206, align 8, !dbg !58, !tbaa !59, !alias.scope !61 %offsetptr.i199 = getelementptr inbounds i8, i8* %typptr.i210, i64 %res.i225, !dbg !58 %ptr.i200 = bitcast i8* %offsetptr.i199 to <8 x double>*, !dbg !58 %res.i201 = load <8 x double>, <8 x double>* %ptr.i200, align 8, !dbg !58, !tbaa !59, !alias.scope !61 %offsetptr.i193 = getelementptr inbounds i8, i8* %typptr.i210, i64 %res.i219, !dbg !58 %ptr.i194 = bitcast i8* %offsetptr.i193 to <8 x double>*, !dbg !58 %res.i195 = load <8 x double>, <8 x double>* %ptr.i194, align 8, !dbg !58, !tbaa !59, !alias.scope !61 %prod.i190 = fmul nnan ninf nsz arcp contract <8 x double> %res.i236, %res.i213, !dbg !64 %res.i191 = fadd fast <8 x double> %prod.i190, %value_phi15242, !dbg !64 %prod.i188 = fmul nnan ninf nsz arcp contract <8 x double> %res.i230, %res.i207, !dbg !64 %res.i189 = fadd fast <8 x double> %prod.i188, %value_phi9241, !dbg !64 %prod.i186 = fmul nnan ninf nsz arcp contract <8 x double> %res.i224, %res.i201, !dbg !64 %res.i187 = fadd fast <8 x double> %prod.i186, %value_phi239, !dbg !64 %prod.i184 = fmul nnan ninf nsz arcp contract <8 x double> %res.i218, %res.i195, !dbg !64 %res.i185 = fadd fast <8 x double> %prod.i184, %value_phi5240, !dbg !64 %res.i183 = add nuw nsw i64 %value_phi22243, 32, !dbg !72 %8 = icmp slt i64 %res.i183, %res.i238, !dbg !41 br i1 %8, label %L49, label %L22.L104_crit_edge, !dbg !33 L22.L104_crit_edge: ; preds = %L49 %res.i191.lcssa = phi <8 x double> [ %res.i191, %L49 ], !dbg !64 %res.i189.lcssa = phi <8 x double> [ %res.i189, %L49 ], !dbg !64 %res.i187.lcssa = phi <8 x double> [ %res.i187, %L49 ], !dbg !64 %res.i185.lcssa = phi <8 x double> [ %res.i185, %L49 ], !dbg !64 %9 = and i64 %2, 9223372036854775776, !dbg !33 br label %L104, !dbg !33 L104: ; preds = %L22.L104_crit_edge, %top %value_phi.lcssa = phi <8 x double> [ %res.i187.lcssa, %L22.L104_crit_edge ], [ zeroinitializer, %top ] %value_phi5.lcssa = phi <8 x double> [ %res.i185.lcssa, %L22.L104_crit_edge ], [ zeroinitializer, %top ] %value_phi9.lcssa = phi <8 x double> [ %res.i189.lcssa, %L22.L104_crit_edge ], [ zeroinitializer, %top ] %value_phi15.lcssa = phi <8 x double> [ %res.i191.lcssa, %L22.L104_crit_edge ], [ zeroinitializer, %top ] %value_phi22.lcssa = phi i64 [ %9, %L22.L104_crit_edge ], [ 0, %top ] %10 = icmp ult i64 %value_phi22.lcssa, %2, !dbg !41 br i1 %10, label %L106, label %L271, !dbg !33 L106: ; preds = %L104 %11 = trunc i64 %2 to i8, !dbg !76 %12 = add i8 %11, 7, !dbg !83 %13 = and i8 %12, 7, !dbg !85 %14 = xor i8 %13, 7, !dbg !89 %15 = lshr i8 -1, %14, !dbg !91 %res.i180 = add nsw i64 %2, -9, !dbg !38 %16 = icmp slt i64 %res.i180, %value_phi22.lcssa, !dbg !93 br i1 %16, label %L120, label %L135, !dbg !33 L120: ; preds = %L106 %res.i179 = shl nsw i64 %value_phi22.lcssa, 3, !dbg !97 %typptr.i174 = inttoptr i64 %4 to i8*, !dbg !101 %offsetptr.i175 = getelementptr inbounds i8, i8* %typptr.i174, i64 %res.i179, !dbg !101 %ptr.i176 = bitcast i8* %offsetptr.i175 to <8 x double>*, !dbg !101 %mask.i177 = bitcast i8 %15 to <8 x i1>, !dbg !101 %res.i178 = call <8 x double> @llvm.masked.load.v8f64.p0v8f64(<8 x double>* nonnull %ptr.i176, i32 8, <8 x i1> %mask.i177, <8 x double> zeroinitializer), !dbg !101 %typptr.i168 = inttoptr i64 %6 to i8*, !dbg !101 %offsetptr.i169 = getelementptr inbounds i8, i8* %typptr.i168, i64 %res.i179, !dbg !101 %ptr.i170 = bitcast i8* %offsetptr.i169 to <8 x double>*, !dbg !101 %res.i172 = call <8 x double> @llvm.masked.load.v8f64.p0v8f64(<8 x double>* nonnull %ptr.i170, i32 8, <8 x i1> %mask.i177, <8 x double> zeroinitializer), !dbg !101 %prod.i166 = fmul nnan ninf nsz arcp contract <8 x double> %res.i178, %res.i172, !dbg !104 %res.i167 = fadd fast <8 x double> %prod.i166, %value_phi15.lcssa, !dbg !104 %res.i165 = select fast <8 x i1> %mask.i177, <8 x double> %res.i167, <8 x double> %value_phi15.lcssa, !dbg !110 br label %L271, !dbg !33 L135: ; preds = %L106 %res.i162 = add nsw i64 %2, -17, !dbg !38 %17 = icmp slt i64 %res.i162, %value_phi22.lcssa, !dbg !93 br i1 %17, label %L139, label %L168, !dbg !33 L139: ; preds = %L135 %res.i161 = shl i64 %value_phi22.lcssa, 3, !dbg !52 %typptr.i157 = inttoptr i64 %4 to i8*, !dbg !58 %offsetptr.i158 = getelementptr inbounds i8, i8* %typptr.i157, i64 %res.i161, !dbg !58 %ptr.i159 = bitcast i8* %offsetptr.i158 to <8 x double>*, !dbg !58 %res.i160 = load <8 x double>, <8 x double>* %ptr.i159, align 8, !dbg !58, !tbaa !59, !alias.scope !61 %res.i155 = or i64 %res.i161, 64, !dbg !97 %offsetptr.i151 = getelementptr inbounds i8, i8* %typptr.i157, i64 %res.i155, !dbg !101 %ptr.i152 = bitcast i8* %offsetptr.i151 to <8 x double>*, !dbg !101 %mask.i153 = bitcast i8 %15 to <8 x i1>, !dbg !101 %res.i154 = call <8 x double> @llvm.masked.load.v8f64.p0v8f64(<8 x double>* nonnull %ptr.i152, i32 8, <8 x i1> %mask.i153, <8 x double> zeroinitializer), !dbg !101 %typptr.i145 = inttoptr i64 %6 to i8*, !dbg !58 %offsetptr.i146 = getelementptr inbounds i8, i8* %typptr.i145, i64 %res.i161, !dbg !58 %ptr.i147 = bitcast i8* %offsetptr.i146 to <8 x double>*, !dbg !58 %res.i148 = load <8 x double>, <8 x double>* %ptr.i147, align 8, !dbg !58, !tbaa !59, !alias.scope !61 %offsetptr.i139 = getelementptr inbounds i8, i8* %typptr.i145, i64 %res.i155, !dbg !101 %ptr.i140 = bitcast i8* %offsetptr.i139 to <8 x double>*, !dbg !101 %res.i142 = call <8 x double> @llvm.masked.load.v8f64.p0v8f64(<8 x double>* nonnull %ptr.i140, i32 8, <8 x i1> %mask.i153, <8 x double> zeroinitializer), !dbg !101 %prod.i136 = fmul nnan ninf nsz arcp contract <8 x double> %res.i160, %res.i148, !dbg !64 %res.i137 = fadd fast <8 x double> %prod.i136, %value_phi15.lcssa, !dbg !64 %prod.i134 = fmul nnan ninf nsz arcp contract <8 x double> %res.i154, %res.i142, !dbg !104 %res.i135 = fadd fast <8 x double> %prod.i134, %value_phi9.lcssa, !dbg !104 %res.i133 = select fast <8 x i1> %mask.i153, <8 x double> %res.i135, <8 x double> %value_phi9.lcssa, !dbg !110 br label %L271, !dbg !33 L168: ; preds = %L135 %res.i130 = add nsw i64 %2, -25, !dbg !38 %18 = icmp slt i64 %res.i130, %value_phi22.lcssa, !dbg !93 %res.i129 = shl i64 %value_phi22.lcssa, 3, !dbg !52 %typptr.i125 = inttoptr i64 %4 to i8*, !dbg !58 %offsetptr.i126 = getelementptr inbounds i8, i8* %typptr.i125, i64 %res.i129, !dbg !58 %ptr.i127 = bitcast i8* %offsetptr.i126 to <8 x double>*, !dbg !58 %res.i128 = load <8 x double>, <8 x double>* %ptr.i127, align 8, !dbg !58, !tbaa !59 %res.i123 = or i64 %res.i129, 64, !dbg !52 %offsetptr.i120 = getelementptr inbounds i8, i8* %typptr.i125, i64 %res.i123, !dbg !58 %ptr.i121 = bitcast i8* %offsetptr.i120 to <8 x double>*, !dbg !58 %res.i122 = load <8 x double>, <8 x double>* %ptr.i121, align 8, !dbg !58, !tbaa !59 %res.i117 = or i64 %res.i129, 128, !dbg !114 %offsetptr.i113 = getelementptr inbounds i8, i8* %typptr.i125, i64 %res.i117, !dbg !114 %ptr.i114 = bitcast i8* %offsetptr.i113 to <8 x double>*, !dbg !114 br i1 %18, label %L172, label %L215, !dbg !33 L172: ; preds = %L168 %mask.i115 = bitcast i8 %15 to <8 x i1>, !dbg !101 %res.i116 = call <8 x double> @llvm.masked.load.v8f64.p0v8f64(<8 x double>* nonnull %ptr.i114, i32 8, <8 x i1> %mask.i115, <8 x double> zeroinitializer), !dbg !101 %typptr.i107 = inttoptr i64 %6 to i8*, !dbg !58 %offsetptr.i108 = getelementptr inbounds i8, i8* %typptr.i107, i64 %res.i129, !dbg !58 %ptr.i109 = bitcast i8* %offsetptr.i108 to <8 x double>*, !dbg !58 %res.i110 = load <8 x double>, <8 x double>* %ptr.i109, align 8, !dbg !58, !tbaa !59, !alias.scope !61 %offsetptr.i102 = getelementptr inbounds i8, i8* %typptr.i107, i64 %res.i123, !dbg !58 %ptr.i103 = bitcast i8* %offsetptr.i102 to <8 x double>*, !dbg !58 %res.i104 = load <8 x double>, <8 x double>* %ptr.i103, align 8, !dbg !58, !tbaa !59, !alias.scope !61 %offsetptr.i95 = getelementptr inbounds i8, i8* %typptr.i107, i64 %res.i117, !dbg !101 %ptr.i96 = bitcast i8* %offsetptr.i95 to <8 x double>*, !dbg !101 %res.i98 = call <8 x double> @llvm.masked.load.v8f64.p0v8f64(<8 x double>* nonnull %ptr.i96, i32 8, <8 x i1> %mask.i115, <8 x double> zeroinitializer), !dbg !101 %prod.i92 = fmul nnan ninf nsz arcp contract <8 x double> %res.i128, %res.i110, !dbg !64 %res.i93 = fadd fast <8 x double> %prod.i92, %value_phi15.lcssa, !dbg !64 %prod.i90 = fmul nnan ninf nsz arcp contract <8 x double> %res.i122, %res.i104, !dbg !64 %res.i91 = fadd fast <8 x double> %prod.i90, %value_phi9.lcssa, !dbg !64 %prod.i88 = fmul nnan ninf nsz arcp contract <8 x double> %res.i116, %res.i98, !dbg !104 %res.i89 = fadd fast <8 x double> %prod.i88, %value_phi.lcssa, !dbg !104 %res.i87 = select fast <8 x i1> %mask.i115, <8 x double> %res.i89, <8 x double> %value_phi.lcssa, !dbg !110 br label %L271, !dbg !33 L215: ; preds = %L168 %res.i71 = load <8 x double>, <8 x double>* %ptr.i114, align 8, !dbg !58, !tbaa !59, !alias.scope !61 %res.i66 = or i64 %res.i129, 192, !dbg !97 %offsetptr.i62 = getelementptr inbounds i8, i8* %typptr.i125, i64 %res.i66, !dbg !101 %ptr.i63 = bitcast i8* %offsetptr.i62 to <8 x double>*, !dbg !101 %mask.i64 = bitcast i8 %15 to <8 x i1>, !dbg !101 %res.i65 = call <8 x double> @llvm.masked.load.v8f64.p0v8f64(<8 x double>* nonnull %ptr.i63, i32 8, <8 x i1> %mask.i64, <8 x double> zeroinitializer), !dbg !101 %typptr.i56 = inttoptr i64 %6 to i8*, !dbg !58 %offsetptr.i57 = getelementptr inbounds i8, i8* %typptr.i56, i64 %res.i129, !dbg !58 %ptr.i58 = bitcast i8* %offsetptr.i57 to <8 x double>*, !dbg !58 %res.i59 = load <8 x double>, <8 x double>* %ptr.i58, align 8, !dbg !58, !tbaa !59, !alias.scope !61 %offsetptr.i51 = getelementptr inbounds i8, i8* %typptr.i56, i64 %res.i123, !dbg !58 %ptr.i52 = bitcast i8* %offsetptr.i51 to <8 x double>*, !dbg !58 %res.i53 = load <8 x double>, <8 x double>* %ptr.i52, align 8, !dbg !58, !tbaa !59, !alias.scope !61 %offsetptr.i45 = getelementptr inbounds i8, i8* %typptr.i56, i64 %res.i117, !dbg !58 %ptr.i46 = bitcast i8* %offsetptr.i45 to <8 x double>*, !dbg !58 %res.i47 = load <8 x double>, <8 x double>* %ptr.i46, align 8, !dbg !58, !tbaa !59, !alias.scope !61 %offsetptr.i = getelementptr inbounds i8, i8* %typptr.i56, i64 %res.i66, !dbg !101 %ptr.i = bitcast i8* %offsetptr.i to <8 x double>*, !dbg !101 %res.i41 = call <8 x double> @llvm.masked.load.v8f64.p0v8f64(<8 x double>* nonnull %ptr.i, i32 8, <8 x i1> %mask.i64, <8 x double> zeroinitializer), !dbg !101 %prod.i39 = fmul nnan ninf nsz arcp contract <8 x double> %res.i128, %res.i59, !dbg !64 %res.i40 = fadd fast <8 x double> %prod.i39, %value_phi15.lcssa, !dbg !64 %prod.i37 = fmul nnan ninf nsz arcp contract <8 x double> %res.i122, %res.i53, !dbg !64 %res.i38 = fadd fast <8 x double> %prod.i37, %value_phi9.lcssa, !dbg !64 %prod.i35 = fmul nnan ninf nsz arcp contract <8 x double> %res.i71, %res.i47, !dbg !64 %res.i36 = fadd fast <8 x double> %prod.i35, %value_phi.lcssa, !dbg !64 %prod.i = fmul nnan ninf nsz arcp contract <8 x double> %res.i65, %res.i41, !dbg !104 %res.i34 = fadd fast <8 x double> %prod.i, %value_phi5.lcssa, !dbg !104 %res.i33 = select fast <8 x i1> %mask.i64, <8 x double> %res.i34, <8 x double> %value_phi5.lcssa, !dbg !110 br label %L271, !dbg !72 L271: ; preds = %L215, %L172, %L139, %L120, %L104 %value_phi23 = phi <8 x double> [ %value_phi.lcssa, %L120 ], [ %value_phi.lcssa, %L139 ], [ %res.i87, %L172 ], [ %res.i36, %L215 ], [ %value_phi.lcssa, %L104 ] %value_phi24 = phi <8 x double> [ %value_phi5.lcssa, %L120 ], [ %value_phi5.lcssa, %L139 ], [ %value_phi5.lcssa, %L172 ], [ %res.i33, %L215 ], [ %value_phi5.lcssa, %L104 ] %value_phi25 = phi <8 x double> [ %value_phi9.lcssa, %L120 ], [ %res.i133, %L139 ], [ %res.i91, %L172 ], [ %res.i38, %L215 ], [ %value_phi9.lcssa, %L104 ] %value_phi26 = phi <8 x double> [ %res.i165, %L120 ], [ %res.i137, %L139 ], [ %res.i93, %L172 ], [ %res.i40, %L215 ], [ %value_phi15.lcssa, %L104 ] %res.i31 = fadd <8 x double> %value_phi25, %value_phi26, !dbg !115 %res.i30 = fadd <8 x double> %value_phi23, %value_phi24, !dbg !115 %res.i29 = fadd <8 x double> %res.i30, %res.i31, !dbg !115 %res.i = call fast double @llvm.experimental.vector.reduce.v2.fadd.f64.v8f64(double 0.000000e+00, <8 x double> %res.i29), !dbg !123 ret double %res.i, !dbg !126 } define nonnull %jl_value_t* @jfptr_mydotavx_8643(%jl_value_t* %0, %jl_value_t** %1, i32 %2) #0 { top: %thread_ptr = call i8* asm "movq %fs:0, $0", "=r"() %ptls_i8 = getelementptr i8, i8* %thread_ptr, i64 -15720 %ptls = bitcast i8* %ptls_i8 to %jl_value_t*** %3 = load %jl_value_t*, %jl_value_t** %1, align 8, !nonnull !4, !dereferenceable !127, !align !128 %4 = getelementptr inbounds %jl_value_t*, %jl_value_t** %1, i64 1 %5 = load %jl_value_t*, %jl_value_t** %4, align 8, !nonnull !4, !dereferenceable !127, !align !128 %6 = getelementptr inbounds %jl_value_t*, %jl_value_t** %1, i64 2 %7 = bitcast %jl_value_t** %6 to i64** %8 = load i64*, i64** %7, align 8, !nonnull !4, !dereferenceable !129, !align !129 %9 = load i64, i64* %8, align 8 %10 = call double @julia_mydotavx_8642(%jl_value_t* %3, %jl_value_t* %5, i64 %9) %11 = bitcast %jl_value_t*** %ptls to i8* %12 = call noalias nonnull %jl_value_t* @jl_gc_pool_alloc(i8* %11, i32 1400, i32 16) #1 %13 = bitcast %jl_value_t* %12 to %jl_value_t** %14 = getelementptr %jl_value_t*, %jl_value_t** %13, i64 -1 store %jl_value_t* inttoptr (i64 139643866079424 to %jl_value_t*), %jl_value_t** %14, !tbaa !130 %15 = bitcast %jl_value_t* %12 to double* store double %10, double* %15, align 8, !tbaa !133 ret %jl_value_t* %12 } ; Function Attrs: allocsize(1) declare noalias nonnull %jl_value_t* @julia.gc_alloc_obj(i8*, i64, %jl_value_t*) #1 ; Function Attrs: nounwind readnone declare %jl_value_t* @julia.pointer_from_objref(%jl_value_t*) #2 declare token @llvm.julia.gc_preserve_begin(...) ; Function Attrs: nounwind willreturn declare void @llvm.assume(i1) #3 ; Function Attrs: argmemonly nounwind readonly willreturn declare <8 x double> @llvm.masked.load.v8f64.p0v8f64(<8 x double>*, i32 immarg, <8 x i1>, <8 x double>) #4 declare void @llvm.julia.gc_preserve_end(token) ; Function Attrs: nounwind readnone willreturn declare double @llvm.experimental.vector.reduce.v2.fadd.f64.v8f64(double, <8 x double>) #5 ; Function Attrs: argmemonly nounwind willreturn declare void @llvm.lifetime.start.p0i8(i64 immarg, i8* nocapture) #6 ; Function Attrs: argmemonly nounwind willreturn declare void @llvm.lifetime.end.p0i8(i64 immarg, i8* nocapture) #6 ; Function Attrs: inaccessiblemem_or_argmemonly declare void @jl_gc_queue_root(%jl_value_t*) #7 ; Function Attrs: allocsize(1) declare noalias nonnull %jl_value_t* @jl_gc_pool_alloc(i8*, i32, i32) #1 ; Function Attrs: allocsize(1) declare noalias nonnull %jl_value_t* @jl_gc_big_alloc(i8*, i64) #1 ; Function Attrs: allocsize(1) declare noalias nonnull %jl_value_t* @julia.gc_alloc_bytes(i8*, i64) #1 attributes #0 = { "thunk" } attributes #1 = { allocsize(1) } attributes #2 = { nounwind readnone } attributes #3 = { nounwind willreturn } attributes #4 = { argmemonly nounwind readonly willreturn } attributes #5 = { nounwind readnone willreturn } attributes #6 = { argmemonly nounwind willreturn } attributes #7 = { inaccessiblemem_or_argmemonly } !llvm.module.flags = !{!0, !1} !llvm.dbg.cu = !{!2} !0 = !{i32 2, !"Dwarf Version", i32 4} !1 = !{i32 1, !"Debug Info Version", i32 3} !2 = distinct !DICompileUnit(language: DW_LANG_Julia, file: !3, producer: "julia", isOptimized: true, runtimeVersion: 0, emissionKind: FullDebug, enums: !4, nameTableKind: GNU) !3 = !DIFile(filename: "REPL[46]", directory: ".") !4 = !{} !5 = distinct !DISubprogram(name: "mydotavx", linkageName: "julia_mydotavx_8642", scope: null, file: !3, line: 1, type: !6, scopeLine: 1, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !4) !6 = !DISubroutineType(types: !4) !7 = !DILocation(line: 65, scope: !8, inlinedAt: !10) !8 = distinct !DISubprogram(name: "unsafe_convert;", linkageName: "unsafe_convert", scope: !9, file: !9, type: !6, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !4) !9 = !DIFile(filename: "pointer.jl", directory: ".") !10 = !DILocation(line: 996, scope: !11, inlinedAt: !13) !11 = distinct !DISubprogram(name: "pointer;", linkageName: "pointer", scope: !12, file: !12, type: !6, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !4) !12 = !DIFile(filename: "abstractarray.jl", directory: ".") !13 = !DILocation(line: 560, scope: !14, inlinedAt: !16) !14 = distinct !DISubprogram(name: "stridedpointer;", linkageName: "stridedpointer", scope: !15, file: !15, type: !6, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !4) !15 = !DIFile(filename: "/home/chriselrod/.julia/dev/VectorizationBase/src/vectorizable.jl", directory: ".") !16 = !DILocation(line: 3, scope: !5) !17 = !{!18, !18, i64 0} !18 = !{!"jtbaa_arrayptr", !19, i64 0} !19 = !{!"jtbaa_array", !20, i64 0} !20 = !{!"jtbaa", !21, i64 0} !21 = !{!"jtbaa"} !22 = !{i64 1, i64 0} !23 = !DILocation(line: 285, scope: !24, inlinedAt: !26) !24 = distinct !DISubprogram(name: "unitrange_last;", linkageName: "unitrange_last", scope: !25, file: !25, type: !6, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !4) !25 = !DIFile(filename: "range.jl", directory: ".") !26 = !DILocation(line: 280, scope: !27, inlinedAt: !28) !27 = distinct !DISubprogram(name: "UnitRange;", linkageName: "UnitRange", scope: !25, file: !25, type: !6, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !4) !28 = !DILocation(line: 5, scope: !29, inlinedAt: !16) !29 = distinct !DISubprogram(name: "Colon;", linkageName: "Colon", scope: !25, file: !25, type: !6, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !4) !30 = !DILocation(line: 287, scope: !31, inlinedAt: !33) !31 = distinct !DISubprogram(name: "assume;", linkageName: "assume", scope: !32, file: !32, type: !6, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !4) !32 = !DIFile(filename: "/home/chriselrod/.julia/dev/SIMDPirates/src/llvm_utils.jl", directory: ".") !33 = !DILocation(line: 469, scope: !34, inlinedAt: !36) !34 = distinct !DISubprogram(name: "macro expansion;", linkageName: "macro expansion", scope: !35, file: !35, type: !6, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !4) !35 = !DIFile(filename: "/home/chriselrod/.julia/dev/LoopVectorization/src/reconstruct_loopset.jl", directory: ".") !36 = !DILocation(line: 469, scope: !37, inlinedAt: !16) !37 = distinct !DISubprogram(name: "_avx_!;", linkageName: "_avx_!", scope: !35, file: !35, type: !6, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !4) !38 = !DILocation(line: 104, scope: !39, inlinedAt: !33) !39 = distinct !DISubprogram(name: "vsub;", linkageName: "vsub", scope: !40, file: !40, type: !6, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !4) !40 = !DIFile(filename: "/home/chriselrod/.julia/dev/VectorizationBase/src/vector_width.jl", directory: ".") !41 = !DILocation(line: 83, scope: !42, inlinedAt: !33) !42 = distinct !DISubprogram(name: "<;", linkageName: "<", scope: !43, file: !43, type: !6, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !4) !43 = !DIFile(filename: "int.jl", directory: ".") !44 = !DILocation(line: 0, scope: !45, inlinedAt: !47) !45 = distinct !DISubprogram(name: "macro expansion;", linkageName: "macro expansion", scope: !46, file: !46, type: !6, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !4) !46 = !DIFile(filename: "/home/chriselrod/.julia/dev/SIMDPirates/src/memory.jl", directory: ".") !47 = !DILocation(line: 132, scope: !48, inlinedAt: !49) !48 = distinct !DISubprogram(name: "vload;", linkageName: "vload", scope: !46, file: !46, type: !6, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !4) !49 = !DILocation(line: 288, scope: !48, inlinedAt: !50) !50 = !DILocation(line: 257, scope: !51, inlinedAt: !33) !51 = distinct !DISubprogram(name: "vload;", linkageName: "vload", scope: !15, file: !15, type: !6, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !4) !52 = !DILocation(line: 105, scope: !53, inlinedAt: !54) !53 = distinct !DISubprogram(name: "vmul;", linkageName: "vmul", scope: !40, file: !40, type: !6, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !4) !54 = !DILocation(line: 177, scope: !55, inlinedAt: !56) !55 = distinct !DISubprogram(name: "vmulnp;", linkageName: "vmulnp", scope: !40, file: !40, type: !6, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !4) !56 = !DILocation(line: 348, scope: !57, inlinedAt: !50) !57 = distinct !DISubprogram(name: "offset;", linkageName: "offset", scope: !15, file: !15, type: !6, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !4) !58 = !DILocation(line: 160, scope: !45, inlinedAt: !47) !59 = !{!60, !60, i64 0, i64 0} !60 = !{!"jtbaa_arraybuf", !21, i64 0} !61 = !{!62} !62 = !{!"noaliasscope", !63} !63 = !{!"noaliasdomain"} !64 = !DILocation(line: 554, scope: !65, inlinedAt: !67) !65 = distinct !DISubprogram(name: "macro expansion;", linkageName: "macro expansion", scope: !66, file: !66, type: !6, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !4) !66 = !DIFile(filename: "/home/chriselrod/.julia/dev/SIMDPirates/src/floating_point_arithmetic.jl", directory: ".") !67 = !DILocation(line: 539, scope: !68, inlinedAt: !69) !68 = distinct !DISubprogram(name: "vfmadd_fast;", linkageName: "vfmadd_fast", scope: !66, file: !66, type: !6, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !4) !69 = !DILocation(line: 106, scope: !70, inlinedAt: !33) !70 = distinct !DISubprogram(name: "vfmadd_fast;", linkageName: "vfmadd_fast", scope: !71, file: !71, type: !6, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !4) !71 = !DIFile(filename: "/home/chriselrod/.julia/dev/SIMDPirates/src/SIMDPirates.jl", directory: ".") !72 = !DILocation(line: 103, scope: !73, inlinedAt: !74) !73 = distinct !DISubprogram(name: "vadd;", linkageName: "vadd", scope: !40, file: !40, type: !6, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !4) !74 = !DILocation(line: 155, scope: !75, inlinedAt: !33) !75 = distinct !DISubprogram(name: "valmuladd;", linkageName: "valmuladd", scope: !40, file: !40, type: !6, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !4) !76 = !DILocation(line: 472, scope: !77, inlinedAt: !78) !77 = distinct !DISubprogram(name: "rem;", linkageName: "rem", scope: !43, file: !43, type: !6, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !4) !78 = !DILocation(line: 114, scope: !79, inlinedAt: !81) !79 = distinct !DISubprogram(name: "macro expansion;", linkageName: "macro expansion", scope: !80, file: !80, type: !6, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !4) !80 = !DIFile(filename: "/home/chriselrod/.julia/dev/VectorizationBase/src/masks.jl", directory: ".") !81 = !DILocation(line: 104, scope: !82, inlinedAt: !33) !82 = distinct !DISubprogram(name: "mask;", linkageName: "mask", scope: !80, file: !80, type: !6, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !4) !83 = !DILocation(line: 86, scope: !84, inlinedAt: !78) !84 = distinct !DISubprogram(name: "-;", linkageName: "-", scope: !43, file: !43, type: !6, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !4) !85 = !DILocation(line: 309, scope: !86, inlinedAt: !87) !86 = distinct !DISubprogram(name: "&;", linkageName: "&", scope: !43, file: !43, type: !6, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !4) !87 = !DILocation(line: 154, scope: !88, inlinedAt: !78) !88 = distinct !DISubprogram(name: "valrem;", linkageName: "valrem", scope: !40, file: !40, type: !6, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !4) !89 = !DILocation(line: 86, scope: !84, inlinedAt: !90) !90 = !DILocation(line: 115, scope: !79, inlinedAt: !81) !91 = !DILocation(line: 458, scope: !92, inlinedAt: !90) !92 = distinct !DISubprogram(name: ">>>;", linkageName: ">>>", scope: !43, file: !43, type: !6, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !4) !93 = !DILocation(line: 83, scope: !42, inlinedAt: !94) !94 = !DILocation(line: 303, scope: !95, inlinedAt: !33) !95 = distinct !DISubprogram(name: ">;", linkageName: ">", scope: !96, file: !96, type: !6, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !4) !96 = !DIFile(filename: "operators.jl", directory: ".") !97 = !DILocation(line: 105, scope: !53, inlinedAt: !98) !98 = !DILocation(line: 177, scope: !55, inlinedAt: !99) !99 = !DILocation(line: 348, scope: !57, inlinedAt: !100) !100 = !DILocation(line: 259, scope: !51, inlinedAt: !33) !101 = !DILocation(line: 231, scope: !45, inlinedAt: !102) !102 = !DILocation(line: 202, scope: !48, inlinedAt: !103) !103 = !DILocation(line: 288, scope: !48, inlinedAt: !100) !104 = !DILocation(line: 554, scope: !65, inlinedAt: !105) !105 = !DILocation(line: 539, scope: !68, inlinedAt: !106) !106 = !DILocation(line: 106, scope: !70, inlinedAt: !107) !107 = !DILocation(line: 168, scope: !108, inlinedAt: !33) !108 = distinct !DISubprogram(name: "vifelse;", linkageName: "vifelse", scope: !109, file: !109, type: !6, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !4) !109 = !DIFile(filename: "/home/chriselrod/.julia/dev/SIMDPirates/src/conditionals.jl", directory: ".") !110 = !DILocation(line: 151, scope: !111, inlinedAt: !112) !111 = distinct !DISubprogram(name: "macro expansion;", linkageName: "macro expansion", scope: !109, file: !109, type: !6, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !4) !112 = !DILocation(line: 121, scope: !108, inlinedAt: !113) !113 = !DILocation(line: 110, scope: !108, inlinedAt: !107) !114 = !DILocation(line: 0, scope: !51, inlinedAt: !33) !115 = !DILocation(line: 125, scope: !116, inlinedAt: !118) !116 = distinct !DISubprogram(name: "macro expansion;", linkageName: "macro expansion", scope: !117, file: !117, type: !6, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !4) !117 = !DIFile(filename: "/home/chriselrod/.julia/dev/SIMDPirates/src/llvmwrap.jl", directory: ".") !118 = !DILocation(line: 102, scope: !119, inlinedAt: !120) !119 = distinct !DISubprogram(name: "llvmwrap_notfast;", linkageName: "llvmwrap_notfast", scope: !117, file: !117, type: !6, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !4) !120 = !DILocation(line: 102, scope: !119, inlinedAt: !121) !121 = !DILocation(line: 89, scope: !122, inlinedAt: !33) !122 = distinct !DISubprogram(name: "evadd;", linkageName: "evadd", scope: !71, file: !71, type: !6, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !4) !123 = !DILocation(line: 288, scope: !65, inlinedAt: !124) !124 = !DILocation(line: 276, scope: !125, inlinedAt: !16) !125 = distinct !DISubprogram(name: "reduced_add;", linkageName: "reduced_add", scope: !66, file: !66, type: !6, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !4) !126 = !DILocation(line: 6, scope: !5) !127 = !{i64 40} !128 = !{i64 16} !129 = !{i64 8} !130 = !{!131, !131, i64 0} !131 = !{!"jtbaa_tag", !132, i64 0} !132 = !{!"jtbaa_data", !20, i64 0} !133 = !{!134, !134, i64 0} !134 = !{!"jtbaa_immut", !135, i64 0} !135 = !{!"jtbaa_value", !132, i64 0}
Become a Patron
Sponsor on GitHub
Donate via PayPal
Source on GitHub
Mailing list
Installed libraries
Wiki
Report an issue
How it works
Contact the author
CE on Mastodon
About the author
Statistics
Changelog
Version tree