; ModuleID = 'kernel_gemm'
source_filename = "kernel_gemm"
target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128"
target triple = "x86_64-unknown-linux-gnu"

; julia_kernel_gemm_68073(i64 %0, i64 %1, i8** %2, i8** %3, i8** %4)
;
; Integer (i64) matrix kernel.  The value names c/a/b below follow the usual
; GEMM convention (c is the only array that is stored to); that mapping is
; inferred from the access pattern, not taken from the Julia source.
;
;   %2 -> c, %3 -> a, %4 -> b.  For each array header, word 0 is loaded as the
;   i64 data pointer and word 3 (".d1") as an i64; for b, word 4 (".d2") is
;   loaded as well.  NOTE(review): words 3/4 are presumably the first/second
;   dimension of Julia's array header -- confirm against the runtime layout.
;
; Computation, with 1-based counters and element [r,q] of an array located at
; data + (r-1) + (q-1)*d1 (in i64 units):
;
;   for i in 1..a.d1
;     for j in 1..b.d2:   c[i,j] = c[i,j] * %1
;     for k in 1..b.d1
;       for j in 1..b.d2: c[i,j] = (a[i,k] * %0) * b[k,j] + c[i,j]
;
; Each loop is guarded by a "count < 1" test so that non-positive counts skip
; the loop entirely.  No index is checked against any array extent here.
define void @julia_kernel_gemm_68073(i64, i64, i8**, i8**, i8**) #0 !dbg !5 {
entry:
  br label %prologue

prologue:                                         ; preds = %entry
  ; c: data pointer (word 0) and word 3, used as the column stride of c.
  %c.slot = bitcast i8** %2 to i64**
  %c.data = load i64*, i64** %c.slot, align 8, !tbaa !7
  %c.d1.raw = getelementptr i8*, i8** %2, i64 3
  %c.d1.addr = bitcast i8** %c.d1.raw to i64*
  %c.d1 = load i64, i64* %c.d1.addr, align 8, !tbaa !7
  ; a: data pointer and word 3, used both as the i trip count and a's stride.
  %a.slot = bitcast i8** %3 to i64**
  %a.data = load i64*, i64** %a.slot, align 8, !tbaa !7
  %a.d1.raw = getelementptr i8*, i8** %3, i64 3
  %a.d1.addr = bitcast i8** %a.d1.raw to i64*
  %a.d1 = load i64, i64* %a.d1.addr, align 8, !tbaa !7
  ; b: data pointer, word 3 (k trip count and b's stride), word 4 (j trip count).
  %b.slot = bitcast i8** %4 to i64**
  %b.data = load i64*, i64** %b.slot, align 8, !tbaa !7
  %b.d1.raw = getelementptr i8*, i8** %4, i64 3
  %b.d1.addr = bitcast i8** %b.d1.raw to i64*
  %b.d1 = load i64, i64* %b.d1.addr, align 8, !tbaa !7
  %b.d2.raw = getelementptr i8*, i8** %4, i64 4, !dbg !10
  %b.d2.addr = bitcast i8** %b.d2.raw to i64*, !dbg !10
  %b.d2 = load i64, i64* %b.d2.addr, align 8, !dbg !10, !tbaa !7
  ; i.last = max(a.d1, 0); skip the whole nest when a.d1 < 1.
  %i.has.pos = icmp sgt i64 %a.d1, 0, !dbg !11
  %i.last = select i1 %i.has.pos, i64 %a.d1, i64 0, !dbg !11
  %i.empty = icmp slt i64 %a.d1, 1, !dbg !11
  br i1 %i.empty, label %done, label %i.preheader, !dbg !11

i.preheader:                                      ; preds = %prologue
  br label %i.header, !dbg !11

i.header:                                         ; preds = %i.preheader, %i.latch
  %i = phi i64 [ 1, %i.preheader ], [ %i.next, %i.latch ]
  %i.next = add i64 %i, 1, !dbg !11
  ; j.end = max(b.d2, 0) + 1 is the exit value for both j loops (they compare
  ; the already-incremented counter against it).
  %j.has.pos = icmp sgt i64 %b.d2, 0, !dbg !13
  %j.last = select i1 %j.has.pos, i64 %b.d2, i64 0, !dbg !13
  %j.end = add nuw i64 %j.last, 1, !dbg !13
  %j.empty = icmp slt i64 %b.d2, 1, !dbg !13
  br i1 %j.empty, label %k.guard, label %scale.preheader, !dbg !13

scale.preheader:                                  ; preds = %i.header
  br label %scale.body, !dbg !13

scale.body:                                       ; preds = %scale.preheader, %scale.body
  ; c[i,j] *= %1
  %js = phi i64 [ 1, %scale.preheader ], [ %js.next, %scale.body ]
  %js.next = add i64 %js, 1, !dbg !13
  %s.row = add i64 %i, -1, !dbg !15
  %s.col = add i64 %js, -1, !dbg !15
  %s.coloff = mul i64 %s.col, %c.d1, !dbg !15
  %s.idx = add i64 %s.row, %s.coloff, !dbg !15
  %s.ptr = getelementptr i64, i64* %c.data, i64 %s.idx, !dbg !15
  %s.old = load i64, i64* %s.ptr, align 8, !dbg !15, !tbaa !16
  %s.new = mul i64 %s.old, %1, !dbg !15
  store i64 %s.new, i64* %s.ptr, align 8, !dbg !15, !tbaa !16
  %s.done = icmp eq i64 %js.next, %j.end, !dbg !13
  br i1 %s.done, label %scale.exit, label %scale.body, !dbg !13

scale.exit:                                       ; preds = %scale.body
  br label %k.guard, !dbg !13

k.guard:                                          ; preds = %scale.exit, %i.header
  ; k.last = max(b.d1, 0); skip the k loop when b.d1 < 1.
  %k.has.pos = icmp sgt i64 %b.d1, 0, !dbg !12
  %k.last = select i1 %k.has.pos, i64 %b.d1, i64 0, !dbg !12
  %k.empty = icmp slt i64 %b.d1, 1, !dbg !12
  br i1 %k.empty, label %i.latch, label %k.preheader, !dbg !12

k.preheader:                                      ; preds = %k.guard
  br label %k.header, !dbg !12

k.header:                                         ; preds = %k.preheader, %k.latch
  %k = phi i64 [ 1, %k.preheader ], [ %k.next, %k.latch ]
  %k.next = add i64 %k, 1, !dbg !12
  %acc.empty = icmp slt i64 %b.d2, 1, !dbg !12
  br i1 %acc.empty, label %k.latch, label %acc.preheader, !dbg !12

acc.preheader:                                    ; preds = %k.header
  br label %acc.body, !dbg !12

acc.body:                                         ; preds = %acc.preheader, %acc.body
  ; c[i,j] = (a[i,k] * %0) * b[k,j] + c[i,j]
  %ja = phi i64 [ 1, %acc.preheader ], [ %ja.next, %acc.body ]
  %ja.next = add i64 %ja, 1, !dbg !12
  %u.row = add i64 %i, -1, !dbg !14
  %u.col = add i64 %ja, -1, !dbg !14
  %u.c.coloff = mul i64 %u.col, %c.d1, !dbg !14
  %u.c.idx = add i64 %u.row, %u.c.coloff, !dbg !14
  %u.c.ptr = getelementptr i64, i64* %c.data, i64 %u.c.idx, !dbg !14
  %u.c.old = load i64, i64* %u.c.ptr, align 8, !dbg !14, !tbaa !16
  %u.mid = add i64 %k, -1, !dbg !14
  %u.a.coloff = mul i64 %u.mid, %a.d1, !dbg !14
  %u.a.idx = add i64 %u.row, %u.a.coloff, !dbg !14
  %u.a.ptr = getelementptr i64, i64* %a.data, i64 %u.a.idx, !dbg !14
  %u.a.val = load i64, i64* %u.a.ptr, align 8, !dbg !14, !tbaa !16
  %u.a.scaled = mul i64 %u.a.val, %0, !dbg !14
  %u.b.coloff = mul i64 %u.col, %b.d1, !dbg !14
  %u.b.idx = add i64 %u.mid, %u.b.coloff, !dbg !14
  %u.b.ptr = getelementptr i64, i64* %b.data, i64 %u.b.idx, !dbg !14
  %u.b.val = load i64, i64* %u.b.ptr, align 8, !dbg !14, !tbaa !16
  %u.prod = mul i64 %u.a.scaled, %u.b.val, !dbg !14
  %u.c.new = add i64 %u.prod, %u.c.old, !dbg !14
  store i64 %u.c.new, i64* %u.c.ptr, align 8, !dbg !14, !tbaa !16
  %acc.done = icmp eq i64 %ja.next, %j.end, !dbg !12
  br i1 %acc.done, label %acc.exit, label %acc.body, !dbg !12

acc.exit:                                         ; preds = %acc.body
  br label %k.latch, !dbg !12

k.latch:                                          ; preds = %acc.exit, %k.header
  ; Compares the current (not incremented) k against k.last.
  %k.done = icmp eq i64 %k, %k.last, !dbg !12
  br i1 %k.done, label %k.exit, label %k.header, !dbg !12

k.exit:                                           ; preds = %k.latch
  br label %i.latch, !dbg !12

i.latch:                                          ; preds = %k.exit, %k.guard
  ; Compares the current (not incremented) i against i.last.
  %i.done = icmp eq i64 %i, %i.last, !dbg !11
  br i1 %i.done, label %i.exit, label %i.header, !dbg !11

i.exit:                                           ; preds = %i.latch
  br label %done, !dbg !11

done:                                             ; preds = %i.exit, %prologue
  ret void, !dbg !14
}

; jlcall_kernel_gemm_68072(i8** %0, i8*** %1, i32 %2)
;
; Wrapper that unpacks five pointer-sized slots from the array at %1 and calls
; @julia_kernel_gemm_68073.  Slots 0 and 1 are each followed as a pointer to an
; i64, which is loaded and passed by value; slots 2..4 are passed through as
; i8**.  Parameters %0 and %2 are not read.
; NOTE(review): the returned constant is a raw address baked in when this dump
; was produced -- presumably a runtime singleton such as `nothing`; confirm.
define i8** @jlcall_kernel_gemm_68072(i8**, i8***, i32) #0 {
entry:
  br label %unpack

unpack:                                           ; preds = %entry
  %s0.slot = bitcast i8*** %1 to i64**
  %s0.box = load i64*, i64** %s0.slot, align 8
  %s0.val = load i64, i64* %s0.box, align 8
  %s1.raw = getelementptr i8**, i8*** %1, i64 1
  %s1.slot = bitcast i8*** %s1.raw to i64**
  %s1.box = load i64*, i64** %s1.slot, align 8
  %s1.val = load i64, i64* %s1.box, align 8
  %s2.slot = getelementptr i8**, i8*** %1, i64 2
  %s2.arr = load i8**, i8*** %s2.slot, align 8
  %s3.slot = getelementptr i8**, i8*** %1, i64 3
  %s3.arr = load i8**, i8*** %s3.slot, align 8
  %s4.slot = getelementptr i8**, i8*** %1, i64 4
  %s4.arr = load i8**, i8*** %s4.slot, align 8
  call void @julia_kernel_gemm_68073(i64 %s0.val, i64 %s1.val, i8** %s2.arr, i8** %s3.arr, i8** %s4.arr)
  ret i8** inttoptr (i64 140728622989328 to i8**)
}

; The declarations below are not referenced by either function defined above.
declare i8**** @jl_get_ptls_states()

; Function Attrs: argmemonly nounwind
declare void @llvm.memcpy.p0i8.p0i8.i32(i8* nocapture writeonly, i8* nocapture readonly, i32, i32, i1) #1

; Function Attrs: argmemonly nounwind
declare void @llvm.memcpy.p0i8.p0i8.i64(i8* nocapture writeonly, i8* nocapture readonly, i64, i32, i1) #1

declare void @jl_enter_handler(i8*)

; Function Attrs: returns_twice
declare i32 @__sigsetjmp(i8*, i32) #2

attributes #0 = { "no-frame-pointer-elim"="true" }
attributes #1 = { argmemonly nounwind }
attributes #2 = { returns_twice }

!llvm.module.flags = !{!0, !1}
!llvm.dbg.cu = !{!2}

!0 = !{i32 2, !"Dwarf Version", i32 4}
!1 = !{i32 1, !"Debug Info Version", i32 3}
!2 = distinct !DICompileUnit(language: DW_LANG_C89, file: !3, producer: "julia", isOptimized: true, runtimeVersion: 0, emissionKind: FullDebug, enums: !4)
!3 = !DIFile(filename: "REPL[1]", directory: ".")
!4 = !{}
!5 = distinct !DISubprogram(name: "kernel_gemm", linkageName: "julia_kernel_gemm_68073", scope: null, file: !3, type: !6, isLocal: false, isDefinition: true, isOptimized: true, unit: !2, variables: !4)
!6 = !DISubroutineType(types: !4)
; TBAA: !7 tags the array-header loads, !16 tags the element loads/stores.
!7 = !{!8, !8, i64 0, i64 1}
!8 = !{!"jtbaa_const", !9, i64 0}
!9 = !{!"jtbaa"}
; Source line numbers (in REPL[1]) attached to instructions via !dbg.
!10 = !DILocation(line: 3, scope: !5)
!11 = !DILocation(line: 4, scope: !5)
!12 = !DILocation(line: 8, scope: !5)
!13 = !DILocation(line: 5, scope: !5)
!14 = !DILocation(line: 9, scope: !5)
!15 = !DILocation(line: 6, scope: !5)
!16 = !{!17, !17, i64 0}
!17 = !{!"jtbaa_arraybuf", !18, i64 0}
!18 = !{!"jtbaa_data", !9, i64 0}