; ModuleID = 'kernel_gemm'
source_filename = "kernel_gemm"
target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128"
target triple = "x86_64-unknown-linux-gnu"

; ---------------------------------------------------------------------------
; @julia_kernel_gemm_72151(%0, %1, %2, %3, %4)
;
; The debug records below name the arguments: %0 = "alpha" (!16),
; %1 = "beta" (!17), %2 = "C" (!18), %3 = "A" (!19), %4 = "B" (!20).
;
; From each of the three pointer arguments the function reads:
;   - the 8-byte slot 0, used as the base `i64*` of the element buffer;
;   - the 8-byte slot 3, used as the column stride when indexing that buffer.
; From %4 it additionally reads slot 4.
; NOTE(review): presumably these are the data pointer and the first/second
; dimension of a Julia array object -- confirm against the runtime headers.
;
; Loop bounds (names taken from the dbg.value records):
;   ni = slot 3 of %3 (%14), nk = slot 3 of %4 (%19), nj = slot 4 of %4 (%22).
;
; Work performed, with 1-based indices and elements addressed as
; buf[(row-1) + (col-1)*stride]:
;
;   for i = 1..ni
;     for j = 1..nj            ; block %if7
;       C[i,j] = C[i,j] * beta
;     for k = 1..nk            ; block %if8
;       for j = 1..nj          ; block %if9
;         C[i,j] = alpha * A[i,k] * B[k,j] + C[i,j]
;
; All element arithmetic is plain (wrapping) i64 add/mul. No bounds checks
; appear in this function.
; ---------------------------------------------------------------------------
; Function Attrs: sspstrong
define void @julia_kernel_gemm_72151(i64, i64, i8**, i8**, i8**) #0 !dbg !5 {
top:
  br label %top.split, !dbg !27

top.split:                                        ; preds = %top
  call void @llvm.dbg.value(metadata i8** null, i64 0, metadata !18, metadata !28), !dbg !27
  call void @llvm.dbg.value(metadata i8** null, i64 0, metadata !19, metadata !28), !dbg !27
  call void @llvm.dbg.value(metadata i8** null, i64 0, metadata !20, metadata !28), !dbg !27
  call void @llvm.dbg.value(metadata i64 %0, i64 0, metadata !16, metadata !28), !dbg !27
  call void @llvm.dbg.value(metadata i64 %1, i64 0, metadata !17, metadata !28), !dbg !27
  call void @llvm.dbg.value(metadata i8** %2, i64 0, metadata !18, metadata !28), !dbg !27
  ; %2 ("C"): %6 = element buffer (slot 0), %9 = stride (slot 3).
  %5 = bitcast i8** %2 to i64**
  %6 = load i64*, i64** %5, align 8, !tbaa !29
  %7 = getelementptr i8*, i8** %2, i64 3
  %8 = bitcast i8** %7 to i64*
  %9 = load i64, i64* %8, align 8, !tbaa !29
  call void @llvm.dbg.value(metadata i8** %3, i64 0, metadata !19, metadata !28), !dbg !27
  ; %3 ("A"): %11 = element buffer (slot 0), %14 = stride (slot 3), also "ni".
  %10 = bitcast i8** %3 to i64**
  %11 = load i64*, i64** %10, align 8, !tbaa !29
  %12 = getelementptr i8*, i8** %3, i64 3
  %13 = bitcast i8** %12 to i64*
  %14 = load i64, i64* %13, align 8, !tbaa !29
  call void @llvm.dbg.value(metadata i8** %4, i64 0, metadata !20, metadata !28), !dbg !27
  ; %4 ("B"): %16 = element buffer (slot 0), %19 = stride (slot 3), also "nk";
  ; %22 = slot 4, "nj".
  %15 = bitcast i8** %4 to i64**
  %16 = load i64*, i64** %15, align 8, !tbaa !29
  %17 = getelementptr i8*, i8** %4, i64 3
  %18 = bitcast i8** %17 to i64*
  %19 = load i64, i64* %18, align 8, !tbaa !29
  %20 = getelementptr i8*, i8** %4, i64 4, !dbg !32
  %21 = bitcast i8** %20 to i64*, !dbg !32
  %22 = load i64, i64* %21, align 8, !dbg !32, !tbaa !29
  call void @llvm.dbg.value(metadata i64 %14, i64 0, metadata !24, metadata !28), !dbg !27
  call void @llvm.dbg.value(metadata i64 %14, i64 0, metadata !24, metadata !28), !dbg !27
  ; %24 = max(ni, 0) is the last value of i; skip everything when ni < 1.
  %23 = icmp sgt i64 %14, 0, !dbg !33
  %24 = select i1 %23, i64 %14, i64 0, !dbg !33
  %25 = icmp slt i64 %14, 1, !dbg !33
  br i1 %25, label %L65, label %if.lr.ph, !dbg !33

if.lr.ph:                                         ; preds = %top.split
  br label %if, !dbg !33

L42.L18.loopexit_crit_edge:                       ; preds = %L42.loopexit
  br label %L18.loopexit, !dbg !34

; Latch of the i loop: leave once the current i equals max(ni, 0).
L18.loopexit:                                     ; preds = %L42.L18.loopexit_crit_edge, %L38
  %26 = icmp eq i64 %"#temp#4.024", %24, !dbg !33
  br i1 %26, label %L18.L65_crit_edge, label %if, !dbg !33

; Header of the i loop. %"#temp#4.024" is i (starts at 1), %27 is i + 1.
if:                                               ; preds = %if.lr.ph, %L18.loopexit
  %"#temp#4.024" = phi i64 [ 1, %if.lr.ph ], [ %27, %L18.loopexit ]
  %27 = add i64 %"#temp#4.024", 1, !dbg !33
  call void @llvm.dbg.value(metadata i64 %22, i64 0, metadata !26, metadata !28), !dbg !27
  call void @llvm.dbg.value(metadata i64 %22, i64 0, metadata !26, metadata !28), !dbg !27
  ; %30 = max(nj, 0) + 1 is the exit value for BOTH j loops: it is compared
  ; against the already-incremented index in %if7 (%40) and in %if9 (%66).
  %28 = icmp sgt i64 %22, 0, !dbg !35
  %29 = select i1 %28, i64 %22, i64 0, !dbg !35
  %30 = add nuw i64 %29, 1, !dbg !35
  %31 = icmp slt i64 %22, 1, !dbg !35
  br i1 %31, label %L38, label %if7.lr.ph, !dbg !35

if7.lr.ph:                                        ; preds = %if
  br label %if7, !dbg !35

L18.L65_crit_edge:                                ; preds = %L18.loopexit
  br label %L65, !dbg !33

; Single function exit.
L65:                                              ; preds = %L18.L65_crit_edge, %top.split
  ret void, !dbg !36

; First j loop (single-block loop): C[i,j] = C[i,j] * beta.
; %"#temp#.021" is j (starts at 1), %32 is j + 1.
if7:                                              ; preds = %if7.lr.ph, %if7
  %"#temp#.021" = phi i64 [ 1, %if7.lr.ph ], [ %32, %if7 ]
  %32 = add i64 %"#temp#.021", 1, !dbg !35
  call void @llvm.dbg.value(metadata i64 %"#temp#4.024", i64 0, metadata !23, metadata !28), !dbg !27
  call void @llvm.dbg.value(metadata i64 %"#temp#.021", i64 0, metadata !21, metadata !28), !dbg !27
  ; %37 = &Cbuf[(i-1) + (j-1)*%9]
  %33 = add i64 %"#temp#4.024", -1, !dbg !37
  %34 = add i64 %"#temp#.021", -1, !dbg !37
  %35 = mul i64 %34, %9, !dbg !37
  %36 = add i64 %33, %35, !dbg !37
  %37 = getelementptr i64, i64* %6, i64 %36, !dbg !37
  %38 = load i64, i64* %37, align 8, !dbg !37, !tbaa !38
  ; Scale by %1 ("beta") and write back to the same slot.
  %39 = mul i64 %38, %1, !dbg !37
  call void @llvm.dbg.value(metadata i64 %"#temp#4.024", i64 0, metadata !23, metadata !28), !dbg !27
  call void @llvm.dbg.value(metadata i64 %"#temp#.021", i64 0, metadata !21, metadata !28), !dbg !27
  store i64 %39, i64* %37, align 8, !dbg !37, !tbaa !38
  %40 = icmp eq i64 %32, %30, !dbg !35
  br i1 %40, label %L27.L38_crit_edge, label %if7, !dbg !35

L27.L38_crit_edge:                                ; preds = %if7
  br label %L38, !dbg !35

; Preheader of the k loop: %42 = max(nk, 0) is the last value of k;
; skip the k loop entirely when nk < 1.
L38:                                              ; preds = %L27.L38_crit_edge, %if
  call void @llvm.dbg.value(metadata i64 %19, i64 0, metadata !25, metadata !28), !dbg !27
  call void @llvm.dbg.value(metadata i64 %19, i64 0, metadata !25, metadata !28), !dbg !27
  %41 = icmp sgt i64 %19, 0, !dbg !34
  %42 = select i1 %41, i64 %19, i64 0, !dbg !34
  %43 = icmp slt i64 %19, 1, !dbg !34
  br i1 %43, label %L18.loopexit, label %if8.lr.ph, !dbg !34

if8.lr.ph:                                        ; preds = %L38
  br label %if8, !dbg !34

L50.L42.loopexit_crit_edge:                       ; preds = %if9
  br label %L42.loopexit, !dbg !34

; Latch of the k loop: leave once the current k equals max(nk, 0).
L42.loopexit:                                     ; preds = %L50.L42.loopexit_crit_edge, %if8
  %44 = icmp eq i64 %"#temp#3.023", %42, !dbg !34
  br i1 %44, label %L42.L18.loopexit_crit_edge, label %if8, !dbg !34

; Header of the k loop. %"#temp#3.023" is k (starts at 1), %45 is k + 1.
if8:                                              ; preds = %if8.lr.ph, %L42.loopexit
  %"#temp#3.023" = phi i64 [ 1, %if8.lr.ph ], [ %45, %L42.loopexit ]
  %45 = add i64 %"#temp#3.023", 1, !dbg !34
  call void @llvm.dbg.value(metadata i64 %22, i64 0, metadata !26, metadata !28), !dbg !27
  call void @llvm.dbg.value(metadata i64 %22, i64 0, metadata !26, metadata !28), !dbg !27
  ; Skip the inner j loop when nj < 1.
  %46 = icmp slt i64 %22, 1, !dbg !34
  br i1 %46, label %L42.loopexit, label %if9.lr.ph, !dbg !34

if9.lr.ph:                                        ; preds = %if8
  br label %if9, !dbg !34

; Second j loop (single-block loop):
;   C[i,j] = alpha * A[i,k] * B[k,j] + C[i,j].
; %"#temp#2.022" is j (starts at 1), %47 is j + 1.
if9:                                              ; preds = %if9.lr.ph, %if9
  %"#temp#2.022" = phi i64 [ 1, %if9.lr.ph ], [ %47, %if9 ]
  %47 = add i64 %"#temp#2.022", 1, !dbg !34
  call void @llvm.dbg.value(metadata i64 %"#temp#4.024", i64 0, metadata !23, metadata !28), !dbg !27
  call void @llvm.dbg.value(metadata i64 %"#temp#2.022", i64 0, metadata !21, metadata !28), !dbg !27
  ; %52 = &Cbuf[(i-1) + (j-1)*%9]; %53 = current C[i,j].
  %48 = add i64 %"#temp#4.024", -1, !dbg !36
  %49 = add i64 %"#temp#2.022", -1, !dbg !36
  %50 = mul i64 %49, %9, !dbg !36
  %51 = add i64 %48, %50, !dbg !36
  %52 = getelementptr i64, i64* %6, i64 %51, !dbg !36
  %53 = load i64, i64* %52, align 8, !dbg !36, !tbaa !38
  call void @llvm.dbg.value(metadata i64 %"#temp#4.024", i64 0, metadata !23, metadata !28), !dbg !27
  call void @llvm.dbg.value(metadata i64 %"#temp#3.023", i64 0, metadata !22, metadata !28), !dbg !27
  ; %57 = &Abuf[(i-1) + (k-1)*%14]; %59 = A[i,k] * %0 ("alpha").
  %54 = add i64 %"#temp#3.023", -1, !dbg !36
  %55 = mul i64 %54, %14, !dbg !36
  %56 = add i64 %48, %55, !dbg !36
  %57 = getelementptr i64, i64* %11, i64 %56, !dbg !36
  %58 = load i64, i64* %57, align 8, !dbg !36, !tbaa !38
  %59 = mul i64 %58, %0, !dbg !36
  call void @llvm.dbg.value(metadata i64 %"#temp#3.023", i64 0, metadata !22, metadata !28), !dbg !27
  call void @llvm.dbg.value(metadata i64 %"#temp#2.022", i64 0, metadata !21, metadata !28), !dbg !27
  ; %62 = &Bbuf[(k-1) + (j-1)*%19]; %63 = B[k,j].
  %60 = mul i64 %49, %19, !dbg !36
  %61 = add i64 %54, %60, !dbg !36
  %62 = getelementptr i64, i64* %16, i64 %61, !dbg !36
  %63 = load i64, i64* %62, align 8, !dbg !36, !tbaa !38
  ; Accumulate into the C slot loaded above.
  %64 = mul i64 %59, %63, !dbg !36
  %65 = add i64 %64, %53, !dbg !36
  call void @llvm.dbg.value(metadata i64 %"#temp#4.024", i64 0, metadata !23, metadata !28), !dbg !27
  call void @llvm.dbg.value(metadata i64 %"#temp#2.022", i64 0, metadata !21, metadata !28), !dbg !27
  store i64 %65, i64* %52, align 8, !dbg !36, !tbaa !38
  %66 = icmp eq i64 %47, %30, !dbg !34
  br i1 %66, label %L50.L42.loopexit_crit_edge, label %if9, !dbg !34
}

; ---------------------------------------------------------------------------
; @jlcall_kernel_gemm_72150(%0, %1, %2)
;
; Wrapper that unpacks five entries from the pointer array %1 and forwards
; them to @julia_kernel_gemm_72151. %0 and %2 are not used.
;   - entries 0 and 1 are each dereferenced as a pointer to an i64 and the
;     loaded integers are passed as the first two arguments;
;   - entries 2, 3 and 4 are passed through as `i8**`.
; The number of entries is not checked against %2 here.
;
; Always returns the constant address 140728619237392.
; NOTE(review): presumably the address of a runtime singleton in the process
; that emitted this IR -- confirm; an absolute address like this is only
; meaningful inside that process.
; ---------------------------------------------------------------------------
define i8** @jlcall_kernel_gemm_72150(i8**, i8***, i32) #1 {
top:
  br label %top.split

top.split:                                        ; preds = %top
  ; Entry 0 -> i64 (first scalar argument).
  %3 = bitcast i8*** %1 to i64**
  %4 = load i64*, i64** %3, align 8
  %5 = load i64, i64* %4, align 8
  ; Entry 1 -> i64 (second scalar argument).
  %6 = getelementptr i8**, i8*** %1, i64 1
  %7 = bitcast i8*** %6 to i64**
  %8 = load i64*, i64** %7, align 8
  %9 = load i64, i64* %8, align 8
  ; Entries 2..4 -> the three object pointers.
  %10 = getelementptr i8**, i8*** %1, i64 2
  %11 = load i8**, i8*** %10, align 8
  %12 = getelementptr i8**, i8*** %1, i64 3
  %13 = load i8**, i8*** %12, align 8
  %14 = getelementptr i8**, i8*** %1, i64 4
  %15 = load i8**, i8*** %14, align 8
  call void @julia_kernel_gemm_72151(i64 %5, i64 %9, i8** %11, i8** %13, i8** %15)
  ret i8** inttoptr (i64 140728619237392 to i8**)
}

; External declarations. Of these, only @llvm.dbg.value is called by the two
; functions defined in this module; the others are declared but unreferenced
; in the code visible here.
declare i8**** @jl_get_ptls_states()

; Function Attrs: nounwind readnone
declare void @llvm.dbg.declare(metadata, metadata, metadata) #2

; Function Attrs: argmemonly nounwind
declare void @llvm.memcpy.p0i8.p0i8.i32(i8* nocapture writeonly, i8* nocapture readonly, i32, i32, i1) #3

; Function Attrs: argmemonly nounwind
declare void @llvm.memcpy.p0i8.p0i8.i64(i8* nocapture writeonly, i8* nocapture readonly, i64, i32, i1) #3

declare void @jl_enter_handler(i8*)

; Function Attrs: returns_twice
declare i32 @__sigsetjmp(i8*, i32) #4

; Function Attrs: nounwind readnone
declare void @llvm.dbg.value(metadata, i64, metadata, metadata) #2

; Attribute groups: #0 is used by @julia_kernel_gemm_72151, #1 by the jlcall
; wrapper, #2-#4 by the declarations above.
attributes #0 = { sspstrong "no-frame-pointer-elim"="true" }
attributes #1 = { "no-frame-pointer-elim"="true" }
attributes #2 = { nounwind readnone }
attributes #3 = { argmemonly nounwind }
attributes #4 = { returns_twice }

!llvm.module.flags = !{!0, !1}
!llvm.dbg.cu = !{!2}

; --- Debug info: compile unit, file, subprogram and its type ---------------
!0 = !{i32 2, !"Dwarf Version", i32 4}
!1 = !{i32 1, !"Debug Info Version", i32 3}
!2 = distinct !DICompileUnit(language: DW_LANG_C89, file: !3, producer: "julia", isOptimized: true, runtimeVersion: 0, emissionKind: FullDebug, enums: !4)
!3 = !DIFile(filename: "REPL[1]", directory: ".")
!4 = !{}
!5 = distinct !DISubprogram(name: "kernel_gemm", linkageName: "julia_kernel_gemm_72151", scope: null, file: !3, type: !6, isLocal: false, isDefinition: true, isOptimized: true, unit: !2, variables: !13)
!6 = !DISubroutineType(types: !7)
!7 = !{!8, !8, !9, !9, !9}
; NOTE(review): "Int64" is described as DW_ATE_unsigned, while the IR compares
; these values with signed predicates (icmp sgt / slt) -- confirm whether the
; encoding is intentional.
!8 = !DIBasicType(name: "Int64", size: 64, encoding: DW_ATE_unsigned)
!9 = !DIDerivedType(tag: DW_TAG_pointer_type, baseType: !10, size: 64, align: 64)
!10 = !DICompositeType(tag: DW_TAG_structure_type, name: "jl_value_t", file: !11, line: 71, align: 64, elements: !12)
!11 = !DIFile(filename: "julia.h", directory: "")
!12 = !{!9}
; --- Debug info: local variables of !5 --------------------------------------
; NOTE(review): !21 ("j") is listed twice below; both j-loop indices
; (%"#temp#.021" and %"#temp#2.022") are described through !21.
; !14 ("#self#", arg: 1) has no dbg.value record and no IR parameter; the
; five IR parameters are described by !16-!20 with arg numbers 2..6.
!13 = !{!14, !16, !17, !18, !19, !20, !21, !21, !22, !23, !24, !25, !26}
!14 = !DILocalVariable(name: "#self#", arg: 1, scope: !5, file: !3, line: 2, type: !15)
!15 = !DICompositeType(tag: DW_TAG_structure_type, name: "#kernel_gemm", align: 8, elements: !4, runtimeLang: DW_LANG_Julia, identifier: "#kernel_gemm_72086")
!16 = !DILocalVariable(name: "alpha", arg: 2, scope: !5, file: !3, line: 2, type: !8)
!17 = !DILocalVariable(name: "beta", arg: 3, scope: !5, file: !3, line: 2, type: !8)
!18 = !DILocalVariable(name: "C", arg: 4, scope: !5, file: !3, line: 2, type: !9)
!19 = !DILocalVariable(name: "A", arg: 5, scope: !5, file: !3, line: 2, type: !9)
!20 = !DILocalVariable(name: "B", arg: 6, scope: !5, file: !3, line: 2, type: !9)
!21 = !DILocalVariable(name: "j", scope: !5, file: !3, line: 2, type: !8)
!22 = !DILocalVariable(name: "k", scope: !5, file: !3, line: 2, type: !8)
!23 = !DILocalVariable(name: "i", scope: !5, file: !3, line: 2, type: !8)
!24 = !DILocalVariable(name: "ni", scope: !5, file: !3, line: 2, type: !8)
!25 = !DILocalVariable(name: "nk", scope: !5, file: !3, line: 2, type: !8)
!26 = !DILocalVariable(name: "nj", scope: !5, file: !3, line: 2, type: !8)
; --- Source locations and TBAA ----------------------------------------------
!27 = !DILocation(line: 2, scope: !5)
!28 = !DIExpression()
; !29: access tag used on the loads from the three object headers
; (buffer pointer and slots 3/4).
!29 = !{!30, !30, i64 0, i64 1}
!30 = !{!"jtbaa_const", !31, i64 0}
!31 = !{!"jtbaa"}
!32 = !DILocation(line: 3, scope: !5)
!33 = !DILocation(line: 4, scope: !5)
!34 = !DILocation(line: 8, scope: !5)
!35 = !DILocation(line: 5, scope: !5)
!36 = !DILocation(line: 9, scope: !5)
!37 = !DILocation(line: 6, scope: !5)
; !38: access tag used on every element load/store through %6, %11 and %16.
!38 = !{!39, !39, i64 0}
!39 = !{!"jtbaa_arraybuf", !40, i64 0}
!40 = !{!"jtbaa_data", !31, i64 0}